Repository: autoscrape-labs/pydoll
Branch: main
Commit: 9e236b887ab7
Files: 464
Total size: 5.0 MB

Directory structure:
gitextract_ulcsxv0t/

├── .github/
│   ├── FUNDING.yml
│   ├── ISSUE_TEMPLATE/
│   │   ├── bug_report.yml
│   │   ├── config.yml
│   │   ├── documentation.yml
│   │   ├── feature_request.yml
│   │   └── refactoring.yml
│   ├── PULL_REQUEST_TEMPLATE/
│   │   ├── bug_fix.md
│   │   ├── refactoring.md
│   │   └── release.md
│   ├── pull_request_template.md
│   └── workflows/
│       ├── deploy-docs.yml
│       ├── mypy.yml
│       ├── publish.yml
│       ├── release.yml
│       ├── ruff-ci.yml
│       └── tests.yml
├── .gitignore
├── .python-version
├── CHANGELOG.md
├── CONTRIBUTING.md
├── LICENSE
├── README.md
├── README_zh.md
├── SPONSORS.md
├── codecov.yml
├── cz.yaml
├── docs/
│   ├── en/
│   │   ├── api/
│   │   │   ├── browser/
│   │   │   │   ├── chrome.md
│   │   │   │   ├── edge.md
│   │   │   │   ├── managers.md
│   │   │   │   ├── options.md
│   │   │   │   ├── requests.md
│   │   │   │   └── tab.md
│   │   │   ├── commands/
│   │   │   │   ├── browser.md
│   │   │   │   ├── dom.md
│   │   │   │   ├── fetch.md
│   │   │   │   ├── index.md
│   │   │   │   ├── input.md
│   │   │   │   ├── network.md
│   │   │   │   ├── page.md
│   │   │   │   ├── runtime.md
│   │   │   │   ├── storage.md
│   │   │   │   └── target.md
│   │   │   ├── connection/
│   │   │   │   ├── connection.md
│   │   │   │   └── managers.md
│   │   │   ├── core/
│   │   │   │   ├── constants.md
│   │   │   │   ├── exceptions.md
│   │   │   │   └── utils.md
│   │   │   ├── elements/
│   │   │   │   ├── mixins.md
│   │   │   │   ├── shadow_root.md
│   │   │   │   └── web_element.md
│   │   │   ├── index.md
│   │   │   └── protocol/
│   │   │       ├── base.md
│   │   │       ├── browser.md
│   │   │       ├── dom.md
│   │   │       ├── fetch.md
│   │   │       ├── input.md
│   │   │       ├── network.md
│   │   │       ├── page.md
│   │   │       ├── runtime.md
│   │   │       ├── storage.md
│   │   │       └── target.md
│   │   ├── deep-dive/
│   │   │   ├── architecture/
│   │   │   │   ├── browser-domain.md
│   │   │   │   ├── browser-requests-architecture.md
│   │   │   │   ├── event-architecture.md
│   │   │   │   ├── find-elements-mixin.md
│   │   │   │   ├── index.md
│   │   │   │   ├── shadow-dom.md
│   │   │   │   ├── tab-domain.md
│   │   │   │   └── webelement-domain.md
│   │   │   ├── fingerprinting/
│   │   │   │   ├── behavioral-fingerprinting.md
│   │   │   │   ├── browser-fingerprinting.md
│   │   │   │   ├── evasion-techniques.md
│   │   │   │   ├── index.md
│   │   │   │   └── network-fingerprinting.md
│   │   │   ├── fundamentals/
│   │   │   │   ├── cdp.md
│   │   │   │   ├── connection-layer.md
│   │   │   │   ├── iframes-and-contexts.md
│   │   │   │   ├── index.md
│   │   │   │   └── typing-system.md
│   │   │   ├── guides/
│   │   │   │   ├── index.md
│   │   │   │   └── selectors-guide.md
│   │   │   ├── index.md
│   │   │   └── network/
│   │   │       ├── build-proxy.md
│   │   │       ├── http-proxies.md
│   │   │       ├── index.md
│   │   │       ├── network-fundamentals.md
│   │   │       ├── proxy-detection.md
│   │   │       ├── proxy-legal.md
│   │   │       └── socks-proxies.md
│   │   ├── features/
│   │   │   ├── advanced/
│   │   │   │   ├── behavioral-captcha-bypass.md
│   │   │   │   ├── decorators.md
│   │   │   │   ├── event-system.md
│   │   │   │   └── remote-connections.md
│   │   │   ├── automation/
│   │   │   │   ├── file-operations.md
│   │   │   │   ├── human-interactions.md
│   │   │   │   ├── iframes.md
│   │   │   │   ├── keyboard-control.md
│   │   │   │   ├── mouse-control.md
│   │   │   │   └── screenshots-and-pdfs.md
│   │   │   ├── browser-management/
│   │   │   │   ├── contexts.md
│   │   │   │   ├── cookies-sessions.md
│   │   │   │   └── tabs.md
│   │   │   ├── configuration/
│   │   │   │   ├── browser-options.md
│   │   │   │   ├── browser-preferences.md
│   │   │   │   └── proxy.md
│   │   │   ├── core-concepts.md
│   │   │   ├── element-finding.md
│   │   │   ├── index.md
│   │   │   └── network/
│   │   │       ├── http-requests.md
│   │   │       ├── interception.md
│   │   │       ├── monitoring.md
│   │   │       └── network-recording.md
│   │   └── index.md
│   ├── pt/
│   │   ├── api/
│   │   │   ├── browser/
│   │   │   │   ├── chrome.md
│   │   │   │   ├── edge.md
│   │   │   │   ├── managers.md
│   │   │   │   ├── options.md
│   │   │   │   ├── requests.md
│   │   │   │   └── tab.md
│   │   │   ├── commands/
│   │   │   │   ├── browser.md
│   │   │   │   ├── dom.md
│   │   │   │   ├── fetch.md
│   │   │   │   ├── index.md
│   │   │   │   ├── input.md
│   │   │   │   ├── network.md
│   │   │   │   ├── page.md
│   │   │   │   ├── runtime.md
│   │   │   │   ├── storage.md
│   │   │   │   └── target.md
│   │   │   ├── connection/
│   │   │   │   ├── connection.md
│   │   │   │   └── managers.md
│   │   │   ├── core/
│   │   │   │   ├── constants.md
│   │   │   │   ├── exceptions.md
│   │   │   │   └── utils.md
│   │   │   ├── elements/
│   │   │   │   ├── mixins.md
│   │   │   │   ├── shadow_root.md
│   │   │   │   └── web_element.md
│   │   │   ├── index.md
│   │   │   └── protocol/
│   │   │       ├── base.md
│   │   │       ├── browser.md
│   │   │       ├── dom.md
│   │   │       ├── fetch.md
│   │   │       ├── input.md
│   │   │       ├── network.md
│   │   │       ├── page.md
│   │   │       ├── runtime.md
│   │   │       ├── storage.md
│   │   │       └── target.md
│   │   ├── deep-dive/
│   │   │   ├── architecture/
│   │   │   │   ├── browser-domain.md
│   │   │   │   ├── browser-requests-architecture.md
│   │   │   │   ├── event-architecture.md
│   │   │   │   ├── find-elements-mixin.md
│   │   │   │   ├── index.md
│   │   │   │   ├── shadow-dom.md
│   │   │   │   ├── tab-domain.md
│   │   │   │   └── webelement-domain.md
│   │   │   ├── fingerprinting/
│   │   │   │   ├── behavioral-fingerprinting.md
│   │   │   │   ├── browser-fingerprinting.md
│   │   │   │   ├── evasion-techniques.md
│   │   │   │   ├── index.md
│   │   │   │   └── network-fingerprinting.md
│   │   │   ├── fundamentals/
│   │   │   │   ├── cdp.md
│   │   │   │   ├── connection-layer.md
│   │   │   │   ├── iframes-and-contexts.md
│   │   │   │   ├── index.md
│   │   │   │   └── typing-system.md
│   │   │   ├── guides/
│   │   │   │   ├── index.md
│   │   │   │   └── selectors-guide.md
│   │   │   ├── index.md
│   │   │   └── network/
│   │   │       ├── build-proxy.md
│   │   │       ├── http-proxies.md
│   │   │       ├── index.md
│   │   │       ├── network-fundamentals.md
│   │   │       ├── proxy-detection.md
│   │   │       ├── proxy-legal.md
│   │   │       └── socks-proxies.md
│   │   ├── features/
│   │   │   ├── advanced/
│   │   │   │   ├── behavioral-captcha-bypass.md
│   │   │   │   ├── decorators.md
│   │   │   │   ├── event-system.md
│   │   │   │   └── remote-connections.md
│   │   │   ├── automation/
│   │   │   │   ├── file-operations.md
│   │   │   │   ├── human-interactions.md
│   │   │   │   ├── iframes.md
│   │   │   │   ├── keyboard-control.md
│   │   │   │   ├── mouse-control.md
│   │   │   │   └── screenshots-and-pdfs.md
│   │   │   ├── browser-management/
│   │   │   │   ├── contexts.md
│   │   │   │   ├── cookies-sessions.md
│   │   │   │   └── tabs.md
│   │   │   ├── configuration/
│   │   │   │   ├── browser-options.md
│   │   │   │   ├── browser-preferences.md
│   │   │   │   └── proxy.md
│   │   │   ├── core-concepts.md
│   │   │   ├── element-finding.md
│   │   │   ├── index.md
│   │   │   └── network/
│   │   │       ├── http-requests.md
│   │   │       ├── interception.md
│   │   │       ├── monitoring.md
│   │   │       └── network-recording.md
│   │   └── index.md
│   ├── resources/
│   │   ├── scripts/
│   │   │   ├── extra.js
│   │   │   └── termynal.js
│   │   └── stylesheets/
│   │       ├── extra.css
│   │       └── termynal.css
│   └── zh/
│       ├── api/
│       │   ├── browser/
│       │   │   ├── chrome.md
│       │   │   ├── edge.md
│       │   │   ├── managers.md
│       │   │   ├── options.md
│       │   │   ├── requests.md
│       │   │   └── tab.md
│       │   ├── commands/
│       │   │   ├── browser.md
│       │   │   ├── dom.md
│       │   │   ├── fetch.md
│       │   │   ├── index.md
│       │   │   ├── input.md
│       │   │   ├── network.md
│       │   │   ├── page.md
│       │   │   ├── runtime.md
│       │   │   ├── storage.md
│       │   │   └── target.md
│       │   ├── connection/
│       │   │   ├── connection.md
│       │   │   └── managers.md
│       │   ├── core/
│       │   │   ├── constants.md
│       │   │   ├── exceptions.md
│       │   │   └── utils.md
│       │   ├── elements/
│       │   │   ├── mixins.md
│       │   │   ├── shadow_root.md
│       │   │   └── web_element.md
│       │   ├── index.md
│       │   └── protocol/
│       │       ├── base.md
│       │       ├── browser.md
│       │       ├── dom.md
│       │       ├── fetch.md
│       │       ├── input.md
│       │       ├── network.md
│       │       ├── page.md
│       │       ├── runtime.md
│       │       ├── storage.md
│       │       └── target.md
│       ├── deep-dive/
│       │   ├── architecture/
│       │   │   ├── browser-domain.md
│       │   │   ├── browser-requests-architecture.md
│       │   │   ├── event-architecture.md
│       │   │   ├── find-elements-mixin.md
│       │   │   ├── index.md
│       │   │   ├── shadow-dom.md
│       │   │   ├── tab-domain.md
│       │   │   └── webelement-domain.md
│       │   ├── fingerprinting/
│       │   │   ├── behavioral-fingerprinting.md
│       │   │   ├── browser-fingerprinting.md
│       │   │   ├── evasion-techniques.md
│       │   │   ├── index.md
│       │   │   └── network-fingerprinting.md
│       │   ├── fundamentals/
│       │   │   ├── cdp.md
│       │   │   ├── connection-layer.md
│       │   │   ├── iframes-and-contexts.md
│       │   │   ├── index.md
│       │   │   └── typing-system.md
│       │   ├── guides/
│       │   │   ├── index.md
│       │   │   └── selectors-guide.md
│       │   ├── index.md
│       │   └── network/
│       │       ├── build-proxy.md
│       │       ├── http-proxies.md
│       │       ├── index.md
│       │       ├── network-fundamentals.md
│       │       ├── proxy-detection.md
│       │       ├── proxy-legal.md
│       │       └── socks-proxies.md
│       ├── features/
│       │   ├── advanced/
│       │   │   ├── behavioral-captcha-bypass.md
│       │   │   ├── decorators.md
│       │   │   ├── event-system.md
│       │   │   └── remote-connections.md
│       │   ├── automation/
│       │   │   ├── file-operations.md
│       │   │   ├── human-interactions.md
│       │   │   ├── iframes.md
│       │   │   ├── keyboard-control.md
│       │   │   ├── mouse-control.md
│       │   │   └── screenshots-and-pdfs.md
│       │   ├── browser-management/
│       │   │   ├── contexts.md
│       │   │   ├── cookies-sessions.md
│       │   │   └── tabs.md
│       │   ├── configuration/
│       │   │   ├── browser-options.md
│       │   │   ├── browser-preferences.md
│       │   │   └── proxy.md
│       │   ├── core-concepts.md
│       │   ├── element-finding.md
│       │   ├── index.md
│       │   └── network/
│       │       ├── http-requests.md
│       │       ├── interception.md
│       │       ├── monitoring.md
│       │       └── network-recording.md
│       └── index.md
├── examples/
│   └── cloudflare_bypass.py
├── mkdocs.yml
├── public/
│   ├── index.html
│   ├── robots.txt
│   ├── script.js
│   ├── scripts/
│   │   ├── extra.js
│   │   └── termynal.js
│   ├── sitemap.xml
│   └── stylesheets/
│       ├── extra.css
│       └── termynal.css
├── pydoll/
│   ├── __init__.py
│   ├── browser/
│   │   ├── __init__.py
│   │   ├── chromium/
│   │   │   ├── __init__.py
│   │   │   ├── base.py
│   │   │   ├── chrome.py
│   │   │   └── edge.py
│   │   ├── interfaces.py
│   │   ├── managers/
│   │   │   ├── __init__.py
│   │   │   ├── browser_options_manager.py
│   │   │   ├── browser_process_manager.py
│   │   │   ├── proxy_manager.py
│   │   │   └── temp_dir_manager.py
│   │   ├── options.py
│   │   ├── requests/
│   │   │   ├── __init__.py
│   │   │   ├── har_recorder.py
│   │   │   ├── request.py
│   │   │   └── response.py
│   │   └── tab.py
│   ├── commands/
│   │   ├── __init__.py
│   │   ├── browser_commands.py
│   │   ├── dom_commands.py
│   │   ├── emulation_commands.py
│   │   ├── fetch_commands.py
│   │   ├── input_commands.py
│   │   ├── network_commands.py
│   │   ├── page_commands.py
│   │   ├── runtime_commands.py
│   │   ├── storage_commands.py
│   │   └── target_commands.py
│   ├── connection/
│   │   ├── __init__.py
│   │   ├── connection_handler.py
│   │   └── managers/
│   │       ├── __init__.py
│   │       ├── commands_manager.py
│   │       └── events_manager.py
│   ├── constants.py
│   ├── decorators.py
│   ├── elements/
│   │   ├── __init__.py
│   │   ├── mixins/
│   │   │   ├── __init__.py
│   │   │   └── find_elements_mixin.py
│   │   ├── shadow_root.py
│   │   ├── utils/
│   │   │   ├── __init__.py
│   │   │   └── selector_parser.py
│   │   └── web_element.py
│   ├── exceptions.py
│   ├── interactions/
│   │   ├── __init__.py
│   │   ├── iframe.py
│   │   ├── keyboard.py
│   │   ├── mouse.py
│   │   ├── scroll.py
│   │   └── utils.py
│   ├── protocol/
│   │   ├── __init__.py
│   │   ├── base.py
│   │   ├── browser/
│   │   │   ├── __init__.py
│   │   │   ├── events.py
│   │   │   ├── methods.py
│   │   │   └── types.py
│   │   ├── debugger/
│   │   │   └── types.py
│   │   ├── dom/
│   │   │   ├── __init__.py
│   │   │   ├── events.py
│   │   │   ├── methods.py
│   │   │   └── types.py
│   │   ├── emulation/
│   │   │   ├── __init__.py
│   │   │   ├── methods.py
│   │   │   └── types.py
│   │   ├── fetch/
│   │   │   ├── __init__.py
│   │   │   ├── events.py
│   │   │   ├── methods.py
│   │   │   └── types.py
│   │   ├── input/
│   │   │   ├── __init__.py
│   │   │   ├── events.py
│   │   │   ├── methods.py
│   │   │   └── types.py
│   │   ├── io/
│   │   │   └── types.py
│   │   ├── network/
│   │   │   ├── __init__.py
│   │   │   ├── events.py
│   │   │   ├── har_types.py
│   │   │   ├── methods.py
│   │   │   └── types.py
│   │   ├── page/
│   │   │   ├── __init__.py
│   │   │   ├── events.py
│   │   │   ├── methods.py
│   │   │   └── types.py
│   │   ├── runtime/
│   │   │   ├── __init__.py
│   │   │   ├── events.py
│   │   │   ├── methods.py
│   │   │   └── types.py
│   │   ├── security/
│   │   │   └── types.py
│   │   ├── storage/
│   │   │   ├── __init__.py
│   │   │   ├── events.py
│   │   │   ├── methods.py
│   │   │   └── types.py
│   │   └── target/
│   │       ├── __init__.py
│   │       ├── events.py
│   │       ├── methods.py
│   │       └── types.py
│   ├── py.typed
│   └── utils/
│       ├── __init__.py
│       ├── bundle.py
│       ├── general.py
│       ├── socks5_proxy_forwarder.py
│       └── user_agent_parser.py
├── pyproject.toml
└── tests/
    ├── conftest.py
    ├── pages/
    │   ├── oopif/
    │   │   ├── oopif_content.html
    │   │   ├── oopif_main.html
    │   │   ├── oopif_nested.html
    │   │   └── oopif_shadow_iframe.html
    │   ├── shadow_dom_test.html
    │   ├── test_children.html
    │   ├── test_click_nested.html
    │   ├── test_click_nested_iframe_content.html
    │   ├── test_core_simple.html
    │   ├── test_frame_content.html
    │   ├── test_frameset.html
    │   ├── test_har_recording.html
    │   ├── test_iframe_content.html
    │   ├── test_iframe_nested.html
    │   ├── test_iframe_nested_level.html
    │   ├── test_iframe_parent_level.html
    │   ├── test_iframe_simple.html
    │   └── test_multiple_iframes.html
    ├── test_browser/
    │   ├── test_browser_base.py
    │   ├── test_browser_chrome.py
    │   ├── test_browser_edge.py
    │   ├── test_browser_options.py
    │   ├── test_browser_tab.py
    │   ├── test_har_recorder.py
    │   ├── test_requests_request.py
    │   ├── test_requests_response.py
    │   └── test_tab_request_integration.py
    ├── test_click_nested_integration.py
    ├── test_commands/
    │   ├── test_browser_commands.py
    │   ├── test_dom_commands.py
    │   ├── test_emulation_commands.py
    │   ├── test_fetch_commands.py
    │   ├── test_input_commands.py
    │   ├── test_network_commands.py
    │   ├── test_page_commands.py
    │   ├── test_runtime_commands.py
    │   ├── test_storage_commands.py
    │   └── test_target_commands.py
    ├── test_connection_handler.py
    ├── test_core_integration.py
    ├── test_decorators.py
    ├── test_events.py
    ├── test_exceptions.py
    ├── test_find_elements_mixin.py
    ├── test_har_recording_integration.py
    ├── test_iframe_integration.py
    ├── test_interactions/
    │   ├── __init__.py
    │   ├── test_iframe.py
    │   ├── test_keyboard.py
    │   ├── test_mouse.py
    │   └── test_scroll.py
    ├── test_managers/
    │   ├── test_browser_managers.py
    │   └── test_connection_managers.py
    ├── test_nested_oopif_integration.py
    ├── test_shadow_root.py
    ├── test_shadow_root_integration.py
    ├── test_socks5_proxy_forwarder.py
    ├── test_user_agent_parser.py
    ├── test_utils.py
    └── test_web_element.py

================================================
FILE CONTENTS
================================================

================================================
FILE: .github/FUNDING.yml
================================================
# These are supported funding model platforms
github: [thalissonvs]


================================================
FILE: .github/ISSUE_TEMPLATE/bug_report.yml
================================================
name: Bug Report
description: Report a bug in pydoll
title: "[Bug]: "
labels: ["bug", "needs-triage"]
body:
  - type: markdown
    attributes:
      value: |
        # pydoll Bug Report
        
        Thank you for taking the time to report a bug. This form will guide you through providing the information needed to address the issue effectively.
  
  - type: checkboxes
    id: checklist
    attributes:
      label: Checklist before reporting
      description: Please make sure you've completed the following steps before submitting a bug report.
      options:
        - label: I have searched for [similar issues](https://github.com/autoscrape-labs/pydoll/issues) and didn't find a duplicate.
          required: true
        - label: I have updated to the latest version of pydoll to verify the issue still exists.
          required: true
  
  - type: input
    id: version
    attributes:
      label: pydoll Version
      description: Which version of pydoll were you using when you encountered this bug?
      placeholder: e.g., 1.3.2
    validations:
      required: true
  
  - type: input
    id: python_version
    attributes:
      label: Python Version
      description: What version of Python are you using?
      placeholder: e.g., 3.10.4
    validations:
      required: true
  
  - type: dropdown
    id: os
    attributes:
      label: Operating System
      description: What operating system are you using?
      options:
        - Windows
        - macOS
        - Linux
        - Other (specify in Additional Context)
    validations:
      required: true
  
  - type: textarea
    id: description
    attributes:
      label: Bug Description
      description: A clear and concise description of what the bug is.
      placeholder: When I try to use X feature, the library fails with error message Y...
    validations:
      required: true
  
  - type: textarea
    id: reproduction_steps
    attributes:
      label: Steps to Reproduce
      description: Step by step instructions to reproduce the bug.
      placeholder: |
        1. Import the library using `import pydoll`
        2. Set up the client with `...`
        3. Call method X with parameters Y
        4. See error
    validations:
      required: true
  
  - type: textarea
    id: code_example
    attributes:
      label: Code Example
      description: |
        A minimal, self-contained code example that demonstrates the issue.
        This will be automatically formatted into code, so no need for backticks.
      render: python
      placeholder: |
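        import asyncio
        
        from pydoll.browser.chromium import Chrome
        
        async def main():
            async with Chrome() as browser:
                tab = await browser.start()
        
                # Code that triggers the bug
                result = await tab.some_method(...)
                print(result)
        
        asyncio.run(main())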
    validations:
      required: true
  
  - type: textarea
    id: expected_behavior
    attributes:
      label: Expected Behavior
      description: A clear and concise description of what you expected to happen.
      placeholder: The method should return X or perform Y...
    validations:
      required: false
  
  - type: textarea
    id: actual_behavior
    attributes:
      label: Actual Behavior
      description: What actually happened instead? Include full error messages and stack traces if applicable.
      placeholder: The method raised an exception...
    validations:
      required: false
  
  - type: textarea
    id: logs
    attributes:
      label: Relevant Log Output
      description: |
        If applicable, include any logs or error messages. 
        This will be automatically formatted, so no need for backticks.
      render: shell
      placeholder: |
        Traceback (most recent call last):
          File "example.py", line 10, in <module>
            ...
          File ".../pydoll/...", line N, in some_method
            ...
        SomeError: Error message
  
  - type: textarea
    id: additional_context
    attributes:
      label: Additional Context
      description: Add any other context about the problem here (environment details, potential causes, solutions you've tried, etc.)
      placeholder: I've tried reinstalling the package and using a different Python version, but the issue persists... 


================================================
FILE: .github/ISSUE_TEMPLATE/config.yml
================================================
blank_issues_enabled: true
contact_links:
  - name: Questions & Discussions
    url: https://github.com/autoscrape-labs/pydoll/discussions
    about: Please ask and answer questions here. 


================================================
FILE: .github/ISSUE_TEMPLATE/documentation.yml
================================================
name: Documentation Issue
description: Report missing, incorrect, or unclear documentation
title: "[Docs]: "
labels: ["documentation", "needs-triage"]
body:
  - type: markdown
    attributes:
      value: |
        # pydoll Documentation Issue
        
        Thank you for helping us improve the documentation. This form will guide you through providing the information needed to address documentation issues effectively.
  
  - type: checkboxes
    id: checklist
    attributes:
      label: Checklist before reporting
      description: Please make sure you've completed the following steps before submitting a documentation issue.
      options:
        - label: I have searched for [similar documentation issues](https://github.com/autoscrape-labs/pydoll/issues) and didn't find a duplicate.
          required: true
        - label: I have checked the latest documentation to verify this issue still exists.
          required: true
  
  - type: dropdown
    id: type
    attributes:
      label: Type of Documentation Issue
      description: What type of documentation issue are you reporting?
      options:
        - Missing documentation (information does not exist)
        - Incorrect documentation (information is wrong)
        - Unclear documentation (information is confusing or ambiguous)
        - Outdated documentation (information is no longer valid)
        - Other (please specify in description)
    validations:
      required: true
  
  - type: input
    id: location
    attributes:
      label: Documentation Location
      description: Where is the documentation with issues located? Provide URLs, file paths, or section names.
      placeholder: e.g., https://docs.example.com/pydoll/api.html#section, README.md, API Reference for Client class
    validations:
      required: true
  
  - type: textarea
    id: description
    attributes:
      label: Issue Description
      description: Describe the issue with the documentation in detail.
      placeholder: |
        The documentation for the `Client.connect()` method doesn't mention the timeout parameter, 
        which I discovered by looking at the source code.
    validations:
      required: true
  
  - type: textarea
    id: suggested_fix
    attributes:
      label: Suggested Fix
      description: If you have a suggestion for how to fix the documentation, please provide it here.
      placeholder: |
        Add the following to the `Client.connect()` documentation:
        
        ```
        Parameters:
          timeout (float, optional): Connection timeout in seconds. Defaults to 30.
        ```
  
  - type: textarea
    id: additional_info
    attributes:
      label: Additional Information
      description: Any additional context or information that might help address this documentation issue.
      placeholder: |
        I found this issue when trying to implement a connection with a shorter timeout for my specific use case.
  
  - type: dropdown
    id: contribution
    attributes:
      label: Contribution
      description: Would you be willing to contribute a fix for this documentation?
      options:
        - Yes, I'd be willing to submit a PR with the fix
        - No, I don't have the capacity to fix this
    validations:
      required: true 

================================================
FILE: .github/ISSUE_TEMPLATE/feature_request.yml
================================================
name: Feature Request
description: Suggest a new feature or enhancement for pydoll
title: "[Feature Request]: "
labels: ["enhancement", "needs-triage"]
body:
  - type: markdown
    attributes:
      value: |
        # pydoll Feature Request
        
        Thank you for taking the time to suggest a new feature. This form will guide you through providing the information needed to consider your suggestion effectively.
  
  - type: checkboxes
    id: checklist
    attributes:
      label: Checklist before requesting
      description: Please make sure you've completed the following steps before submitting a feature request.
      options:
        - label: I have searched for [similar feature requests](https://github.com/autoscrape-labs/pydoll/issues) and didn't find a duplicate.
          required: true
        - label: I have checked the documentation to confirm this feature doesn't already exist.
          required: true
  
  - type: textarea
    id: problem
    attributes:
      label: Problem Statement
      description: Is your feature request related to a problem? Please describe what you're trying to accomplish.
      placeholder: I'm trying to accomplish X, but I'm unable to because Y...
    validations:
      required: true
  
  - type: textarea
    id: solution
    attributes:
      label: Proposed Solution
      description: Describe the solution you'd like to see implemented. Be as specific as possible.
      placeholder: |
        I would like to see a new method/class that can...
        
        Example usage might look like:
        ```python
        client.new_feature(param1, param2)
        ```
    validations:
      required: true
  
  - type: textarea
    id: alternatives
    attributes:
      label: Alternatives Considered
      description: Describe any alternative solutions or features you've considered.
      placeholder: I've tried accomplishing this using X and Y approaches, but they don't work well because...
  
  - type: textarea
    id: context
    attributes:
      label: Additional Context
      description: Add any other context, code examples, or references that might help explain your feature request.
      placeholder: |
        Other libraries like X and Y have similar features that work like...
        
        This would help users who need to...
  
  - type: dropdown
    id: importance
    attributes:
      label: Importance
      description: How important is this feature to your use case?
      options:
        - Nice to have
        - Important
        - Critical (blocking my usage)
    validations:
      required: true
  
  - type: dropdown
    id: contribution
    attributes:
      label: Contribution
      description: Would you be willing to contribute this feature yourself?
      options:
        - Yes, I'd be willing to implement this feature
        - I could help with parts of the implementation
        - No, I don't have the capacity to implement this 

================================================
FILE: .github/ISSUE_TEMPLATE/refactoring.yml
================================================
name: Refactoring Request
description: Suggest code refactoring to improve pydoll's quality, performance, or maintainability
title: "[Refactor]: "
labels: ["refactor", "needs-triage"]
body:
  - type: markdown
    attributes:
      value: |
        # pydoll Refactoring Request
        
        Thank you for suggesting improvements to our codebase. This form will guide you through providing the information needed to consider your refactoring suggestion effectively.
  
  - type: checkboxes
    id: checklist
    attributes:
      label: Checklist before suggesting refactoring
      description: Please make sure you've completed the following steps before submitting a refactoring request.
      options:
        - label: I have searched for [similar refactoring requests](https://github.com/autoscrape-labs/pydoll/issues) and didn't find a duplicate.
          required: true
        - label: I have reviewed the current implementation to ensure my understanding is accurate.
          required: true
  
  - type: textarea
    id: current_implementation
    attributes:
      label: Current Implementation
      description: Describe the current implementation and its limitations. Include file paths if known.
      placeholder: |
        The current implementation in `pydoll/module/file.py` has the following issues:
        1. It uses an inefficient algorithm for...
        2. The code structure makes it difficult to maintain because...
    validations:
      required: true
  
  - type: textarea
    id: proposed_changes
    attributes:
      label: Proposed Changes
      description: Describe the changes you're suggesting. Be as specific as possible.
      placeholder: |
        I suggest refactoring this code to:
        1. Replace the current algorithm with X, which would improve performance by...
        2. Restructure the class hierarchy to better separate concerns by...
        
        Example code sketch (if applicable):
        ```python
        def improved_method():
            # better implementation
        ```
    validations:
      required: true
  
  - type: textarea
    id: benefits
    attributes:
      label: Benefits
      description: Explain the benefits of this refactoring.
      placeholder: |
        This refactoring would:
        - Improve performance by X%
        - Make the code more maintainable by...
        - Reduce code complexity by...
        - Fix potential bugs such as...
    validations:
      required: true
  
  - type: dropdown
    id: impact
    attributes:
      label: API Impact
      description: Would this refactoring change the public API?
      options:
        - No API changes (internal refactoring only)
        - Minor API changes (backward compatible)
        - Breaking API changes
    validations:
      required: true
  
  - type: textarea
    id: testing_approach
    attributes:
      label: Testing Approach
      description: How can we verify that the refactoring doesn't break existing functionality?
      placeholder: |
        The refactoring can be tested by:
        - Running the existing test suite
        - Adding new tests for edge cases such as...
        - Benchmarking performance before and after
  
  - type: dropdown
    id: contribution
    attributes:
      label: Contribution
      description: Would you be willing to contribute this refactoring yourself?
      options:
        - Yes, I'd be willing to implement this refactoring
        - I could help with parts of the implementation
        - No, I don't have the capacity to implement this 

================================================
FILE: .github/PULL_REQUEST_TEMPLATE/bug_fix.md
================================================
# Bug Fix Pull Request

## Related Issue(s)
<!-- Link the bug report that's being fixed by this PR. Use the format: "Fixes #123" or "Resolves #123" -->

## Bug Description
<!-- Briefly describe the bug that's being fixed -->

## Root Cause
<!-- Explain the root cause of the bug -->

## Solution
<!-- Describe your solution to fix the bug -->

## Verification Steps
<!-- List the steps to verify this fix works -->
1. 
2. 
3. 

## Code Example
<!-- If applicable, provide a code example demonstrating the fix -->
```python
# Example code showing the fix
```

## Before / After
<!-- If applicable, provide before/after screenshots or code snippets -->

## Testing
<!-- Describe the tests you added or modified to verify your fix -->

## Testing Checklist
- [ ] Added regression test that would have caught this bug
- [ ] Modified existing tests to account for this fix
- [ ] All tests pass
- [ ] Edge cases have been tested

## Impact
<!-- Describe any potential impact this fix might have on existing functionality -->
- [ ] Low (isolated fix with no side effects)
- [ ] Medium (might affect closely related functionality)
- [ ] High (affects multiple areas or changes core behavior)

## Backwards Compatibility
- [ ] This change is fully backward compatible
- [ ] This change introduces backward incompatibilities (explain below)

## Checklist before requesting a review
- [ ] My code follows the style guidelines of this project
- [ ] I have performed a self-review of my code
- [ ] I have added test cases that prove my fix is effective
- [ ] I have run `poetry run task lint` and fixed any issues
- [ ] I have run `poetry run task test` and all tests pass
- [ ] My commits follow the [conventional commits](https://www.conventionalcommits.org/) style with message explaining the fix 

================================================
FILE: .github/PULL_REQUEST_TEMPLATE/refactoring.md
================================================
# Refactoring Pull Request

## Refactoring Scope
<!-- Describe which part of the codebase is being refactored -->

## Related Issue(s)
<!-- Link the refactoring issue that's being addressed by this PR. Use the format: "Fixes #123" or "Resolves #123" -->

## Description
<!-- Provide a clear and detailed description of the refactoring changes -->

## Motivation
<!-- Explain why this refactoring is necessary -->

## Before / After
<!-- If applicable, provide code examples showing the before and after of the refactoring -->

### Before
```python
# Original code
```

### After
```python
# Refactored code
```

## Performance Impact
<!-- If applicable, describe any performance improvements or potential impacts -->
- [ ] Performance improved
- [ ] Performance potentially decreased
- [ ] No significant performance change
- [ ] Performance impact unknown

## Technical Debt
<!-- Describe how this refactoring addresses technical debt -->

## API Changes
- [ ] No changes to public API
- [ ] Public API changed, but backward compatible
- [ ] Breaking changes to public API

## Testing Strategy
<!-- Describe how you've tested the refactoring -->

## Testing Checklist
- [ ] Existing tests updated
- [ ] New tests added for previously uncovered cases
- [ ] All tests pass
- [ ] Code coverage maintained or improved

## Risks and Mitigations
<!-- Describe any potential risks introduced by this refactoring and how they were mitigated -->

## Checklist before requesting a review
- [ ] My code follows the style guidelines of this project
- [ ] I have performed a thorough self-review of the refactored code
- [ ] I have commented my code, particularly in complex areas
- [ ] I have updated documentation if needed
- [ ] I have run `poetry run task lint` and fixed any issues
- [ ] I have run `poetry run task test` and all tests pass
- [ ] My commits follow the [conventional commits](https://www.conventionalcommits.org/) style 

================================================
FILE: .github/PULL_REQUEST_TEMPLATE/release.md
================================================
# Release Pull Request

## Version
<!-- Specify the new version number (e.g., 1.4.0) -->

## Release Date
<!-- Proposed date for this release -->

## Release Type
- [ ] Major (breaking changes)
- [ ] Minor (new features, non-breaking)
- [ ] Patch (bug fixes, non-breaking)

## Change Summary
<!-- Provide a high-level summary of the changes in this release -->

## Key Changes
<!-- List the major changes/features included in this release -->

## Breaking Changes
<!-- If applicable, list all breaking changes and migration instructions -->

## Dependencies
<!-- List any new or updated dependencies -->

## Deprecations 
- While `get_element_text()` is still supported, it is **recommended** to use the new async property `element.text`.


## Documentation
<!-- Link to updated documentation -->

## Release Checklist
- [ ] Version number updated in pyproject.toml
- [ ] Version number updated in cz.yaml
- [ ] CHANGELOG.md updated with all changes
- [ ] All tests passing
- [ ] Documentation updated
- [ ] API reference updated
- [ ] Breaking changes documented
- [ ] Migration guides prepared (if applicable)

## Additional Release Notes
<!-- Any additional information that should be included in release notes --> 

================================================
FILE: .github/pull_request_template.md
================================================
<!-- 
Please choose the appropriate PR template for your change:

For bug fixes: .github/PULL_REQUEST_TEMPLATE/bug_fix.md
For refactoring: .github/PULL_REQUEST_TEMPLATE/refactoring.md
For releases: .github/PULL_REQUEST_TEMPLATE/release.md

Or use this general template for other types of changes.
-->

# Pull Request

## Description
<!-- Provide a clear and concise description of what this PR accomplishes -->

## Related Issue(s)
<!-- Link the issues that are being addressed by this PR. Use the format: "Fixes #123" or "Resolves #123" -->

## Type of Change
<!-- Check the appropriate options that apply to this PR -->
- [ ] Bug fix (non-breaking change which fixes an issue)
- [ ] New feature (non-breaking change which adds functionality)
- [ ] Breaking change (fix or feature that would cause existing functionality to not work as expected)
- [ ] Documentation update
- [ ] Refactoring (no functional changes, no API changes)
- [ ] Performance improvement
- [ ] Tests (adding missing tests or correcting existing tests)
- [ ] Build or CI/CD related changes

## How Has This Been Tested?
<!-- Describe the tests you ran to verify your changes. Provide instructions so reviewers can reproduce. -->

```python
# Include code examples if relevant
```

## Testing Checklist
<!-- Check the testing aspects that apply to your change -->
- [ ] Unit tests added/updated
- [ ] Integration tests added/updated
- [ ] All existing tests pass

## Screenshots
<!-- If applicable, add screenshots to help explain your changes -->

## Implementation Details
<!-- Provide any important details or context about the implementation -->

## API Changes
<!-- If applicable, describe any API changes -->

## Additional Info
<!-- Any additional information that might be useful for reviewers -->

## Checklist before requesting a review
- [ ] My code follows the style guidelines of this project
- [ ] I have performed a self-review of my code
- [ ] I have commented my code, particularly in hard-to-understand areas
- [ ] I have made corresponding changes to the documentation
- [ ] My changes generate no new warnings
- [ ] I have added tests that prove my fix is effective or that my feature works
- [ ] New and existing unit tests pass locally with my changes
- [ ] I have run `poetry run task lint` and fixed any issues
- [ ] I have run `poetry run task test` and all tests pass
- [ ] My commits follow the [conventional commits](https://www.conventionalcommits.org/) style 

================================================
FILE: .github/workflows/deploy-docs.yml
================================================
name: Deploy site + docs

on:
  push:
    branches: [main]

jobs:
  deploy:
    runs-on: ubuntu-latest
    steps:
      - name: Code Checkout
        uses: actions/checkout@v4

      - name: Setup Python
        uses: actions/setup-python@v5
        with:
          python-version: '3.x'

      - name: Install Dependencies
        run: |
          python -m pip install --upgrade pip
          pip install mkdocs mkdocs-material pymdown-extensions mkdocstrings[python] mkdocs-static-i18n

      # Build MkDocs into a temporary folder
      - name: Build MkDocs into temp folder
        run: mkdocs build --site-dir temp_docs

      # Create the final site structure
      - name: Prepare final site
        run: |
          mkdir -p site/docs
          mkdir -p site/images
          cp -r temp_docs/* site/docs/
          cp -r public/* site/

      - name: Deploy to GitHub Pages
        uses: peaceiris/actions-gh-pages@v3
        with:
          github_token: ${{ secrets.GITHUB_TOKEN }}
          publish_dir: ./site
          cname: pydoll.tech


================================================
FILE: .github/workflows/mypy.yml
================================================
name: MyPy CI

on:
  push:
    branches:
      - '*'         # matches every branch that doesn't contain a '/'
      - '*/*'       # matches every branch containing a single '/'
      - '**'        # matches every branch
  pull_request:

jobs:
  build:

    runs-on: ubuntu-latest

    strategy:
      max-parallel: 4
      matrix:
        python-version: ["3.11"]

    steps:
      - uses: actions/checkout@v2

      - name: Set up Python ${{ matrix.python-version }}
        uses: actions/setup-python@v2
        with:
          python-version: ${{ matrix.python-version }}

      - name: Install Dependencies
        run: |
          python -m pip install --upgrade pip
          python -m pip install mypy
          python -m pip install -e .
          python -m mypy --install-types --non-interactive pydoll 

      - name: mypy
        run: python -m mypy .


================================================
FILE: .github/workflows/publish.yml
================================================
name: Publish to PyPI (Poetry)

on: workflow_dispatch

jobs:
  deploy:
    runs-on: ubuntu-latest

    steps:
      - name: Checkout code
        uses: actions/checkout@v3

      - name: Set up Python
        uses: actions/setup-python@v4
        with:
          python-version: "3.10"

      - name: Install Poetry
        run: |
          python -m pip install --upgrade pip
          pip install poetry

      - name: Configure Poetry
        run: poetry config pypi-token.pypi ${{ secrets.PYPI_API_TOKEN }}

      - name: Install dependencies
        run: poetry install

      - name: Build package
        run: poetry build

      - name: Publish to PyPI
        run: poetry publish


================================================
FILE: .github/workflows/release.yml
================================================
name: Release
on: workflow_dispatch

jobs:
  version-cz:
    runs-on: ubuntu-latest
    name: "Version CZ"
    outputs:
      version: ${{ steps.cz.outputs.version }}

    steps:
      - name: Checkout
        uses: actions/checkout@v4
        with:
          fetch-depth: 0
          token: ${{ secrets.GITHUB_TOKEN }}

      - id: cz
        name: Create bump and changelog
        uses: commitizen-tools/commitizen-action@master
        with:
          github_token: ${{ secrets.GITHUB_TOKEN }}

      - name: Print Version
        run: echo "Bumped to version ${{ steps.cz.outputs.version }}"
  
  version-pyproject:
    runs-on: ubuntu-latest
    name: "Version Pyproject"
    needs: version-cz
    outputs:
      version: ${{ needs.version-cz.outputs.version }}
    steps:
      - name: Checkout
        uses: actions/checkout@v4
        with:
          fetch-depth: 0
          token: ${{ secrets.GITHUB_TOKEN }}

      - name: Install Poetry
        run: |
          curl -sSL https://install.python-poetry.org | python3 -
          export PATH="$HOME/.local/bin:$PATH"

      - name: Update Poetry version in pyproject.toml
        run: |
          git config --global user.name "github-actions[bot]"
          git config --global user.email "github-actions[bot]@users.noreply.github.com"
          poetry version "${{ needs.version-cz.outputs.version }}"
          git add pyproject.toml
          git commit -m "Update pyproject.toml to version ${{ needs.version-cz.outputs.version }}"
          git pull --rebase
          git push

      - name: Update poetry.lock
        continue-on-error: true
        run: |
          git config --global user.name "github-actions[bot]"
          git config --global user.email "github-actions[bot]@users.noreply.github.com"
          poetry lock
          git add poetry.lock
          git commit -m "Update poetry.lock"
          git pull --rebase
          git push


  release:
    name: Release
    needs: version-pyproject
    runs-on: ubuntu-latest
    steps:
      - name: Create Release
        uses: softprops/action-gh-release@v1
        with:
          draft: false
          prerelease: false
          generate_release_notes: true
          tag_name: ${{ needs.version-pyproject.outputs.version }}
        env:
          GITHUB_TOKEN: ${{ secrets.GITHUB_TOKEN }}


================================================
FILE: .github/workflows/ruff-ci.yml
================================================
name: Ruff CI

on:
  push:
    branches:
      - '*'         # matches every branch that doesn't contain a '/'
      - '*/*'       # matches every branch containing a single '/'
      - '**'        # matches every branch
  pull_request:

jobs:
  build:

    runs-on: ubuntu-latest

    strategy:
      max-parallel: 4
      matrix:
        python-version: ["3.11"]

    steps:
      - uses: actions/checkout@v2

      - name: Set up Python ${{ matrix.python-version }}
        uses: actions/setup-python@v2
        with:
          python-version: ${{ matrix.python-version }}

      - name: Install Dependencies
        run: |
          python -m pip install --upgrade pip
          python -m pip install ruff==0.7.1

      - name: ruff
        run: python -m ruff check .


================================================
FILE: .github/workflows/tests.yml
================================================
name: PyDoll Tests

on:
  push:
  pull_request:

jobs:
  tests:
    strategy:
      fail-fast: false
      matrix:
        os: [ubuntu-latest, windows-latest]
        python-version: ["3.10", "3.11", "3.12", "3.13"]
    runs-on: ${{ matrix.os }}
    steps:
      - uses: actions/checkout@v3
      - name: Set up Python ${{ matrix.python-version }}
        uses: actions/setup-python@v4
        with:
          python-version: ${{ matrix.python-version }}
      - name: Install dependencies
        run: |
          python -m pip install poetry
          poetry install
      - name: Install Chrome
        uses: browser-actions/setup-chrome@v1
        with:
          chrome-version: 132
      - name: Run tests with coverage
        run: |
          poetry run pytest -s -x --cov=pydoll -vv --cov-report=xml

      - name: Upload coverage to Codecov
        uses: codecov/codecov-action@v5
        with:
          file: ./coverage.xml
          flags: tests
          name: PyDoll Tests
          fail_ci_if_error: true
          token: ${{ secrets.CODECOV_TOKEN }}


================================================
FILE: .gitignore
================================================
__pycache__/
*.py[cod]
*$py.class

# C extensions
*.so

# Distribution / packaging
.Python
build/
develop-eggs/
dist/
downloads/
eggs/
.eggs/
lib/
lib64/
parts/
sdist/
var/
wheels/
share/python-wheels/
*.egg-info/
.installed.cfg
*.egg
MANIFEST

# PyInstaller
#  Usually these files are written by a python script from a template
#  before PyInstaller builds the exe, so as to inject date/other infos into it.
*.manifest
*.spec

# Installer logs
pip-log.txt
pip-delete-this-directory.txt

# Unit test / coverage reports
htmlcov/
.tox/
.nox/
.coverage
.coverage.*
.cache
nosetests.xml
coverage.xml
*.cover
*.py,cover
.hypothesis/
.pytest_cache/
cover/

# Translations
*.mo
*.pot

# Django stuff:
*.log
local_settings.py
db.sqlite3
db.sqlite3-journal

# Flask stuff:
instance/
.webassets-cache

# Scrapy stuff:
.scrapy

# Sphinx documentation
docs/_build/

# PyBuilder
.pybuilder/


# Jupyter Notebook
.ipynb_checkpoints

# IPython
profile_default/
ipython_config.py

# pyenv
#   For a library or package, you might want to ignore these files since the code is
#   intended to run in multiple environments; otherwise, check them in:
# .python-version

# pipenv
#   According to pypa/pipenv#598, it is recommended to include Pipfile.lock in version control.
#   However, in case of collaboration, if having platform-specific dependencies or dependencies
#   having no cross-platform support, pipenv may install dependencies that don't work, or not
#   install all needed dependencies.
#Pipfile.lock

# poetry
#   Similar to Pipfile.lock, it is generally recommended to include poetry.lock in version control.
#   This is especially recommended for binary packages to ensure reproducibility, and is more
#   commonly ignored for libraries.
#   https://python-poetry.org/docs/basic-usage/#commit-your-poetrylock-file-to-version-control
#poetry.lock

# pdm
#   Similar to Pipfile.lock, it is generally recommended to include pdm.lock in version control.
#pdm.lock
#   pdm stores project-wide configurations in .pdm.toml, but it is recommended to not include it
#   in version control.
#   https://pdm.fming.dev/latest/usage/project/#working-with-version-control
.pdm.toml
.pdm-python
.pdm-build/

# PEP 582; used by e.g. github.com/David-OConnor/pyflow and github.com/pdm-project/pdm
__pypackages__/

# Celery stuff
celerybeat-schedule
celerybeat.pid

# SageMath parsed files
*.sage.py

# Environments
.env
.venv
env/
venv/
ENV/
env.bak/
venv.bak/

# Spyder project settings
.spyderproject
.spyproject

# Rope project settings
.ropeproject

# mkdocs documentation
/site

# mypy
.mypy_cache/
.dmypy.json
dmypy.json

# Pyre type checker
.pyre/

# pytype static type analyzer
.pytype/

# Cython debug symbols
cython_debug/

# PyCharm
#  JetBrains specific template is maintained in a separate JetBrains.gitignore that can
#  be found at https://github.com/github/gitignore/blob/main/Global/JetBrains.gitignore
#  and can be added to the global gitignore or merged into this file.  For a more nuclear
#  option (not recommended) you can uncomment the following to ignore the entire idea folder.
#.idea/

.czrc
.ruff_cache/

# Dev test file
dev_test_file.py


================================================
FILE: .python-version
================================================
3.12.5


================================================
FILE: CHANGELOG.md
================================================
## 2.21.3 (2026-03-14)

### Fix

- **test**: improve OOPIF integration test reliability
- **iframe**: resolve nested OOPIF iframes inside shadow roots

## 2.21.2 (2026-03-12)

### Fix

- release commit

## 2.21.1 (2026-03-03)

### Fix

- **keyboard**: send correct key, code and keycode in type_text
- **elements**: fix humanized interactions inside iframes
- humanized scroll overshoot correction causes infinite loop

## 2.21.0 (2026-03-01)

### Feat

- **interactions**: change humanize default from True to False

### Fix

- **elements**: forward humanize flag to click in type_text

## 2.20.2 (2026-02-18)

### Fix

- **command**: increase default command timeout from 10s to 60s across multiple components
- **tab**: remove temporary flag to avoid duplicate callback removal

## 2.20.1 (2026-02-16)

### Fix

- **tab**: replace readyState polling with CDP events in navigation

## 2.20.0 (2026-02-13)

### Feat

- **mouse**: add timing property for runtime configuration
- **requests**: add record() and replay() to Request class
- **requests**: add HAR network recorder
- **protocol**: add HAR 1.2 type definitions

### Fix

- **requests**: use surgical callback removal instead of nuclear clear_callbacks

### Refactor

- **tab**: extract bundle static methods to utils module

## 2.19.0 (2026-02-12)

### Feat

- **interactions**: default humanize=True for keyboard type_text
- **elements**: integrate Mouse API into WebElement.click()
- **interactions**: add Mouse API with humanized simulation
- **browser**: add webrtc_leak_protection property to ChromiumOptions
- **browser**: add automatic User-Agent consistency override

### Fix

- **utils**: harden SOCKS5 proxy forwarder security and robustness

## 2.18.0 (2026-02-11)

### Feat

- **utils**: add SOCKS5 proxy forwarder and convert utils to package
- **elements**: add cross-iframe selector support for XPath and CSS

## 2.17.0 (2026-02-08)

### Feat

- **tab**: refactor cloudflare bypass to use shadow root traversal
- **elements**: add shadow root timeout, CSS restriction and context propagation
- **tab**: add find_shadow_roots with OOPIF traversal and timeout
- **elements**: add shadow DOM support

### Fix

- **docs**: replace shadow.find() with query() in all documentation
- **tests**: replace shadow.find() with query() in integration tests
- **elements**: use float timeout and add contextual WaitElementTimeout messages

## 2.16.0 (2026-02-06)

### Feat

- add clear method for input and enhance page load state handling

### Fix

- **browser**: support secure websocket connections

## 2.15.1 (2026-01-04)

### Fix

- filter Symbol properties from element query results

## 2.15.0 (2025-12-24)

### Feat

- Implement incognito mode cookie retrieval for `tab.get_cookies()` and update related documentation

### Fix

- inconsistency in type checking
- Dispatch `KEY_DOWN` and `KEY_UP` events for character typing

## 2.14.0 (2025-12-10)

### Feat

- get_tab_by_target method added
- get_tab_by_target method added

### Fix

- adding type: ignore in JavascriptDialogOpeningEvent object
- adding type: ignore in JavascriptDialogOpeningEvent object

## 2.13.1 (2025-12-07)

### Fix

- add stuck scroll detection and minimum flick distance to humanized scroll, and correct scroll distance calculation.

## 2.13.0 (2025-12-07)

### Feat

- Implement humanized keyboard typing and physics-based scroll, and add iframe interaction support.

## 2.12.4 (2025-11-29)

### Fix

- optimize iframe resolution logic by adjusting backend node ID checks and enhancing child frame handling
- refine OOPIF resolution and frame attachment logic for improved handling of backend node IDs
- enhance OOPIF target attachment logic for improved session handling

## 2.12.3 (2025-11-27)

### Fix

- improve frame retrieval logic for better session handling

## 2.12.2 (2025-11-19)

### Fix

- adjust find_elements_mixin.py to refine return types and defaults

## 2.12.1 (2025-11-14)

### Fix

- continue cleanup process if temporary directory still exists
- adjust sleep duration for Windows and enhance temp dir cleanup
- enhance error handling for locked files on Windows systems
- remove unnecessary retry_times parameter in file processing
- ensure temp directory cleanup handles Chromium locked files
- enhance element selection and text extraction for better stability
- handle oopif targets
- change way to interact with iframes

### Refactor

- refactor iframe context handling in FindElementsMixin class

### Perf

- update Chrome options for better memory management and stability

## 2.12.0 (2025-11-04)

### Feat

- **execute_script**: validate element argument usage
- **tab,element,chrome**: revert arguments and add Chromium paths
- add a retry decorator for handling function execution failures

### Fix

- import TopLevelTargetRequired in test_browser_tab.py
- allow one additional retry attempt in the retry decorator

### Refactor

- **tab,element**: simplify execute_script parameters
- **element**: move and enhance execute_script from tab
- **tab**: separate execute_script concerns and enhance with comprehensive options

## 2.11.0 (2025-11-02)

### Feat

- add input handling functions and key constants for editing
- add KeyboardAPI for simulating keyboard input actions
- add KeyboardAPI integration for enhanced keyboard control

### Fix

- enhance text insertion and deprecate legacy key methods

## 2.10.0 (2025-11-01)

### Feat

- add ScrollAPI for enhanced page scrolling capabilities

## 2.9.3 (2025-10-30)

### Refactor

- keep take_screenshot consistent
- refactor type hints for better clarity and future compatibility

## 2.9.2 (2025-10-19)

### Fix

- update process creation to capture output and clean proxy format
- preserve query and fragment in WebSocket URL for tabs

### Refactor

- remove debug logging for request status and network events
- refactor logger messages to use consistent single quotes
- fix merge conflicts
- add logging for browser lifecycle and context management events
- refactor proxy parsing logic for improved clarity and efficiency

## 2.9.1 (2025-10-15)

### Fix

- change download event handling to use PageEvent instead of BrowserEvent

### Refactor

- use early return in setup proxy method

## 2.9.0 (2025-10-05)

### Feat

- add configurable page load state

## 2.8.2 (2025-10-03)

### Fix

- implement proxy authentication handling for browser tabs
- map exception when trying to take a screenshot of an iframe

## 2.8.1 (2025-09-27)

### Fix

- store the opened tab in the _tabs_opened dictionary
- **elements**: correctly detect parenthesized XPath expressions

### Refactor

- simplify FindElementsMixin._get_expression_type startswith checks into single tuple

## 2.8.0 (2025-08-28)

### Feat

- adding get_siblings_elements method
- adding get_children_elements method
- refactor Tab class to support optional WebSocket address handling
- add WebSocket connection support for existing browser instances
- add optional WebSocket address support in connection handler

### Fix

- add a raise_exc option to the get siblings and get children methods
- improving children and parent retrieval docstring and creating a private generic method for them
- using new execute_script public method
- solving conflicts
- rename pages fixtures files and adding a error test

### Refactor

- refactor Tab class to improve initialization and error handling
- refactor Browser class to manage opened tabs and WebSocket setup
- add new exception classes for connection and WebSocket errors

## 2.7.0 (2025-08-22)

### Feat

- refactor WebElement methods to use a unified naming convention
- add Response type and new bring_to_front method to Tab class
- improve element interactability scripts

### Fix

- **browser**: add google-chrome-stable path for Arch Linux AUR package
- run actions to fix badges
- enforce combined condition logic in wait_until
- **web_element**: raise WaitElementTimeout on wait_until timeout

### Refactor

- update command responses to use Response for empty responses
- **webelement**: simplify wait_until condition mapping

## 2.6.0 (2025-08-10)

### Feat

- add DownloadTimeout exception for file download timeouts
- add context manager for handling file downloads in Tab class

### Refactor

- add type checking for connection handler in mixin class
- add type overloads for event callback in Browser class

## 2.5.0 (2025-08-07)

### Feat

- add HTTP client functionality using the browser's fetch API
- add HTTP response object for browser-based fetch requests
- implement Request class for HTTP requests using fetch API
- add Request handling and improve network log retrieval methods

### Fix

- reject cookies with empty names during parsing in Request class
- refactor imports to include NotRequired and TypedDict from typing_extensions
- update imports to use typing_extensions for compatibility reasons
- check for None in events_enabled before updating params
- remove unused event type aliases and clean up imports

### Refactor

- deprecating headless argument in start method and adding it to browser options properties
- add asynchronous function for makeRequest in JavaScript
- refactor imports for cleaner organization and improved clarity
- refactor type hints in FindElementsMixin for clarity and type safety
- refactor type hints and improve command method signatures
- refactor event handling to use specific event types for clarity
- refactor connection handler to use CDPEvent and typed commands
- refactor storage command methods to return specific command types
- refactor target command methods to use specific command types
- refactor command return types to specific command classes
- refactor page commands to use specific command types directly
- refactor network commands to use specific command types
- refactor input command methods to return specific command types
- refactor fetch_commands to use updated type definitions
- refactor enums to inherit from str for better compatibility
- refactor DOM command types for improved code clarity and structure
- refactor command and event parameter types for better typing
- refactor command responses to use EmptyResponse where applicable
- improve protocol types for target domain
- improve protocol types for storage domain
- refactor command response types for improved readability and consistency
- improve protocol types for page domain
- add IncludeWhitespace and RelationType enums to DOM types
- improve protocol types for input domain
- refactor AuthChallengeResponse and remove legacy definitions
- remove legacy WindowBoundsDict for cleaner type definitions
- add new TypedDicts and enums for runtime event parameters
- refactor DOM event types and methods for better clarity and structure
- refactor fetch command return types for better clarity and structure
- enhance browser command functionality with new methods and types
- add TypedDict and Enum definitions for emulation and debugging
- improve protocol types for network domain

## 2.4.0 (2025-08-01)

### Feat

- changing bool prefs to properties and adding support to user-data-dir preferences
- adding prefs options customization
- add overloads for find and query methods in FindElementsMixin
- add method to retrieve parent element and its attributes
- implements start_timeout option

### Fix

- adding typehint and fixing some codes
- removing options preferences private attributes
- set default URL to 'about:blank' in create_target method
- change navigation when creating a new tab
- add type hinting support and update project description

### Refactor

- remove redundant asterisk from find method overloads and reorganize query method overloads
- refine type hint for response parameter and improve key check

## 2.3.1 (2025-07-12)

### Fix

- refactor click_option_tag to use direct script reference
- update script to use closest for more reliable DOM selection
- improve selection script for higher accuracy
- use correct class name and id selector in query()
- add fetch command methods to handle request processing

### Refactor

- change body type from dict to string in fetch command parameters
- refactor continue_request and fulfill_request to use options
- enhance continue_request and fulfill_request with new options

## 2.3.0 (2025-06-25)

### Feat

- **connection**: Upgrade adapt websockets version to 14.0

### Fix

- refine selector condition to include attributes check

## 2.2.3 (2025-06-20)

### Fix

- fix contextmanager for file upload

## 2.2.2 (2025-06-18)

### Fix

- fix call_function_on parameters order

### Refactor

- replace BeautifulSoup with custom HTML text extractor

## 2.2.1 (2025-06-16)

### Fix

- fix call parameters order in call_function_on method

## 2.2.0 (2025-06-15)

### Feat

- add method to retrieve non-extension opened tabs as Tab instances

### Refactor

- refactor attribute assignments to include type annotations
- implement singleton pattern for Tab instances by target_id

## 2.1.0 (2025-06-14)

### Feat

- add new script-related exception classes for better handling
- add functions to clean scripts and check return statements
- add methods to retrieve network response body and logs

### Fix

- click in the input before typing and fix documentation

### Refactor

- add overloads for execute_script to improve type safety

## 2.0.1 (2025-06-08)

### Fix

- fix private proxy configuration

## 2.0.0 (2025-06-08)

### BREAKING CHANGE

- pydoll v2 finished

### Feat

- intuitive way to interact with iframes
- refactor Keys class to Key and add utility methods for enums
- add Event TypedDict for standardized event structure
- add TargetEvent enum for Chrome DevTools Protocol events
- add StorageEvent enumeration for Chrome DevTools Protocol events
- add RuntimeEvent enumeration for Chrome DevTools Protocol events
- add PageEvent enumeration for Chrome DevTools Protocol events
- add NetworkEvent enumeration for Chrome DevTools Protocol events
- add InputEvent enum for Chrome DevTools input events
- add FetchEvent enumeration for Chrome DevTools Protocol events
- add DomEvent enumeration for Chrome DevTools Protocol events
- add BrowserEvent enum for Chrome DevTools protocol events
- add methods to enable and disable the runtime domain commands
- add new enums for whitespace, axes, pseudo types, and modes
- add DOM response types and corresponding response classes
- add DOM command types and parameter definitions for pydoll
- add enums for key, mouse, touch, and drag event types
- add input command types for touch, mouse, and keyboard events
- enhance TargetCommands class with new methods for targets management
- add TypedDicts for target response types and browser contexts
- add TypedDict definitions for target command parameters
- add storage-related enumerations for bucket durability and types
- enhance StorageCommands with new methods for data management
- add storage response types and related classes for handling data
- add storage command types using TypedDict for structured params
- add new enumeration classes for serialization and object types
- add runtime response types for handling various object previews
- add initial runtime command types for protocol handling
- add constants for various encoding, formats, and policies
- add TypedDict definitions for page response types and results
- add typed dictionaries for various page command parameters
- add new command parameter classes for network resource handling
- add TypedDict definitions for network response types
- organize command types into structured imports and exports
- add network command types and parameters for cookie management
- add enums for cookie priorities, connection types, and encodings
- add response classes for browser window target retrieval
- setup mkdocs and install related packages
- add async text property for retrieving element text

### Fix

- remove target directory from .gitignore file
- fix typo in USB_UNRESTRICTED constant for consistency
- add new network command parameters and methods for cookies
- change postData type from dict to string in ContinueRequestParams

### Refactor

- refactor screenshot path handling and enhance error checking
- refactor type hints from List to built-in list for consistency
- refine XPath condition handling and ensure integer coordinates
- refactor condition checks to ensure against None values
- refactor exception handling and add browser path validation function
- rename BrowserOptionsManager to ChromiumOptionsManager
- refactor Edge class to use ChromiumOptionsManager and simplify path validation
- refactor Chrome class to use Chromium-specific options manager
- refactor Browser class to use options manager and improve methods
- refactor Options class to ChromiumOptions and use type hints
- refactor to create ChromiumOptionsManager for better clarity
- add abstract base classes for browser options management
- use `message.get('id')` for safer ID checks in response
- refactor message handling to support multiple message types
- refactor element finding methods for enhanced flexibility and clarity
- rename method for better clarity in captcha element handling
- refactor type hints for event callback parameters and options
- simplify ping call by inlining WebSocketClientProtocol cast
- refactor EventsManager to use typed Event objects consistently
- add runtime events management to the Tab class functionality
- update event callback signatures for better type handling
- remove unused import of Response in runtime_commands.py
- add Response import to page_commands for improved functionality
- refactor response classes to use TypedDict for better typing
- refactor WebElement class to organize exception imports clearly
- refactor exception handling in FindElementsMixin class
- refactor exception handling to use custom timeout and connection errors
- remove unused import statements in events_manager.py
- refactor error handling to use specific exceptions for clarity
- refactor error handling to use custom exception for arguments
- fix PermissionError raising in TempDirectoryManager class
- refactor error handling to use specific exceptions for clarity
- handle unsupported OS with a custom exception in Edge class
- raise UnsupportedOS exception for unsupported operating systems
- refactor browser error handling and improve method return types
- refactor exception classes to improve organization and clarity
- refactor element finding methods to use updated command structure
- refactor WebElement class for improved structure and clarity
- refactor import statements and clean up code formatting
- refactor command imports and enhance download behavior method
- refactor Tab import and update FetchCommands method calls
- refactor ConnectionHandler docstrings for clarity and conciseness
- refactor command and event managers for improved type safety
- refactor ConnectionHandler to improve WebSocket management and clarity
- add Tab class for managing browser tabs via CDP integration
- enhance TempDirectoryManager with detailed docstrings and type hints
- refactor ProxyManager to enhance proxy credential handling
- refactor Browser class to enhance automation capabilities and structure
- move commands to a different module
- define base structures for commands and responses in protocol
- import Rect from dom_commands_types for response handling
- refactor cookie-related types for improved clarity and consistency
- remove unnecessary whitespace in docstring of InputCommands class
- refactor DOM commands to improve structure and add functionality
- refactor InputCommands to enhance user input simulation methods
- add CookieParam TypedDict to define cookie attributes
- add new runtime command methods for JavaScript bindings and promises
- remove unused method to clear accepted encodings in network commands
- update ResetPermissionsParams to use NotRequired for context ID
- refactor PageCommands to improve structure and add type hints
- simplify import statements by using wildcard imports for responses
- add new response types and update existing response classes
- consolidate command imports using wildcard imports for clarity
- correct post_data type from dict to str in FetchCommands class
- refactor NetworkCommands to use structured command parameters
- refactor fetch command methods to use static methods directly
- refactor BrowserCommands to use static methods and improve clarity
- refactor response imports and update __all__ definitions
- refactor import statements for better readability and structure
- refactor import statements for consistency in response types
- refactor import and rename EnableParams to FetchEnableParams
- refactor import statement for CommandParams module path
- refactor fetch command templates to use Command class
- add enums for window states, download behaviors, and permissions
- remove unused enum imports and rename base_types module
- refactor command structures for better organization and clarity
- rename command and response modules for better clarity
- refactor imports for better organization and readability
- add browser command methods for version, permissions, and downloads
- add command and response types for protocol implementation
- refactor execute_command to use type annotations for clarity
- refactor command methods to specify response types in BrowserCommands
- refactor command structures and introduce base CommandParams class
- refactor browser command constants to use Command class type
- refactor connection imports and rename manager files for clarity
- refactor BrowserType import to a common constants module
- refactor browser modules to use the new chromium structure
- refactor element imports and remove deprecated element file
- refactor import paths to use the protocol submodule structure
- move command files to the protocol directory for better structure
- rename insert_text to paste_text and remove unused files
- refactor the `InputCommands` class to enhance clarity and simplicity in its operations
- add deprecation warning to get_element_text()

## 1.7.0 (2025-04-06)

### Feat

- refactor captcha handling with adjustable wait times and parameters

## 1.6.0 (2025-04-06)

### Feat

- add connect method to handle existing port scenarios
- create enable_auto_solve_cloudflare_captcha method
- add context manager to bypass Cloudflare Turnstile captcha

## 1.5.1 (2025-03-31)

### Fix

- handle headers input as list or dictionary in fetch command

## 1.5.0 (2025-03-26)

### Feat

- add flag to run browser on headless mode on start function

### Fix

- Wait for the file `CrashpadMetrics-active.pma` to be released and cleaned up
- Catch websockets.ConnectionClosed errors on duplicate close()
- move connection closed log inside if statement

## 1.4.0 (2025-03-23)

### Feat

- Update initialize_options method to allow optional browser_type parameter
- Refactor Edge browser options handling to use EdgeOptions class
- Supports initialization options based on browser type
- Edge browser constructors to support optional connection port parameters
- Add Microsoft Edge browser support
- 为 Edge 浏览器添加默认用户数据目录支持
- Add Microsoft Edge browser support

### Refactor

- Clean up imports and improve code formatting across browser modules
- Simplify user data directory setup and enhance Edge browser path handling

## 1.3.3 (2025-03-18)

### Fix

- solve browser invalid domain events issue
- improve process termination
- improve process management and deactivate websockets connection size limit

### Refactor

- import commands and events from __init__.py

## 1.3.2 (2025-03-13)

### Fix

- fixed the tests and used lint for the OS multi path support
- support multiple default Chrome paths on each OS

## 1.3.1 (2025-03-12)

### Fix

- remove unnecessary encoding from screenshot response data

## 1.3.0 (2025-03-12)

### Feat

- add method to retrieve screenshot as base64 encoded string

## 1.2.4 (2025-03-11)

### Fix

- refactor Chrome constructor to use Optional for parameters

## 1.2.3 (2025-03-11)

### Fix

- refactor proxy configuration retrieval for cleaner code flow

## 1.2.2 (2025-03-10)

### Fix

- Get file extension from file path and changes use of reserved word 'format' to 'fmt'

## 1.2.1 (2025-03-09)

### Fix

- resolve issue #29 where browser path was not found on macOS
- Quickstart code given in README is wrong

## 1.2.0 (2025-02-11)

### Feat

- add close method and command to Page class functionality

## 1.1.0 (2025-02-11)

### Feat

- add method to retrieve Page instance by its ID in Browser class

## 1.0.1 (2025-02-10)

### Fix

- add dialog property to ConnectionHandler and manage dialog state

## 1.0.0 (2025-02-05)

### BREAKING CHANGE

- now you'll have to use By.CSS_SELECTOR instead of By.CSS

### Feat

- refactor import and export statements for better readability
- update changelog for version 0.7.0 and fix dependency versions
- add ping method to ConnectionHandler for browser connectivity check
- add tests for BrowserCommands in test_browser_commands.py

### Fix

- add initial module files for commands, connection, events, and mixins
- add connection port parameter to Chrome browser initialization
- use deepcopy for templates to prevent mutation issues

### Refactor

- rename constant CSS to CSS_SELECTOR
- add command imports and remove obsolete connection handler code
- refactor methods to be static in ConnectionHandler class
- refactor proxy configuration and cleanup logic in Browser class
- refactor ConnectionHandler to improve WebSocket management logic
- refactor Browser class initialization for better clarity and structure
- refactor Browser initialization to enhance flexibility and defaults
- refactor import statement for ConnectionHandler module
- refactor import paths for ConnectionHandler in browser modules
- implement ConnectionHandler for WebSocket browser automation
- implement command and event management for asynchronous processing
- remove unnecessary logging for WebSocket address fetching
- refactor Chrome class to use BrowserOptionsManager for path validation
- implement proxy and browser management in the new managers module
- refactor Browser class to use manager classes for better structure
- refactor DOM command scripts for clarity and efficiency

## 0.7.0 (2024-12-09)

### Feat

- autoremove dialog from connection_handler when closed
- add handle_dialog method to PageCommands class
- add dialog handling methods to Page class
- add support for handling JavaScript dialog opening events
- refactor network response handling for base64 encoding support
- add clipping option for screenshots and implement element capture

### Fix

- index error on method get_dialog_message
- update screenshot format from 'jpg' to 'jpeg' for consistency
- handle potential IndexError when retrieving valid page targetId
- filter valid pages using URL condition instead of title check

### Refactor

- run ruff formatter to ensure code consistency
- run ruff formatter to ensure code consistency
- change screenshot format from PNG to JPG in commands and element

## 0.6.0 (2024-11-18)

### Feat

- add callback ID handling for page load events in Page class
- update event registration to return callback IDs and add removal
- refactor DOM commands to use object_id instead of node_id

### Fix

- refactor page navigation and loading logic for efficiency
- add page reload after navigating to a new URL in Page class
- refactor URL navigation to use evaluate_script for efficiency
- implement page refresh on URL unchanged and add navigation event
- update object ID reference in Page class for clarity
- refactor element search logic to simplify error handling
- DomCommands using `object_id` instead of `node_id` to prevent bugs
- handle OSError when cleaning up temporary directories in Browser

### Refactor

- change error log to warning for missing callback ID
- refactor DOM command scripts for improved readability and reuse
- rename methods for clarity and consistency in WebElement class
- refactor parameter names for consistency in target methods
- normalize variable naming for consistency in fetch commands

## 0.5.1 (2024-11-12)

### Fix

- simplify outer HTML retrieval for consistent object handling
- refactor click method to check option tag earlier in flow
- refactor bounding box retrieval to access nested response value
- handle KeyError instead of IndexError for element bounds retrieval
- enhance DOM command methods and rename for clarity and consistency
- add JavaScript bounding box retrieval for web elements
- remove redundant top-checks for element clicks in WebElement

## 0.5.0 (2024-11-11)

### Feat

- add method to generate command for calling a function on an object
- implement script execution and visibility checks in click method
- add JavaScript functions for element visibility and interaction

### Refactor

- enhance exception classes with descriptive error messages
- simplify command creation by using RuntimeCommands.evaluate_script
- refactor JavaScript execution and introduce runtime commands

## 0.4.4 (2024-11-11)

### Fix

- remove redundant DOM content loaded event handling logic

## 0.4.3 (2024-11-11)

### Fix

- rename event variables for clarity and improve timeout handling

### Refactor

- remove debug print statement from connection event handling

## 0.4.2 (2024-11-11)

### Fix

- update event handling to use DOM_CONTENT_LOADED for page load
- convert Browser context management to async methods

### Refactor

- fix string formatting in logger info message for clarity

## 0.4.1 (2024-11-08)

### Fix

- fixes workflow by removing unnecessary hyphen
- reduce sleep duration in key press handling for improved speed

## 0.4.0 (2024-11-08)

### Feat

- add type_keys method for realistic key input simulation

## 0.3.1 (2024-11-08)

### Fix

- adding new package version
- removing encode utf8 in get_pdf_base64

## 0.3.0 (2024-11-08)

### Feat

- set_download_path added in browser class methods

## 0.2.0 (2024-11-08)

### Feat

- dynamic lib version using pyproject

## 0.1.1 (2024-11-07)

### Fix

- ensure browser process terminates after executing close command

## 0.1.0 (2024-11-07)

### Feat

- add method to delete all cookies from the browser session
- add is_enabled property to check element's enabled status
- add option to raise exception in wait_element method
- add method to set browser download path via command
- refactor text extraction using BeautifulSoup for accuracy
- add method to get properties and improve XPath handling
- refactor text retrieval methods and improve code readability
- add timeout parameter to page navigation and loading methods
- add cookie management and scroll into view functionality
- add method to retrieve page PDF data as base64 string
- add async property to retrieve inner HTML of the element
- add async page_source property to retrieve page source code
- add async property to retrieve the current page URL
- add method to find multiple DOM elements using selectors
- refactor WebElement to use FindElementsMixin for clarity
- add FindElementsMixin for asynchronous DOM element handling
- add methods to retrieve network response bodies from logs
- add method to retrieve matching network logs from the page
- add cookie management methods to the Browser class
- add ElementNotFound exception to handle missing elements
- add value property and handle option tag clicks in WebElement
- rename FIND_ELEMENT_XPATH_TEMPLATE to EVALUATE_TEMPLATE
- add exception handling for element not found in find_element method
- downgrade Python version requirement to 3.10 in pyproject.toml
- add async function to fetch browser WebSocket address
- simplify text input handling by using insert_text command
- add TargetCommands class for managing target operations
- add method to generate command for disabling the Page domain
- add method to generate text insertion commands for inputs
- add Page class to manage browser page interactions and events
- add page management methods to the Browser class
- add detailed logging for command responses and event handling
- add event classes for browser, DOM, fetch, and network actions
- add NetworkCommands class for managing network operations
- implement fetch command methods for handling requests and responses
- add method to enable DOM domain events in DomCommands class
- add proxy configuration and fetch event handling to Browser
- refactor connection errors to use custom exceptions for clarity
- add methods to clear callbacks and close WebSocket connection
- remove unnecessary newline at the end of PageEvents class file
- add context managers and async file handling for efficiency
- implement singleton pattern and prevent multiple initializations
- add dynamic connection port handling for browser instance
- add temporary directory management for browser session storage
- add logging for connection events and command executions
- add PageEvents class with PAGE_LOADED event constant
- add temporary callback option to event registration method
- add page event handling and improve loading timeout management
- add utility function to decode base64 images to bytes
- add WebElement class for handling browser elements asynchronously
- add enumeration for selector types in constants module
- add PageCommands class for browser page control functions
- add InputCommands class for handling mouse and keyboard events
- implement DOM commands for interacting with web elements
- refactor BrowserCommands to include new window management methods
- implement some basic methods to navigate and control the browser instance
- enhance ConnectionHandler with detailed docstrings for methods
- add .gitignore, .python-version, and poetry.lock files

### Fix

- browser context now uses the storage commands to get cookies, while the page context uses the network commands
- update cookie retrieval to use NetworkCommands for consistency
- remove download path method from Browser and add to Page class
- add options to disable first-run and browser check flags
- handle KeyError when retrieving network response bodies
- use get() to safely retrieve attributes in WebElement class
- rename class attribute retrieval for clarity and consistency
- enhance get_properties and simplify text retrieval method
- enhance create_web_element call with additional value parameter
- fix incorrect key access in JavaScript evaluation result
- update cookie management to clear browser cookies correctly
- filter pages by title instead of URL in Browser class
- filter out non-page entries when fetching valid page IDs
- xpath element solved
- refactor event callback storage to use unique callback IDs
- add JavaScript execution method and enhance click offsets
- simplify response handling and improve event callback structure
- reorder page event enabling to ensure proper browser startup
- add JSON handling and improve WebSocket command execution

### Refactor

- improve WebElement representation and handle None for nodeValue
- add newline at end of file for ElementNotFound exception class
- remove unused aiohttp import and clean up whitespace
- remove unnecessary blank lines in storage.py for clarity
- fix missing newline at the end of the file in page.py
- remove unnecessary whitespace in InputCommands class methods
- refactor DOM command methods for improved clarity and usability
- refactor Page class to inherit from FindElementsMixin
- refactor code to remove duplicate import of StorageCommands
- clarify error messages for command and callback validation
- refactor ConnectionHandler to simplify initialization and connect logic
- remove unnecessary whitespace in element.py for cleaner code
- refactor WebElement to enhance attribute retrieval methods
- refactor connection handling and improve error messaging
- refactor Browser class to use abstract base class and commands


================================================
FILE: CONTRIBUTING.md
================================================
# Contributing Guide

Thank you for your interest in contributing to the project! This document provides guidelines and instructions to help you contribute effectively.

## Table of Contents

- [Environment Setup](#environment-setup)
- [Development Workflow](#development-workflow)
- [Code Standards](#code-standards)
- [Testing](#testing)
- [Commit Messages](#commit-messages)
- [Pull Request Process](#pull-request-process)

## Environment Setup

### Prerequisites

- Python 3.10 or higher
- [Poetry](https://python-poetry.org/docs/#installation) for dependency management

### Installation

1. Clone the repository:
   ```bash
   git clone https://github.com/autoscrape-labs/pydoll.git
   cd pydoll
   ```

2. Install dependencies using Poetry:
   ```bash
   poetry install
   ```

3. Activate the virtual environment:
   ```bash
   poetry shell
   ```

## Development Workflow

1. Create a new branch for your contribution:
   ```bash
   git checkout -b feature/your-feature-name
   ```
   or
   ```bash
   git checkout -b fix/your-fix-name
   ```

2. Make your changes following the code and testing guidelines.

3. Check your code using the linter:
   ```bash
   poetry run task lint
   ```

4. Format your code:
   ```bash
   poetry run task format
   ```

5. Run the tests to ensure everything is working:
   ```bash
   poetry run task test
   ```

6. Commit your changes following the commit conventions (see below).

7. Push your changes and open a Pull Request.

## Code Standards

This project uses [Ruff](https://github.com/astral-sh/ruff) for linting and code formatting. The code standards are defined in the `pyproject.toml` file.

### Linting and Formatting

To check if your code follows the standards:

```bash
poetry run task lint
```

To automatically fix some issues and format your code:

```bash
poetry run task format
```

**Important:** Make sure to resolve all linting issues before submitting your changes. Code that doesn't pass the linting checks will not be accepted.

## Testing

### Writing Tests

For each new feature or modification, it is **mandatory** to write corresponding tests. We use `pytest` for testing.

- Tests should be placed in the `tests/` directory
- Test file names should start with `test_`
- Test function names should start with `test_`

### Running Tests

To run all tests:

```bash
poetry run task test
```

This will also generate a code coverage report (HTML) that can be viewed in the `htmlcov/` folder.

## Commit Messages

This project follows the [Conventional Commits](https://www.conventionalcommits.org/) standard for commit messages. We use the `commitizen` tool to facilitate the creation of standardized commits.

### Commit Message Structure

```
<type>[optional scope]: <description>

[optional body]

[optional footer(s)]
```

### Commit Types

- **feat**: A new feature
- **fix**: A bug fix
- **docs**: Documentation-only changes
- **style**: Changes that do not affect the meaning of the code (whitespace, formatting, etc.)
- **refactor**: A code change that neither fixes a bug nor adds a feature
- **perf**: A code change that improves performance
- **test**: Adding or correcting tests
- **build**: Changes that affect the build system or external dependencies
- **ci**: Changes to CI configuration files
- **chore**: Other changes that don't modify src or test files

### Examples of Good Commit Messages

```
feat(parser): add ability to parse arrays
```

```
fix(networking): resolve connection timeout issue

A problem was identified in the networking library that
caused unexpected timeouts. This change increases the
default timeout from 10s to 30s.
```

## Pull Request Process

1. Verify that your code passes all tests and linting checks.
2. Push your branch to the repository.
3. Open a Pull Request to the main branch.
4. In the PR description, clearly explain what was changed and why.
5. Link any related issues to your PR.
6. Wait for the code review. Read the comments and make necessary changes.

## Questions?

If you have questions or need help, open an issue in the repository or contact the project maintainers.

---

We appreciate your contributions to make this project better! 

================================================
FILE: LICENSE
================================================
The MIT License (MIT)

Copyright © 2025 AutoscrapeLabs

Permission is hereby granted, free of charge, to any person obtaining a copy of this software and associated documentation files (the “Software”), to deal in the Software without restriction, including without limitation the rights to use, copy, modify, merge, publish, distribute, sublicense, and/or sell copies of the Software, and to permit persons to whom the Software is furnished to do so, subject to the following conditions:

The above copyright notice and this permission notice shall be included in all copies or substantial portions of the Software.

THE SOFTWARE IS PROVIDED “AS IS”, WITHOUT WARRANTY OF ANY KIND, EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.


================================================
FILE: README.md
================================================
<p align="center">
    <img src="https://github.com/user-attachments/assets/2c380638-b04a-4b04-b1c8-2958e4237a94" alt="Pydoll Logo" /> <br>
</p>
<p align="center">Async-native, fully typed, built for evasion and performance.</p>

<p align="center">
    <a href="https://github.com/autoscrape-labs/pydoll/stargazers"><img src="https://img.shields.io/github/stars/autoscrape-labs/pydoll?style=social"></a>
    <a href="https://codecov.io/gh/autoscrape-labs/pydoll" >
        <img src="https://codecov.io/gh/autoscrape-labs/pydoll/graph/badge.svg?token=40I938OGM9"/>
    </a>
    <img src="https://github.com/autoscrape-labs/pydoll/actions/workflows/tests.yml/badge.svg" alt="Tests">
    <img src="https://github.com/autoscrape-labs/pydoll/actions/workflows/ruff-ci.yml/badge.svg" alt="Ruff CI">
    <img src="https://github.com/autoscrape-labs/pydoll/actions/workflows/mypy.yml/badge.svg" alt="MyPy CI">
    <img src="https://img.shields.io/badge/python-%3E%3D3.10-blue" alt="Python >= 3.10">
    <a href="https://deepwiki.com/autoscrape-labs/pydoll"><img src="https://deepwiki.com/badge.svg" alt="Ask DeepWiki"></a>
</p>

<p align="center">
    <a href="https://pydoll.tech/">Documentation</a> &middot;
    <a href="#getting-started">Getting Started</a> &middot;
    <a href="#features">Features</a> &middot;
    <a href="#support">Support</a>
</p>

Pydoll automates Chromium-based browsers (Chrome, Edge) by connecting directly to the Chrome DevTools Protocol over WebSocket. No WebDriver binary, no `navigator.webdriver` flag, no compatibility issues.

It combines a high-level API for common tasks with low-level CDP access for fine-grained control over network, fingerprinting, and browser behavior. The entire codebase is async-native and fully type-checked with mypy.

### Top Sponsors

<a href="https://substack.thewebscraping.club/p/pydoll-webdriver-scraping?utm_source=github&utm_medium=repo&utm_campaign=pydoll">
    <img src="public/images/banner-the-webscraping-club.png" alt="The Web Scraping Club" />
</a>

<sub>Read a full review of Pydoll on <b><a href="https://substack.thewebscraping.club/p/pydoll-webdriver-scraping?utm_source=github&utm_medium=repo&utm_campaign=pydoll">The Web Scraping Club</a></b>, the #1 newsletter dedicated to web scraping.</sub>

### Sponsors

<table>
  <tr>
    <td><a href="https://www.thordata.com/?ls=github&lk=pydoll"><img src="public/images/Thordata-logo.png" height="30" alt="Thordata" /></a></td>
    <td><a href="https://dashboard.capsolver.com/passport/register?inviteCode=WPhTbOsbXEpc"><img src="public/images/capsolver-logo.png" height="40" alt="CapSolver" /></a></td>
    <td><a href="https://www.testmuai.com/?utm_medium=sponsor&utm_source=pydoll"><img src="public/images/logo-lamda-test.svg" height="30" width="130" alt="LambdaTest" /></a></td>
  </tr>
</table>

<sub>[Learn more about our sponsors](SPONSORS.md) &middot; [Become a sponsor](https://github.com/sponsors/thalissonvs)</sub>

### Why Pydoll

- **Stealth-first**: Human-like mouse movement, realistic typing, and granular [browser preference](https://pydoll.tech/docs/features/configuration/browser-preferences/) control for fingerprint management.
- **Async and typed**: Built on `asyncio` from the ground up, 100% type-checked with `mypy`. Full IDE autocompletion and static error checking.
- **Network control**: [Intercept](https://pydoll.tech/docs/features/network/interception/) requests to block ads/trackers, [monitor](https://pydoll.tech/docs/features/network/monitoring/) traffic for API discovery, and make [authenticated HTTP requests](https://pydoll.tech/docs/features/network/http-requests/) that inherit the browser session.
- **Shadow DOM and iframes**: Full support for [shadow roots](https://pydoll.tech/docs/deep-dive/architecture/shadow-dom/) (including closed) and cross-origin iframes. Discover, query, and interact with elements inside them using the same API.
- **Ergonomic API**: `tab.find()` for most cases, `tab.query()` for complex [CSS/XPath selectors](https://pydoll.tech/docs/deep-dive/guides/selectors-guide/).

## Installation

```bash
pip install pydoll-python
```

No WebDriver binaries or external dependencies required.

## What's New

<details>
<summary><b>HAR Network Recording</b></summary>
<br>

Record network activity during a browser session and export as HAR 1.2. Replay recorded requests to reproduce exact API sequences.

```python
from pydoll.browser.chromium import Chrome

async with Chrome() as browser:
    tab = await browser.start()

    async with tab.request.record() as capture:
        await tab.go_to('https://example.com')

    capture.save('flow.har')
    print(f'Captured {len(capture.entries)} requests')

    responses = await tab.request.replay('flow.har')
```

Filter by resource type:

```python
from pydoll.protocol.network.types import ResourceType

async with tab.request.record(
    resource_types=[ResourceType.FETCH, ResourceType.XHR]
) as capture:
    await tab.go_to('https://example.com')
```

[HAR Recording Docs](https://pydoll.tech/docs/features/network/network-recording/)
</details>

<details>
<summary><b>Page Bundles</b></summary>
<br>

Save the current page and all its assets (CSS, JS, images, fonts) as a `.zip` bundle for offline viewing. Optionally inline everything into a single HTML file.

```python
await tab.save_bundle('page.zip')
await tab.save_bundle('page-inline.zip', inline_assets=True)
```

[Screenshots, PDFs & Bundles Docs](https://pydoll.tech/docs/features/automation/screenshots-and-pdfs/)
</details>

<details>
<summary><b>Shadow DOM Support</b></summary>
<br>

Full Shadow DOM support, including closed shadow roots. Because Pydoll operates at the CDP level (below JavaScript), the `closed` mode restriction doesn't apply.

```python
shadow = await element.get_shadow_root()
button = await shadow.query('.internal-btn')
await button.click()

# Discover all shadow roots on the page
shadow_roots = await tab.find_shadow_roots()
for sr in shadow_roots:
    checkbox = await sr.query('input[type="checkbox"]', raise_exc=False)
    if checkbox:
        await checkbox.click()
```

Highlights:
- Closed shadow roots work without workarounds
- `find_shadow_roots()` discovers every shadow root on the page
- `timeout` parameter for polling until shadow roots appear
- `deep=True` traverses cross-origin iframes (OOPIFs)
- Standard `find()`, `query()`, `click()` API inside shadow roots

```python
# Cloudflare Turnstile inside a cross-origin iframe
shadow_roots = await tab.find_shadow_roots(deep=True, timeout=10)
for sr in shadow_roots:
    checkbox = await sr.query('input[type="checkbox"]', raise_exc=False)
    if checkbox:
        await checkbox.click()
```

[Shadow DOM Docs](https://pydoll.tech/docs/deep-dive/architecture/shadow-dom/)
</details>

<details>
<summary><b>Humanized Mouse Movement</b></summary>
<br>

Mouse operations produce human-like cursor movement by default:

- **Bezier curve paths** with asymmetric control points
- **Fitts's Law timing**: duration scales with distance
- **Minimum-jerk velocity**: bell-shaped speed profile
- **Physiological tremor**: Gaussian noise scaled with velocity
- **Overshoot correction**: ~70% chance on fast movements, then corrects back

```python
await tab.mouse.move(500, 300)
await tab.mouse.click(500, 300)
await tab.mouse.drag(100, 200, 500, 400)

button = await tab.find(id='submit')
await button.click()

# Opt out when speed matters
await tab.mouse.click(500, 300, humanize=False)
```

[Mouse Control Docs](https://pydoll.tech/docs/features/automation/mouse-control/)
</details>

## Getting Started

```python
import asyncio
from pydoll.browser import Chrome
from pydoll.constants import Key

async def google_search(query: str):
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://www.google.com')

        search_box = await tab.find(tag_name='textarea', name='q')
        await search_box.insert_text(query)
        await tab.keyboard.press(Key.ENTER)

        first_result = await tab.find(
            tag_name='h3',
            text='autoscrape-labs/pydoll',
            timeout=10,
        )
        await first_result.click()

        await tab.find(id='repository-container-header', timeout=10)
        print(f"Page loaded: {await tab.title}")

asyncio.run(google_search('pydoll site:github.com'))
```

## Features

<details>
<summary><b>Hybrid Automation (UI + API)</b></summary>
<br>

Use UI automation to pass login flows (CAPTCHAs, JS challenges), then switch to `tab.request` for fast API calls that inherit the full browser session: cookies, headers, and all.

```python
# Log in via UI
await tab.go_to('https://my-site.com/login')
await (await tab.find(id='username')).type_text('user')
await (await tab.find(id='password')).type_text('pass123')
await (await tab.find(id='login-btn')).click()

# Make authenticated API calls using the browser session
response = await tab.request.get('https://my-site.com/api/user/profile')
user_data = response.json()
```
[Hybrid Automation Docs](https://pydoll.tech/docs/features/network/http-requests/)
</details>

<details>
<summary><b>Network Interception and Monitoring</b></summary>
<br>

Monitor traffic for API discovery or intercept requests to block ads, trackers, and unnecessary resources.

```python
import asyncio
from pydoll.browser.chromium import Chrome
from pydoll.protocol.fetch.events import FetchEvent, RequestPausedEvent
from pydoll.protocol.network.types import ErrorReason

async def block_images():
    async with Chrome() as browser:
        tab = await browser.start()

        async def block_resource(event: RequestPausedEvent):
            request_id = event['params']['requestId']
            resource_type = event['params']['resourceType']

            if resource_type in ['Image', 'Stylesheet']:
                await tab.fail_request(request_id, ErrorReason.BLOCKED_BY_CLIENT)
            else:
                await tab.continue_request(request_id)

        await tab.enable_fetch_events()
        await tab.on(FetchEvent.REQUEST_PAUSED, block_resource)

        await tab.go_to('https://example.com')
        await asyncio.sleep(3)
        await tab.disable_fetch_events()

asyncio.run(block_images())
```
[Network Monitoring](https://pydoll.tech/docs/features/network/monitoring/) | [Request Interception](https://pydoll.tech/docs/features/network/interception/)
</details>

<details>
<summary><b>Browser Fingerprint Control</b></summary>
<br>

Granular control over [browser preferences](https://pydoll.tech/docs/features/configuration/browser-preferences/): hundreds of internal Chrome settings for building consistent fingerprints.

```python
options = ChromiumOptions()

options.browser_preferences = {
    'profile': {
        'default_content_setting_values': {
            'notifications': 2,
            'geolocation': 2,
        },
        'password_manager_enabled': False
    },
    'intl': {
        'accept_languages': 'en-US,en',
    },
    'browser': {
        'check_default_browser': False,
    }
}
```
[Browser Preferences Guide](https://pydoll.tech/docs/features/configuration/browser-preferences/)
</details>

<details>
<summary><b>Concurrency, Contexts and Remote Connections</b></summary>
<br>

Manage [multiple tabs](https://pydoll.tech/docs/features/browser-management/tabs/) and [browser contexts](https://pydoll.tech/docs/features/browser-management/contexts/) (isolated sessions) concurrently. Connect to browsers running in Docker or remote servers.

```python
async def scrape_page(url, tab):
    await tab.go_to(url)
    return await tab.title

async def concurrent_scraping():
    async with Chrome() as browser:
        tab_google = await browser.start()
        tab_ddg = await browser.new_tab()

        results = await asyncio.gather(
            scrape_page('https://google.com/', tab_google),
            scrape_page('https://duckduckgo.com/', tab_ddg)
        )
        print(results)
```
[Multi-Tab Management](https://pydoll.tech/docs/features/browser-management/tabs/) | [Remote Connections](https://pydoll.tech/docs/features/advanced/remote-connections/)
</details>

<details>
<summary><b>Retry Decorator</b></summary>
<br>

The `@retry` decorator supports custom recovery logic between attempts (e.g., refreshing the page, rotating proxies) and exponential backoff.

```python
from pydoll.decorators import retry
from pydoll.exceptions import ElementNotFound, NetworkError

@retry(
    max_retries=3,
    exceptions=[ElementNotFound, NetworkError],
    on_retry=my_recovery_function,
    exponential_backoff=True
)
async def scrape_product(self, url: str):
    # scraping logic
    ...
```
[Retry Decorator Docs](https://pydoll.tech/docs/features/advanced/decorators/)
</details>

---

## Contributing

Contributions are welcome. See [CONTRIBUTING.md](CONTRIBUTING.md) for guidelines.

## Support

If you find Pydoll useful, consider [sponsoring the project on GitHub](https://github.com/sponsors/thalissonvs).

## License

[MIT License](LICENSE)


================================================
FILE: README_zh.md
================================================
<p align="center">
    <img src="https://github.com/user-attachments/assets/219f2dbc-37ed-4aea-a289-ba39cdbb335d" alt="Pydoll Logo" /> <br>
</p>
<h1 align="center">Pydoll: Automate the Web, Naturally</h1>

<p align="center">
    <a href="https://github.com/autoscrape-labs/pydoll/stargazers"><img src="https://img.shields.io/github/stars/autoscrape-labs/pydoll?style=social"></a>
    <a href="https://codecov.io/gh/autoscrape-labs/pydoll" >
        <img src="https://codecov.io/gh/autoscrape-labs/pydoll/graph/badge.svg?token=40I938OGM9"/>
    </a>
    <img src="https://github.com/thalissonvs/pydoll/actions/workflows/tests.yml/badge.svg" alt="Tests">
    <img src="https://github.com/thalissonvs/pydoll/actions/workflows/ruff-ci.yml/badge.svg" alt="Ruff CI">
    <img src="https://github.com/thalissonvs/pydoll/actions/workflows/mypy.yml/badge.svg" alt="MyPy CI">
    <img src="https://img.shields.io/badge/python-%3E%3D3.10-blue" alt="Python >= 3.10">
    <a href="https://deepwiki.com/autoscrape-labs/pydoll"><img src="https://deepwiki.com/badge.svg" alt="Ask DeepWiki"></a>
</p>


<p align="center">
  📖 <a href="https://autoscrape-labs.github.io/pydoll/">文档</a> •
  🚀 <a href="#-快速上手">快速上手</a> •
  ⚡ <a href="#-高级功能">高级特性</a> •
  🤝 <a href="#-贡献">贡献</a> •
  💖 <a href="#-支持我的工作">赞助我</a>
</p>

- [English](README.md)

设想以下场景：你需要实现浏览器任务的自动化操作——无论是测试Web应用程序、从网站采集数据，还是批量处理重复性流程。传统方法往往需要配置外部驱动程序、进行复杂的系统设置，还可能面临诸多兼容性问题。

**Pydoll的诞生就是解决这些问题!!!**

Pydoll 采用全新设计理念，从零构建，直接对接 Chrome DevTools Protocol（CDP），无需依赖外部驱动。 这种精简的实现方式，结合高度拟真的点击、导航及元素交互机制，使其行为与真实用户几乎毫无区别。

我们坚信，真正强大的自动化工具，不应让用户困于繁琐的配置学习，也不该让用户疲于应对反爬系统的风控。使用Pydoll，你只需专注核心业务逻辑——让自动化回归本质，而非纠缠于底层技术细节或防护机制。

<div>
  <h4>做一个好人，给我们一个星星 ⭐</h4> 
    没有星星，就没有Bug修复。开玩笑的（也许）
</div>

## 🌟 Pydoll 的核心优势

- **零 WebDriver 依赖**：彻底告别驱动兼容性烦恼
- **类人交互引擎**：能够通过行为验证码如 reCAPTCHA v3 或 Turnstile，取决于 IP 声誉和交互模式
- **异步高性能**：支持高速自动化与多任务并行处理
- **拟真交互体验**：完美复刻真实用户行为模式
- **极简部署**：安装即用，开箱即自动化

## 最新功能

### 类人页面滚动 —— 像真实用户一样滚动！

现在你可以控制页面滚动，支持平滑动画并自动等待完成：

```python
from pydoll.constants import ScrollPosition

# 带平滑动画向下滚动（等待完成）
await tab.scroll.by(ScrollPosition.DOWN, 500, smooth=True)

# 导航至特定位置
await tab.scroll.to_bottom(smooth=True)
await tab.scroll.to_top(smooth=True)

# 需要速度时的即时滚动
await tab.scroll.by(ScrollPosition.UP, 300, smooth=False)
```

不同于立即返回的 `execute_script("window.scrollBy(...)")`，滚动API使用CDP的`awaitPromise`等待浏览器的`scrollend`事件，确保后续操作仅在滚动完全完成后执行。非常适合截取屏幕截图、加载延迟内容或创建真实的阅读模式。

### 键盘 API —— 完全控制键盘输入

全新的 `KeyboardAPI` 为页面级别的所有键盘交互提供了简洁、集中的接口：

```python
from pydoll.constants import Key

# 按单个键
await tab.keyboard.press(Key.ENTER)
await tab.keyboard.press(Key.TAB)

# 使用快捷键/组合键（最多3个键）
await tab.keyboard.hotkey(Key.CONTROL, Key.A)  # 全选（有效！）
await tab.keyboard.hotkey(Key.CONTROL, Key.C)  # 复制（有效！）
await tab.keyboard.hotkey(Key.CONTROL, Key.SHIFT, Key.ARROWRIGHT)  # 向右选择单词

# 复杂序列的手动控制
await tab.keyboard.down(Key.SHIFT)
await tab.keyboard.press(Key.ARROWRIGHT)  # 按住 Shift 选择文本
await tab.keyboard.up(Key.SHIFT)
```

**主要改进：**
- **集中化**：所有键盘操作通过 `tab.keyboard` 访问
- **智能修饰键检测**：快捷键自动检测并应用修饰键（Ctrl、Shift、Alt、Meta）
- **完整按键支持**：26个字母（A-Z）、10个数字（0-9）、所有功能键、数字键盘和特殊键
- **页面级快捷键**：适用于 Ctrl+C、Ctrl+V、Ctrl+A 等（由于 CDP 限制，浏览器 UI 快捷键不起作用）

> **⚠️ CDP 限制：** 浏览器 UI 快捷键（如 Ctrl+T 打开新标签，F12 打开开发者工具）通过 CDP 无法使用。请改用 Pydoll 的方法：`await browser.new_tab()`、`await tab.close()`。

### Retry 装饰器：生产级错误恢复

使用 `@retry` 装饰器将脆弱的脚本转变为强大的生产级爬虫。通过指数退避和自定义恢复策略，自动从网络故障、超时和临时错误中恢复：

```python
import asyncio
from pydoll.browser.chromium import Chrome
from pydoll.decorators import retry
from pydoll.exceptions import ElementNotFound, NetworkError

class ProductScraper:
    def __init__(self):
        self.tab = None
        self.retry_count = 0
    
    # 在每次重试前执行的恢复回调
    async def recover_from_failure(self):
        self.retry_count += 1
        print(f"尝试 {self.retry_count} 失败。恢复中...")
        
        # 刷新页面并恢复状态
        if self.tab:
            await self.tab.refresh()
            await asyncio.sleep(2)
    
    @retry(
        max_retries=3,
        exceptions=[ElementNotFound, NetworkError],
        on_retry=recover_from_failure,  # 执行恢复逻辑
        delay=2.0,
        exponential_backoff=True
    )
    async def scrape_product(self, url: str):
        if not self.tab:
            browser = Chrome()
            self.tab = await browser.start()
        
        await self.tab.go_to(url)
        title = await self.tab.find(class_name='product-title', timeout=5)
        return await title.text
```

**强大功能：**
- **智能重试逻辑**：仅对您定义的特定异常重试
- **指数退避**：逐步增加等待时间（1秒 → 2秒 → 4秒 → 8秒）
- **恢复回调**：在重试之间执行自定义逻辑（刷新页面、切换代理、重启浏览器）
- **生产验证**：自信地处理真实世界爬虫的混乱情况

非常适合处理速率限制、网络不稳定、动态内容加载和验证码检测。将不可靠的爬虫转变为防弹自动化。

[**📖 完整文档**](https://pydoll.tech/docs/zh/features/advanced/decorators/)

### 通过 WebSocket 进行远程连接 —— 随时随地控制浏览器！

现在你可以使用浏览器的 WebSocket 地址直接连接到已运行的实例，并立即使用完整的 Pydoll API：

```python
from pydoll.browser.chromium import Chrome

chrome = Chrome()
tab = await chrome.connect('ws://YOUR_HOST:9222/devtools/browser/XXXX')

# 直接开干：导航、元素自动化、请求、事件…
await tab.go_to('https://example.com')
title = await tab.execute_script('return document.title')
print(title)
```

这让你可以轻松对接远程/CI 浏览器、容器或共享调试目标——无需本地启动，只需指向 WS 端点即可自动化。

### 像专业人士一样漫游 DOM：get_children_elements() 与 get_siblings_elements()

两个让复杂布局遍历更优雅的小助手：

```python
# 获取容器的直接子元素
container = await tab.find(id='cards')
cards = await container.get_children_elements(max_depth=1)

# 想更深入？这将返回子元素的子元素（以此类推）
elements = await container.get_children_elements(max_depth=2) 

# 在横向列表中无痛遍历兄弟元素
active = await tab.find(class_name='item--active')
siblings = await active.get_siblings_elements()

print(len(cards), len(siblings))
```

用更少样板代码表达更多意图，特别适合动态网格、列表与菜单的场景，让抓取/自动化逻辑更清晰、更可读。

### WebElement：状态等待与新的公共 API

- 新增 `wait_until(...)` 用于等待元素状态，使用更简单：

```python
# 等待元素变为可见，直到超时
await element.wait_until(is_visible=True, timeout=5)

# 等待元素变为可交互（可见、位于顶层并可接收事件）
await element.wait_until(is_interactable=True, timeout=10)
```

- 以下 `WebElement` 方法现已公开：
  - `is_visible()`
    - 判断元素是否具有可见区域、未被 CSS 隐藏，并在需要时滚动进入视口。适用于交互前的快速校验。
  - `is_interactable()`
    - “可点击”状态：综合可见性、启用状态与指针事件命中等条件，适合构建更稳健的交互流程。
  - `is_on_top()`
    - 检查元素在点击位置是否为顶部命中目标，避免被覆盖导致点击失效。
  - `execute_script(script: str, return_by_value: bool = False)`
    - 在元素上下文中执行 JavaScript（this 指向该元素），便于细粒度调整与快速检查。

```python
# 使用 JS 高亮元素
await element.execute_script("this.style.outline='2px solid #22d3ee'")

# 校验状态
visible = await element.is_visible()
interactable = await element.is_interactable()
on_top = await element.is_on_top()
```

以上新增能力能显著简化“等待+验证”场景，降低自动化过程中的不稳定性，使用例更可预测。

### 浏览器上下文 HTTP 请求 - 混合自动化的游戏规则改变者！
你是否曾经希望能够发出自动继承浏览器所有会话状态的 HTTP 请求？**现在你可以了！**<br>
`tab.request` 属性为你提供了一个美观的 `requests` 风格接口，可在浏览器的 JavaScript 上下文中直接执行 HTTP 调用。这意味着每个请求都会自动获得 cookies、身份验证标头、CORS 策略和会话状态，就像浏览器本身发出请求一样。

**混合自动化的完美选择：**
```python
# 使用 PyDoll 正常导航到网站并登录
await tab.go_to('https://example.com/login')
await (await tab.find(id='username')).type_text('user@example.com')
await (await tab.find(id='password')).type_text('password')
await (await tab.find(id='login-btn')).click()

# 现在发出继承已登录会话的 API 调用！
response = await tab.request.get('https://example.com/api/user/profile')
user_data = response.json()

# 在保持身份验证的同时 POST 数据
response = await tab.request.post(
    'https://example.com/api/settings', 
    json={'theme': 'dark', 'notifications': True}
)

# 以不同格式访问响应内容
raw_data = response.content
text_data = response.text
json_data = response.json()

# 检查设置的 cookies
for cookie in response.cookies:
    print(f"Cookie: {cookie['name']} = {cookie['value']}")

# 向你的请求添加自定义标头
headers = [
    {'name': 'X-Custom-Header', 'value': 'my-value'},
    {'name': 'X-API-Version', 'value': '2.0'}
]

await tab.request.get('https://api.example.com/data', headers=headers)

```

**为什么这很棒：**
- **无需会话切换** - 请求自动继承浏览器 cookies
- **CORS 无缝工作** - 请求遵循浏览器安全策略  
- **现代 SPA 的完美选择** - 无缝混合 UI 自动化与 API 调用
- **身份验证变得简单** - 通过 UI 登录一次，然后调用 API
- **混合工作流** - 为每个步骤使用最佳工具（UI 或 API）

这为需要浏览器交互和 API 效率的自动化场景开启了令人难以置信的可能性！

### 使用自定义首选项完全控制浏览器！(感谢 [@LucasAlvws](https://github.com/LucasAlvws))
想要完全自定义 Chrome 的行为？**现在你可以控制一切！**<br>
新的 `browser_preferences` 系统让你可以访问数百个之前无法通过编程方式更改的内部 Chrome 设置。我们说的是远超命令行标志的深度浏览器自定义！

**可能性是无限的：**
```python
options = ChromiumOptions()

# 创建完美的自动化环境
options.browser_preferences = {
    'download': {
        'default_directory': '/tmp/downloads',
        'prompt_for_download': False,
        'directory_upgrade': True,
        'extensions_to_open': ''  # 不自动打开任何下载
    },
    'profile': {
        'default_content_setting_values': {
            'notifications': 2,        # 阻止所有通知
            'geolocation': 2,         # 阻止位置请求
            'media_stream_camera': 2, # 阻止摄像头访问
            'media_stream_mic': 2,    # 阻止麦克风访问
            'popups': 1               # 允许弹窗（对自动化有用）
        },
        'password_manager_enabled': False,  # 禁用密码提示
        'exit_type': 'Normal'              # 始终正常退出
    },
    'intl': {
        'accept_languages': 'zh-CN,zh,en-US,en',
        'charset_default': 'UTF-8'
    },
    'browser': {
        'check_default_browser': False,    # 不询问默认浏览器
        'show_update_promotion_infobar': False
    }
}

# 或使用便捷的辅助方法
options.set_default_download_directory('/tmp/downloads')
options.set_accept_languages('zh-CN,zh,en-US,en')  
options.prompt_for_download = False
```

**实际应用的强大示例：**
- **静默下载** - 无提示、无对话框，只有自动化下载
- **阻止所有干扰** - 通知、弹窗、摄像头请求，应有尽有
- **CI/CD 的完美选择** - 禁用更新检查、默认浏览器提示、崩溃报告
- **多区域测试** - 即时更改语言、时区和区域设置
- **安全加固** - 锁定权限并禁用不必要的功能
- **高级指纹控制** - 修改浏览器安装日期、参与历史和行为模式

**用于隐蔽自动化的指纹自定义：**
```python
import time

# 模拟一个已经使用过一段时间的浏览器（上次活跃时间为 7 天前）
fake_engagement_time = int(time.time()) - (7 * 24 * 60 * 60)  # 7天前

options.browser_preferences = {
    'settings': {
        'touchpad': {
            'natural_scroll': True,
        }
    },
    'profile': {
        'last_engagement_time': fake_engagement_time,
        'exit_type': 'Normal',
        'exited_cleanly': True
    },
    'newtab_page_location_override': 'https://www.google.com',
    'session': {
        'restore_on_startup': 1,  # 恢复上次会话
        'startup_urls': ['https://www.google.com']
    }
}
```

这种控制级别以前只有 Chrome 扩展开发者才能使用 - 现在它在你的自动化工具包中！

查看[文档](https://pydoll.tech/docs/zh/features/configuration/browser-preferences/)了解更多详情。

### 新的 `get_parent_element()` 方法
检索任何 WebElement 的父元素，使导航 DOM 结构更加容易：
```python
element = await tab.find(id='button')
parent = await element.get_parent_element()
```

### 新的 start_timeout 选项 (感谢 [@j0j1j2](https://github.com/j0j1j2))
添加到 ChromiumOptions 来控制浏览器启动可以花费多长时间。在较慢的机器或 CI 环境中很有用。

```python
options = ChromiumOptions()
options.start_timeout = 20  # 等待 20 秒
```

### 新的 expect_download() 上下文管理器 —— 稳健、优雅的文件下载！
还在为不稳定的下载流程、丢失的文件或混乱的事件监听而头疼吗？`tab.expect_download()` 来了：一种可靠、简洁的下载方式。

- 自动配置浏览器下载行为
- 支持自定义下载目录或临时目录（自动清理！）
- 内置超时等待，防止任务卡住
- 提供便捷句柄：读取字节/BASE64，获取 `file_path`

一个“开箱即用”的小示例：

```python
import asyncio
from pathlib import Path
from pydoll.browser import Chrome

async def download_report():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com/reports')

        target_dir = Path('/tmp/my-downloads')
        async with tab.expect_download(keep_file_at=target_dir, timeout=10) as dl:
            # 触发页面上的下载（按钮/链接等）
            await (await tab.find(text='Download latest report')).click()

            # 等待完成并读取内容
            data = await dl.read_bytes()
            print(f"已下载 {len(data)} 字节，保存至: {dl.file_path}")

asyncio.run(download_report())
```

想要“零成本清理”？不传 `keep_file_at` 即可——我们会创建临时目录，并在上下文退出后自动清理。对测试场景非常友好。

## 📦 安装

```bash
pip install pydoll-python
```

就这么简单！安装即用，马上开始自动化

## 🚀 快速上手

### 你的第一个自动化任务

让我们从一个实际例子开始：一个自动执行谷歌搜索并点击第一个结果的自动化流程。通过这个示例，你可以了解该库的工作原理，以及如何开始将日常任务自动化。

```python
import asyncio

from pydoll.browser import Chrome
from pydoll.constants import Key

async def google_search(query: str):
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://www.google.com')
        search_box = await tab.find(tag_name='textarea', name='q')
        await search_box.insert_text(query)
        await tab.keyboard.press(Key.ENTER)
        await (await tab.find(
            tag_name='h3',
            text='autoscrape-labs/pydoll',
            timeout=10,
        )).click()
        await tab.find(id='repository-container-header', timeout=10)

asyncio.run(google_search('pydoll site:github.com'))
```

无需任何配置，只需一个简单脚本，我们就能完成一次完整的谷歌搜索！
好了，现在让我们看看如何从网页中提取数据，依然沿用之前的示例。

假设在以下代码中，我们已经进入了 Pydoll 项目页面。我们需要提取以下信息：

- 项目描述
- 星标数量
- Fork 数量
- Issue 数量
- Pull Request 数量

如果想要获取项目描述，我们将使用 XPath 查询。你可以查阅相关文档，学习如何构建自己的查询语句。

```python
description = await (await tab.query(
    '//h2[contains(text(), "About")]/following-sibling::p',
    timeout=10,
)).text
```

下面让我们来理解这条查询语句的作用：

1. `//h2[contains(text(), "About")]` - 选择第一个包含"About"的 `<h2>` 标签
2. `/following-sibling::p` - 选择第一个在`<h2>` 标签之后的`<p>`标签

然后你可以获取到剩下的数据：

```python
number_of_stars = await (await tab.find(
    id='repo-stars-counter-star'
)).text

number_of_forks = await (await tab.find(
    id='repo-network-counter'
)).text
number_of_issues = await (await tab.find(
    id='issues-repo-tab-count',
)).text
number_of_pull_requests = await (await tab.find(
    id='pull-requests-repo-tab-count',
)).text

data = {
    'description': description,
    'number_of_stars': number_of_stars,
    'number_of_forks': number_of_forks,
    'number_of_issues': number_of_issues,
    'number_of_pull_requests': number_of_pull_requests,
}
print(data)

```

下图展示了本次自动化任务的执行速度与结果。
（为演示需要，浏览器界面未显示。）

![google_search](./docs/images/google-search-example.gif)


短短5秒内，我们就成功提取了所需数据！  
这就是使用Pydoll进行自动化所能达到的速度。

### 更多复杂的例子

接下来我们来看一个你可能经常遇到的场景：类似Cloudflare的验证码防护。  
Pydoll提供了相应的处理方法，但需要说明的是，正如前文所述，其有效性会受到多种因素影响。  
下面的代码展示了一个完整的Cloudflare验证码处理示例。

```python
import asyncio

from pydoll.browser import Chrome
from pydoll.constants import By

async def cloudflare_example():
    async with Chrome() as browser:
        tab = await browser.start()
        async with tab.expect_and_bypass_cloudflare_captcha():
            await tab.go_to('https://2captcha.com/demo/cloudflare-turnstile')
        print('Captcha handled, continuing...')
        await asyncio.sleep(5)  # just to see the result :)

asyncio.run(cloudflare_example())

```

执行结果如下：

![cloudflare_example](./docs/images/cloudflare-example.gif)


仅需数行代码，我们就成功攻克了最棘手的验证码防护之一。
而这仅仅是Pydoll所提供的众多强大功能之一。但这还远不是全部！


### 自定义配置

有时我们需要对浏览器进行更精细的控制。Pydoll提供了灵活的配置方式来实现这一点。下面我们来看具体示例：


```python
import asyncio

from pydoll.browser import Chrome
from pydoll.browser.options import ChromiumOptions as Options

async def custom_automation():
    # Configure browser options
    options = Options()
    options.add_argument('--proxy-server=username:password@ip:port')
    options.add_argument('--window-size=1920,1080')
    options.binary_location = '/path/to/your/browser'
    options.start_timeout = 20

    async with Chrome(options=options) as browser:
        tab = await browser.start()
        # Your automation code here
        await tab.go_to('https://example.com')
        # The browser is now using your custom settings

asyncio.run(custom_automation())
```

本示例中，我们配置浏览器使用代理服务器，并设置窗口分辨率为1920x1080。此外，还指定了Chrome二进制文件的自定义路径——适用于您的安装位置与常规默认路径不同的情况。

## ⚡ 高级功能

Pydoll提供了一系列高级特性满足高端玩家的需求。


### 高级元素定位

我们提供多种页面元素定位方式。无论您偏好哪种方法，都能找到适合您的解决方案：

```python
import asyncio
from pydoll.browser import Chrome

async def element_finding_examples():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com')

        # Find by attributes (most intuitive)
        submit_btn = await tab.find(
            tag_name='button',
            class_name='btn-primary',
            text='Submit'
        )
        # Find by ID
        username_field = await tab.find(id='username')
        # Find multiple elements
        all_links = await tab.find(tag_name='a', find_all=True)
        # CSS selectors and XPath
        nav_menu = await tab.query('nav.main-menu')
        specific_item = await tab.query('//div[@data-testid="item-123"]')
        # With timeout and error handling
        delayed_element = await tab.find(
            class_name='dynamic-content',
            timeout=10,
            raise_exc=False  # Returns None if not found
        )
        # Advanced: Custom attributes
        custom_element = await tab.find(
            data_testid='submit-button',
            aria_label='Submit form'
        )

asyncio.run(element_finding_examples())
```

find 方法更为友好。我们可以通过常见属性（如 id、tag_name、class_name 等）进行元素查找，甚至支持自定义属性（例如 data-testid）。

如果这些基础方式仍不能满足需求，还可使用 query 方法，通过 CSS 选择器、XPath 查询语句等多种方式进行元素定位。Pydoll 会自动识别当前使用的查询类型。

### 并发自动化

Pydoll 的一大优势在于其基于异步实现的多任务并行处理能力。我们可以同时自动化操作多个浏览器标签页！下面来看具体示例：

```python
import asyncio
from pydoll.browser import Chrome

async def scrape_page(url, tab):
    await tab.go_to(url)
    title = await tab.execute_script('return document.title')
    links = await tab.find(tag_name='a', find_all=True)
    return {
        'url': url,
        'title': title,
        'link_count': len(links)
    }

async def concurrent_scraping():
    browser = Chrome()
    tab_google = await browser.start()
    tab_duckduckgo = await browser.new_tab()
    tasks = [
        scrape_page('https://google.com/', tab_google),
        scrape_page('https://duckduckgo.com/', tab_duckduckgo)
    ]
    results = await asyncio.gather(*tasks)
    print(results)
    await browser.stop()

asyncio.run(concurrent_scraping())
```

下方展示令人惊叹的执行速度：

![concurrent_example](./docs/images/concurrent-example.gif)


在这个例子中，我们成功实现了同时对两个页面的数据提取。
还有更多强大功能！响应式自动化的事件系统、请求拦截与修改等等。赶快查阅文档！

## 🔧 快速问题排查

**找不到浏览器？**
```python
from pydoll.browser import Chrome
from pydoll.browser.options import ChromiumOptions

options = ChromiumOptions()
options.binary_location = '/path/to/your/chrome'
browser = Chrome(options=options)
```

**浏览器在 FailedToStartBrowser 错误后启动？**
```python
from pydoll.browser import Chrome
from pydoll.browser.options import ChromiumOptions

options = ChromiumOptions()
options.start_timeout = 20  # 默认是 10 秒

browser = Chrome(options=options)
```

**需要代理？**
```python
options.add_argument('--proxy-server=your-proxy:port')
```

**在 Docker 中运行？**
```python
options.add_argument('--no-sandbox')
options.add_argument('--disable-dev-shm-usage')
```

## 📚 文档

Pydoll 的完整文档、详细示例以及对所有功能的深入探讨可以通过以下链接访问：[官方文档](https://autoscrape-labs.github.io/pydoll/)。

文档包含以下部分：
- **快速上手指南** - 分步教程
- **API 参考** - 完整的方法文档
- **高级技巧** - 网络拦截、事件处理、性能优化

> 此 README 的英文版本在[这里](README.md)。

## 🤝 贡献

我们很乐意看到您的帮助让 Pydoll 变得更好！查看我们的[贡献指南](CONTRIBUTING.md)开始贡献。无论是修复错误、添加功能还是改进文档 - 所有贡献都受欢迎！

请确保：
- 为新功能或错误修复编写测试
- 遵循代码风格和约定
- 对拉取请求使用约定式提交
- 在提交前运行 lint 检查和测试

## 💖 支持我的工作

如果您发现 Pydoll 有用，请考虑[在 GitHub 上支持我](https://github.com/sponsors/thalissonvs)。  
您将获得独家优惠，如优先支持、自定义功能等等！

现在无法赞助？没问题，您仍然可以通过以下方式提供很大帮助：
- 为仓库加星
- 在社交媒体上分享
- 撰写文章或教程
- 提供反馈或报告问题

每一点支持都很重要！

## 💬 传播消息

如果 Pydoll 为您节省了时间、心理健康或者拯救了一个键盘免于被砸，请给它一个 ⭐，分享它，或者告诉您奇怪的开发者朋友。

## 📄 许可证

Pydoll 在 [MIT 许可证](LICENSE) 下获得许可。

<p align="center">
  <b>Pydoll</b> — 让浏览器自动化变得神奇！
</p>


================================================
FILE: SPONSORS.md
================================================
# Sponsors

Pydoll is supported by these amazing sponsors. Their contributions help keep the project maintained and growing.

## Top Sponsors

<a href="https://substack.thewebscraping.club/p/pydoll-webdriver-scraping?utm_source=github&utm_medium=repo&utm_campaign=pydoll">
<img alt="The Web Scraping Club" src="public/images/banner-the-webscraping-club.png" />
</a>

Read a full review of Pydoll on **[The Web Scraping Club](https://substack.thewebscraping.club/p/pydoll-webdriver-scraping?utm_source=github&utm_medium=repo&utm_campaign=pydoll)**, the #1 newsletter dedicated to web scraping.

---

## Sponsors

<a href="https://www.thordata.com/?ls=github&lk=pydoll">
<img alt="Thordata" src="public/images/thordata.png" />
</a>

Pydoll is proudly sponsored by **[Thordata](https://www.thordata.com/?ls=github&lk=pydoll)**: a residential proxy network built for serious web scraping and automation. With **190+ real residential and ISP locations**, fully encrypted connections, and infrastructure optimized for high-performance workflows, Thordata is an excellent choice for scaling your Pydoll automations.

**[Sign up through our link](https://www.thordata.com/?ls=github&lk=pydoll)** to support the project and get **1GB free** to get started.

---

<a href="https://dashboard.capsolver.com/passport/register?inviteCode=WPhTbOsbXEpc">
<img alt="CapSolver" src="public/images/capsolver.jpeg" />
</a>

Pydoll excels at behavioral evasion, but it doesn't solve captchas. That's where **[CapSolver](https://dashboard.capsolver.com/passport/register?inviteCode=WPhTbOsbXEpc)** comes in: an AI-powered service that handles reCAPTCHA, Cloudflare challenges, and more, and integrates seamlessly with your automation workflows.

**[Register with our invite code](https://dashboard.capsolver.com/passport/register?inviteCode=WPhTbOsbXEpc)** and use code **PYDOLL** to get an extra **6% balance bonus**.

---

Interested in sponsoring Pydoll? [Become a sponsor](https://github.com/sponsors/thalissonvs).


================================================
FILE: codecov.yml
================================================
coverage:
  status:
    project: 
      default:
        target: 90%
        threshold: 0%
        base: auto 

================================================
FILE: cz.yaml
================================================
---
commitizen:
  name: cz_conventional_commits
  tag_format: $version
  version: 2.21.3


================================================
FILE: docs/en/api/browser/chrome.md
================================================
# Chrome Browser
 
::: pydoll.browser.chromium.Chrome
    options:
      show_root_heading: true
      show_source: false
      heading_level: 2 

================================================
FILE: docs/en/api/browser/edge.md
================================================
# Edge Browser
 
::: pydoll.browser.chromium.Edge
    options:
      show_root_heading: true
      show_source: false
      heading_level: 2 

================================================
FILE: docs/en/api/browser/managers.md
================================================
# Browser Managers

The managers module provides specialized classes for managing different aspects of browser lifecycle and configuration.

## Overview

Browser managers handle specific responsibilities in browser automation:

::: pydoll.browser.managers
    options:
      show_root_heading: true
      show_source: false
      heading_level: 2
      filters:
        - "!^_"
        - "!^__"

## Manager Classes

### Browser Process Manager
Manages the browser process lifecycle, including starting, stopping, and monitoring browser processes.

::: pydoll.browser.managers.browser_process_manager
    options:
      show_root_heading: true
      show_source: false
      heading_level: 3

### Browser Options Manager
Handles browser configuration options and command-line arguments.

::: pydoll.browser.managers.browser_options_manager
    options:
      show_root_heading: true
      show_source: false
      heading_level: 3

### Proxy Manager
Manages proxy configuration and authentication for browser instances.

::: pydoll.browser.managers.proxy_manager
    options:
      show_root_heading: true
      show_source: false
      heading_level: 3

### Temporary Directory Manager
Handles creation and cleanup of temporary directories used by browser instances.

::: pydoll.browser.managers.temp_dir_manager
    options:
      show_root_heading: true
      show_source: false
      heading_level: 3

## Usage

Managers are typically used internally by browser classes like `Chrome` and `Edge`. They provide modular functionality that can be composed together:

```python
from pydoll.browser.managers.proxy_manager import ProxyManager
from pydoll.browser.managers.temp_dir_manager import TempDirManager

# Managers are used internally by browser classes
# Direct usage is for advanced scenarios only
proxy_manager = ProxyManager()
temp_manager = TempDirManager()
```

!!! note "Internal Usage"
    These managers are primarily used internally by the browser classes. Direct usage is recommended only for advanced scenarios or when extending the library. 

================================================
FILE: docs/en/api/browser/options.md
================================================
# Browser Options

## ChromiumOptions

::: pydoll.browser.options.ChromiumOptions
    options:
      show_root_heading: true
      show_source: false
      heading_level: 3

## Options Interface

::: pydoll.browser.interfaces.Options
    options:
      show_root_heading: true
      show_source: false
      heading_level: 3

## BrowserOptionsManager Interface

::: pydoll.browser.interfaces.BrowserOptionsManager
    options:
      show_root_heading: true
      show_source: false
      heading_level: 3 

================================================
FILE: docs/en/api/browser/requests.md
================================================
# Browser Requests

The requests module provides HTTP request capabilities within the browser context, enabling seamless API calls that inherit the browser's session state, cookies, and authentication.

## Overview

The browser requests module offers a `requests`-like interface for making HTTP calls directly within the browser's JavaScript context. This approach provides several advantages over traditional HTTP libraries:

- **Session inheritance**: Automatic cookie, authentication, and CORS handling
- **Browser context**: Requests execute in the same security context as the page
- **No session juggling**: Eliminate the need to transfer cookies and tokens between automation and API calls
- **SPA compatibility**: Perfect for Single Page Applications with complex authentication flows

## Request Class

The main interface for making HTTP requests within the browser context.

::: pydoll.browser.requests.request.Request
    options:
      show_root_heading: true
      show_source: false
      heading_level: 3
      group_by_category: true
      members_order: source
      filters:
        - "!^__"

## Response Class

Represents the response from HTTP requests, providing a familiar interface similar to the `requests` library.

::: pydoll.browser.requests.response.Response
    options:
      show_root_heading: true
      show_source: false
      heading_level: 3
      group_by_category: true
      members_order: source
      filters:
        - "!^__"

## Usage Examples

### Basic HTTP Methods

```python
from pydoll.browser.chromium import Chrome

async with Chrome() as browser:
    tab = await browser.start()
    await tab.go_to("https://api.example.com")
    
    # GET request
    response = await tab.request.get("/users/123")
    user_data = await response.json()
    
    # POST request
    response = await tab.request.post("/users", json={
        "name": "John Doe",
        "email": "john@example.com"
    })
    
    # PUT request with headers
    response = await tab.request.put("/users/123", 
        json={"name": "Jane Doe"},
        headers={"Authorization": "Bearer token123"}
    )
```

### Response Handling

```python
# Check response status
if response.ok:
    print(f"Success: {response.status_code}")
else:
    print(f"Error: {response.status_code}")
    response.raise_for_status()  # Raises HTTPError for 4xx/5xx

# Access response data
text_data = response.text
json_data = await response.json()
raw_bytes = response.content

# Inspect headers and cookies
print("Response headers:", response.headers)
print("Request headers:", response.request_headers)
for cookie in response.cookies:
    print(f"Cookie: {cookie.name}={cookie.value}")
```

### Advanced Features

```python
# Request with custom headers and parameters
response = await tab.request.get("/search", 
    params={"q": "python", "limit": 10},
    headers={
        "User-Agent": "Custom Bot 1.0",
        "Accept": "application/json"
    }
)

# File upload simulation
response = await tab.request.post("/upload",
    data={"description": "Test file"},
    files={"file": ("test.txt", "file content", "text/plain")}
)

# Form data submission
response = await tab.request.post("/login",
    data={"username": "user", "password": "pass"}
)
```

## Integration with Tab

The request functionality is accessed through the `tab.request` property, which exposes a single `Request` instance per tab (each tab has its own, bound to that tab's context):

```python
# Each tab has its own request instance
tab1 = await browser.get_tab(0)
tab2 = await browser.new_tab()

# These are separate Request instances
request1 = tab1.request  # Request bound to tab1
request2 = tab2.request  # Request bound to tab2

# Requests inherit the tab's context
await tab1.go_to("https://site1.com")
await tab2.go_to("https://site2.com")

# These requests will have different cookie/session contexts
response1 = await tab1.request.get("/api/data")  # Uses site1.com cookies
response2 = await tab2.request.get("/api/data")  # Uses site2.com cookies
```

!!! tip "Hybrid Automation"
    This module is particularly powerful for hybrid automation scenarios where you need to combine UI interactions with API calls. For example, log in through the UI, then use the authenticated session for API calls without manually handling cookies or tokens.

================================================
FILE: docs/en/api/browser/tab.md
================================================
# Tab

::: pydoll.browser.tab.Tab
    options:
      show_root_heading: true
      show_source: false
      heading_level: 2

================================================
FILE: docs/en/api/commands/browser.md
================================================
# Browser Commands

Browser commands provide low-level control over browser instances and their configuration.

## Overview

The browser commands module handles browser-level operations such as version information, target management, and browser-wide settings.

::: pydoll.commands.browser_commands
    options:
      show_root_heading: true
      show_source: false
      heading_level: 2
      filters:
        - "!^_"
        - "!^__"

## Usage

Browser commands are typically used internally by browser classes to manage browser instances:

```python
from pydoll.commands.browser_commands import get_version
from pydoll.connection.connection_handler import ConnectionHandler

# Get browser version information
connection = ConnectionHandler()
version_info = await get_version(connection)
```

## Available Commands

The browser commands module provides functions for:

- Getting browser version and user agent information
- Managing browser targets (tabs, windows)
- Controlling browser-wide settings and permissions
- Handling browser lifecycle events

!!! note "Internal Usage"
    These commands are primarily used internally by the `Chrome` and `Edge` browser classes. Direct usage is recommended only for advanced scenarios. 

================================================
FILE: docs/en/api/commands/dom.md
================================================
# DOM Commands

DOM commands provide comprehensive functionality for interacting with the Document Object Model of web pages.

## Overview

The DOM commands module is one of the most important modules in Pydoll, providing all the functionality needed to find, interact with, and manipulate HTML elements on web pages.

::: pydoll.commands.dom_commands
    options:
      show_root_heading: true
      show_source: false
      heading_level: 2
      filters:
        - "!^_"
        - "!^__"

## Usage

DOM commands are used extensively by the `WebElement` class and element finding methods:

```python
from pydoll.commands.dom_commands import query_selector, get_attributes
from pydoll.connection.connection_handler import ConnectionHandler

# Find element and get its attributes
connection = ConnectionHandler()
node_id = await query_selector(connection, selector="#username")
attributes = await get_attributes(connection, node_id=node_id)
```

## Key Functionality

The DOM commands module provides functions for:

### Element Finding
- `query_selector()` - Find single element by CSS selector
- `query_selector_all()` - Find multiple elements by CSS selector
- `get_document()` - Get the document root node

### Element Interaction
- `click_element()` - Click on elements
- `focus_element()` - Focus elements
- `set_attribute_value()` - Set element attributes
- `get_attributes()` - Get element attributes

### Element Information
- `get_box_model()` - Get element positioning and dimensions
- `describe_node()` - Get detailed element information
- `get_outer_html()` - Get element HTML content

### DOM Manipulation
- `remove_node()` - Remove elements from DOM
- `set_node_value()` - Set element values
- `request_child_nodes()` - Get child elements

!!! tip "High-Level APIs"
    While these commands provide powerful low-level access, most users should use the higher-level `WebElement` class methods like `click()`, `type_text()`, and `get_attribute()` which use these commands internally. 

================================================
FILE: docs/en/api/commands/fetch.md
================================================
# Fetch Commands

Fetch commands provide advanced network request handling and interception capabilities using the Chrome DevTools Protocol (CDP) Fetch domain.

## Overview

The fetch commands module enables sophisticated network request management, including request modification, response interception, and authentication handling.

::: pydoll.commands.fetch_commands
    options:
      show_root_heading: true
      show_source: false
      heading_level: 2
      filters:
        - "!^_"
        - "!^__"

## Usage

Fetch commands are used for advanced network interception and request handling:

```python
from pydoll.commands.fetch_commands import enable, request_paused, continue_request
from pydoll.connection.connection_handler import ConnectionHandler

# Enable fetch domain
connection = ConnectionHandler()
await enable(connection, patterns=[{
    "urlPattern": "*",
    "requestStage": "Request"
}])

# Handle paused requests
async def handle_paused_request(request_id, request):
    # Modify request or continue as-is
    await continue_request(connection, request_id=request_id)
```

## Key Functionality

The fetch commands module provides functions for:

### Request Interception
- `enable()` - Enable fetch domain with patterns
- `disable()` - Disable fetch domain
- `continue_request()` - Continue intercepted requests
- `fail_request()` - Fail requests with specific errors

### Request Modification
- Modify request headers
- Change request URLs
- Alter request methods (GET, POST, etc.)
- Modify request bodies

### Response Handling
- `fulfill_request()` - Provide custom responses
- `get_response_body()` - Get response content
- Response header modification
- Response status code control

### Authentication
- `continue_with_auth()` - Handle authentication challenges
- Basic authentication support
- Custom authentication flows

## Advanced Features

### Pattern-Based Interception
```python
# Intercept specific URL patterns
patterns = [
    {"urlPattern": "*/api/*", "requestStage": "Request"},
    {"urlPattern": "*.js", "requestStage": "Response"},
    {"urlPattern": "https://example.com/*", "requestStage": "Request"}
]

await enable(connection, patterns=patterns)
```

### Request Modification
```python
# Modify intercepted requests
async def modify_request(request_id, request):
    # Add authentication header
    headers = request.headers.copy()
    headers["Authorization"] = "Bearer token123"
    
    # Continue with modified headers
    await continue_request(
        connection,
        request_id=request_id,
        headers=headers
    )
```

### Response Mocking
```python
# Mock API responses
await fulfill_request(
    connection,
    request_id=request_id,
    response_code=200,
    response_headers=[
        {"name": "Content-Type", "value": "application/json"},
        {"name": "Access-Control-Allow-Origin", "value": "*"}
    ],
    body='{"status": "success", "data": {"mocked": true}}'
)
```

### Authentication Handling
```python
# Handle authentication challenges
await continue_with_auth(
    connection,
    request_id=request_id,
    auth_challenge_response={
        "response": "ProvideCredentials",
        "username": "user",
        "password": "pass"
    }
)
```

## Request Stages

Fetch commands can intercept requests at different stages:

| Stage | Description | Use Cases |
|-------|-------------|-----------|
| Request | Before request is sent | Modify headers, URL, method |
| Response | After response received | Mock responses, modify content |

## Error Handling

```python
# Fail requests with specific errors
await fail_request(
    connection,
    request_id=request_id,
    error_reason="ConnectionRefused"  # or "AccessDenied", "TimedOut", etc.
)
```

## Integration with Network Commands

Fetch commands work alongside network commands but provide more granular control:

- **Network Commands**: Broader network monitoring and control
- **Fetch Commands**: Specific request/response interception and modification

!!! tip "Performance Considerations"
    Fetch interception can impact page loading performance. Use specific URL patterns and disable interception when it is not needed to minimize overhead.

================================================
FILE: docs/en/api/commands/index.md
================================================
# Commands Overview

The Commands module provides low-level, typed interfaces for interacting with Chrome DevTools Protocol (CDP) domains. Each command module corresponds to a specific CDP domain and provides methods to execute various browser operations.

## Available Command Modules

### Browser Commands
- **Module**: `browser_commands.py`
- **Purpose**: Browser-level operations and window management
- **Documentation**: [Browser Commands](browser.md)

### DOM Commands
- **Module**: `dom_commands.py`
- **Purpose**: DOM tree manipulation and element operations
- **Documentation**: [DOM Commands](dom.md)

### Input Commands
- **Module**: `input_commands.py`
- **Purpose**: Input event simulation (keyboard, mouse, touch)
- **Documentation**: [Input Commands](input.md)

### Network Commands
- **Module**: `network_commands.py`
- **Purpose**: Network monitoring and request interception
- **Documentation**: [Network Commands](network.md)

### Page Commands
- **Module**: `page_commands.py`
- **Purpose**: Page lifecycle management and navigation
- **Documentation**: [Page Commands](page.md)

### Runtime Commands
- **Module**: `runtime_commands.py`
- **Purpose**: JavaScript execution and runtime management
- **Documentation**: [Runtime Commands](runtime.md)

### Storage Commands
- **Module**: `storage_commands.py`
- **Purpose**: Browser storage access (cookies, local storage, etc.)
- **Documentation**: [Storage Commands](storage.md)

### Target Commands
- **Module**: `target_commands.py`
- **Purpose**: Target management and tab operations
- **Documentation**: [Target Commands](target.md)

### Fetch Commands
- **Module**: `fetch_commands.py`
- **Purpose**: Network request interception and modification
- **Documentation**: [Fetch Commands](fetch.md)

## Usage Pattern

Commands are typically accessed through the browser or tab instances:

```python
from pydoll.browser.chromium import Chrome

# Initialize browser
browser = Chrome()
await browser.start()

# Get active tab
tab = await browser.get_active_tab()

# Use commands through the tab
await tab.go_to("https://example.com")
element = await tab.find(id="button")
await element.click()
```

## Command Structure

Each command module follows a consistent pattern:
- **Static methods**: For direct command execution
- **Type hints**: Full type safety with protocol types
- **Error handling**: Proper exception handling for CDP errors
- **Documentation**: Comprehensive docstrings with examples 

================================================
FILE: docs/en/api/commands/input.md
================================================
# Input Commands

Input commands handle mouse and keyboard interactions, providing human-like input simulation.

## Overview

The input commands module provides functionality for simulating user input including mouse movements, clicks, keyboard typing, and key presses.

::: pydoll.commands.input_commands
    options:
      show_root_heading: true
      show_source: false
      heading_level: 2
      filters:
        - "!^_"
        - "!^__"

## Usage

Input commands are used by element interaction methods and can be used directly for advanced input scenarios:

```python
from pydoll.commands.input_commands import dispatch_mouse_event, dispatch_key_event
from pydoll.connection.connection_handler import ConnectionHandler

# Simulate mouse click
connection = ConnectionHandler()
await dispatch_mouse_event(
    connection, 
    type="mousePressed", 
    x=100, 
    y=200, 
    button="left"
)

# Simulate a key press (Enter)
await dispatch_key_event(
    connection,
    type="keyDown",
    key="Enter"
)
```

## Key Functionality

The input commands module provides functions for:

### Mouse Events
- `dispatch_mouse_event()` - Mouse clicks, movements, and wheel events
- Mouse button states (left, right, middle)
- Coordinate-based positioning
- Drag and drop operations

### Keyboard Events
- `dispatch_key_event()` - Key press and release events
- `insert_text()` - Direct text insertion
- Special key handling (Enter, Tab, Arrow keys, etc.)
- Modifier keys (Ctrl, Alt, Shift)

### Touch Events
- Touch screen simulation
- Multi-touch gestures
- Touch coordinates and pressure

## Human-like Behavior

The input commands support human-like behavior patterns:

- Natural mouse movement curves
- Realistic typing speeds and patterns
- Random micro-delays between actions
- Pressure-sensitive touch events

!!! tip "Element Methods"
    For most use cases, use the higher-level element methods like `element.click()` and `element.type_text()` which provide a more convenient API and handle common scenarios automatically. 

================================================
FILE: docs/en/api/commands/network.md
================================================
# Network Commands

Network commands provide comprehensive control over network requests, responses, and browser networking behavior.

## Overview

The network commands module enables request interception, response modification, cookie management, and network monitoring capabilities.

::: pydoll.commands.network_commands
    options:
      show_root_heading: true
      show_source: false
      heading_level: 2
      filters:
        - "!^_"
        - "!^__"

## Usage

Network commands are used for advanced scenarios like request interception and network monitoring:

```python
from pydoll.commands.network_commands import enable, set_request_interception
from pydoll.connection.connection_handler import ConnectionHandler

# Enable network monitoring
connection = ConnectionHandler()
await enable(connection)

# Enable request interception
await set_request_interception(connection, patterns=[{"urlPattern": "*"}])
```

## Key Functionality

The network commands module provides functions for:

### Request Management
- `enable()` / `disable()` - Enable/disable network monitoring
- `set_request_interception()` - Intercept and modify requests
- `continue_intercepted_request()` - Continue or modify intercepted requests
- `get_request_post_data()` - Get request body data

### Response Handling
- `get_response_body()` - Get response content
- `fulfill_request()` - Provide custom responses
- `fail_request()` - Simulate network failures

### Cookie Management
- `get_cookies()` - Get browser cookies
- `set_cookies()` - Set browser cookies
- `delete_cookies()` - Delete specific cookies
- `clear_browser_cookies()` - Clear all cookies

### Cache Control
- `clear_browser_cache()` - Clear browser cache
- `set_cache_disabled()` - Disable browser cache
- `get_response_body_for_interception()` - Get the response body of an intercepted request

### Security & Headers
- `set_user_agent_override()` - Override user agent
- `set_extra_http_headers()` - Add custom headers
- `emulate_network_conditions()` - Simulate network conditions

## Advanced Use Cases

### Request Interception
```python
# Intercept and modify requests
await set_request_interception(connection, patterns=[
    {"urlPattern": "*/api/*", "requestStage": "Request"}
])

# Handle intercepted request
async def handle_request(request):
    if "api/login" in request.url:
        # Modify request headers
        headers = request.headers.copy()
        headers["Authorization"] = "Bearer token"
        await continue_intercepted_request(
            connection, 
            request_id=request.request_id,
            headers=headers
        )
```

### Response Mocking
```python
# Mock API responses
await fulfill_request(
    connection,
    request_id=request_id,
    response_code=200,
    response_headers={"Content-Type": "application/json"},
    body='{"status": "success"}'
)
```

!!! warning "Performance Impact"
    Network interception can impact page loading performance. Use it selectively and disable it when it is not needed.

================================================
FILE: docs/en/api/commands/page.md
================================================
# Page Commands

Page commands handle page navigation, lifecycle events, and page-level operations.

## Overview

The page commands module provides functionality for navigating between pages, managing page lifecycle, handling JavaScript execution, and controlling page behavior.

::: pydoll.commands.page_commands
    options:
      show_root_heading: true
      show_source: false
      heading_level: 2
      filters:
        - "!^_"
        - "!^__"

## Usage

Page commands are used extensively by the `Tab` class for navigation and page management:

```python
from pydoll.commands.page_commands import navigate, reload, enable
from pydoll.connection.connection_handler import ConnectionHandler

# Navigate to a URL
connection = ConnectionHandler()
await enable(connection)  # Enable page events
await navigate(connection, url="https://example.com")

# Reload the page
await reload(connection)
```

## Key Functionality

The page commands module provides functions for:

### Navigation
- `navigate()` - Navigate to URLs
- `reload()` - Reload current page
- `go_back()` - Navigate back in history
- `go_forward()` - Navigate forward in history
- `stop_loading()` - Stop page loading

### Page Lifecycle
- `enable()` / `disable()` - Enable/disable page events
- `get_frame_tree()` - Get page frame structure
- `get_navigation_history()` - Get navigation history

### Content Management
- `get_resource_content()` - Get page resource content
- `search_in_resource()` - Search within page resources
- `set_document_content()` - Set page HTML content

### Screenshots & PDF
- `capture_screenshot()` - Take page screenshots
- `print_to_pdf()` - Generate PDF from page
- `capture_snapshot()` - Capture page snapshots

### JavaScript Execution
- `add_script_to_evaluate_on_new_document()` - Add startup scripts
- `remove_script_to_evaluate_on_new_document()` - Remove startup scripts

### Page Settings
- `set_lifecycle_events_enabled()` - Control lifecycle events
- `set_ad_blocking_enabled()` - Enable/disable ad blocking
- `set_bypass_csp()` - Bypass Content Security Policy

## Advanced Features

### Frame Management
```python
# Get all frames in the page
frame_tree = await get_frame_tree(connection)
for frame in frame_tree.child_frames:
    print(f"Frame: {frame.frame.url}")
```

### Resource Interception
```python
# Get resource content
content = await get_resource_content(
    connection, 
    frame_id=frame_id, 
    url="https://example.com/script.js"
)
```

### Page Events
The page commands work with various page events:
- `Page.loadEventFired` - Page load completed
- `Page.domContentEventFired` - DOM content loaded
- `Page.frameNavigated` - Frame navigation
- `Page.frameStartedLoading` - Frame loading started

!!! tip "Tab Class Integration"
    Most page operations are available through the `Tab` class methods like `tab.go_to()`, `tab.reload()`, and `tab.screenshot()` which provide a more convenient API. 

================================================
FILE: docs/en/api/commands/runtime.md
================================================
# Runtime Commands

Runtime commands provide JavaScript execution capabilities and runtime environment management.

## Overview

The runtime commands module enables JavaScript code execution, object inspection, and runtime environment control within browser contexts.

::: pydoll.commands.runtime_commands
    options:
      show_root_heading: true
      show_source: false
      heading_level: 2
      filters:
        - "!^_"
        - "!^__"

## Usage

Runtime commands are used for JavaScript execution and runtime management:

```python
from pydoll.commands.runtime_commands import evaluate, enable
from pydoll.connection.connection_handler import ConnectionHandler

# Enable runtime events
connection = ConnectionHandler()
await enable(connection)

# Execute JavaScript
result = await evaluate(
    connection, 
    expression="document.title",
    return_by_value=True
)
print(result.value)  # Page title
```

## Key Functionality

The runtime commands module provides functions for:

### JavaScript Execution
- `evaluate()` - Execute JavaScript expressions
- `call_function_on()` - Call functions on objects
- `compile_script()` - Compile JavaScript for reuse
- `run_script()` - Run compiled scripts

### Object Management
- `get_properties()` - Get object properties
- `release_object()` - Release object references
- `release_object_group()` - Release object groups

### Runtime Control
- `enable()` / `disable()` - Enable/disable runtime events
- `discard_console_entries()` - Clear console entries
- `set_custom_object_formatter_enabled()` - Enable custom formatters

### Exception Handling
- `set_async_call_stack_depth()` - Set call stack depth
- Exception capture and reporting
- Error object inspection

## Advanced Usage

### Complex JavaScript Execution
```python
# Execute complex JavaScript with error handling
script = """
(() => {
    try {
        const elements = document.querySelectorAll('.item');
        return Array.from(elements).map(el => ({
            text: el.textContent,
            href: el.href
        }));
    } catch (error) {
        return { error: error.message };
    }
})()
"""

result = await evaluate(
    connection,
    expression=script,
    return_by_value=True,
    await_promise=True
)
```

### Object Inspection
```python
# Get detailed object properties
properties = await get_properties(
    connection,
    object_id=object_id,
    own_properties=True,
    accessor_properties_only=False
)

for prop in properties:
    print(f"{prop.name}: {prop.value}")
```

### Console Integration
Runtime commands integrate with browser console:
- Console messages and errors
- Console API method calls
- Custom console formatters

!!! note "Performance Considerations"
    Each runtime command is a round trip over the DevTools connection, so executing JavaScript this way is slower than code running natively in the page. For complex operations, prefer one larger script over many small calls.

================================================
FILE: docs/en/api/commands/storage.md
================================================
# Storage Commands

Storage commands provide comprehensive browser storage management including cookies, localStorage, sessionStorage, and IndexedDB.

## Overview

The storage commands module enables management of all browser storage mechanisms, providing functionality for data persistence and retrieval.

::: pydoll.commands.storage_commands
    options:
      show_root_heading: true
      show_source: false
      heading_level: 2
      filters:
        - "!^_"
        - "!^__"

## Usage

Storage commands are used for managing browser storage across different mechanisms:

```python
from pydoll.commands.storage_commands import get_cookies, set_cookies, clear_data_for_origin
from pydoll.connection.connection_handler import ConnectionHandler

# Get cookies for a domain
connection = ConnectionHandler()
cookies = await get_cookies(connection, urls=["https://example.com"])

# Set a new cookie
await set_cookies(connection, cookies=[{
    "name": "session_id",
    "value": "abc123",
    "domain": "example.com",
    "path": "/",
    "httpOnly": True,
    "secure": True
}])

# Clear all storage for an origin
await clear_data_for_origin(
    connection,
    origin="https://example.com",
    storage_types="all"
)
```

## Key Functionality

The storage commands module provides functions for:

### Cookie Management
- `get_cookies()` - Get cookies by URL or domain
- `set_cookies()` - Set new cookies
- `delete_cookies()` - Delete specific cookies
- `clear_cookies()` - Clear all cookies

### Local Storage
- `get_dom_storage_items()` - Get localStorage items
- `set_dom_storage_item()` - Set localStorage item
- `remove_dom_storage_item()` - Remove localStorage item
- `clear_dom_storage()` - Clear localStorage

### Session Storage
- Session storage operations (similar to localStorage)
- Session-specific data management
- Tab-isolated storage

### IndexedDB
- `get_database_names()` - Get IndexedDB databases
- `request_database()` - Access database structure
- `request_data()` - Query database data
- `clear_object_store()` - Clear object stores

### Cache Storage
- `request_cache_names()` - Get cache names
- `request_cached_response()` - Get cached responses
- `delete_cache()` - Delete cache entries

### Application Cache (Deprecated)
- Legacy application cache support
- Manifest-based caching

## Advanced Features

### Bulk Operations
```python
# Clear all storage types for multiple origins
origins = ["https://example.com", "https://api.example.com"]
for origin in origins:
    await clear_data_for_origin(
        connection,
        origin=origin,
        storage_types="cookies,local_storage,session_storage,indexeddb"
    )
```

### Storage Quotas
```python
# Get storage quota information
quota_info = await get_usage_and_quota(connection, origin="https://example.com")
print(f"Used: {quota_info.usage} bytes")
print(f"Quota: {quota_info.quota} bytes")
```

### Cross-Origin Storage
```python
# Manage storage across different origins
await set_cookies(connection, cookies=[{
    "name": "cross_site_token",
    "value": "token123",
    "domain": ".example.com",  # Applies to all subdomains
    "sameSite": "None",
    "secure": True
}])
```

## Storage Types

The module supports various storage mechanisms:

| Storage Type | Persistence | Scope | Capacity |
|--------------|-------------|-------|----------|
| Cookies | Session or persistent | Domain/Path | ~4KB per cookie |
| localStorage | Persistent | Origin | ~5-10MB |
| sessionStorage | Session | Tab | ~5-10MB |
| IndexedDB | Persistent | Origin | Large (GB+) |
| Cache API | Persistent | Origin | Large |

!!! warning "Privacy Considerations"
    Storage operations can affect user privacy. Always handle storage data responsibly and in compliance with privacy regulations. 

================================================
FILE: docs/en/api/commands/target.md
================================================
# Target Commands

Target commands manage browser targets including tabs, windows, and other browsing contexts.

## Overview

The target commands module provides functionality for creating, managing, and controlling browser targets such as tabs, popup windows, and service workers.

::: pydoll.commands.target_commands
    options:
      show_root_heading: true
      show_source: false
      heading_level: 2
      filters:
        - "!^_"
        - "!^__"

## Usage

Target commands are used internally by browser classes to manage tabs and windows:

```python
from pydoll.commands.target_commands import get_targets, create_target, close_target
from pydoll.connection.connection_handler import ConnectionHandler

# Get all browser targets
connection = ConnectionHandler()
targets = await get_targets(connection)

# Create a new tab
new_target = await create_target(connection, url="https://example.com")

# Close a target
await close_target(connection, target_id=new_target.target_id)
```

## Key Functionality

The target commands module provides functions for:

### Target Management
- `get_targets()` - List all browser targets
- `create_target()` - Create new tabs or windows
- `close_target()` - Close specific targets
- `activate_target()` - Bring target to foreground

### Target Information
- `get_target_info()` - Get detailed target information
- Target types: page, background_page, service_worker, browser
- Target states: attached, detached, crashed

### Session Management
- `attach_to_target()` - Attach to target for control
- `detach_from_target()` - Detach from target
- `send_message_to_target()` - Send commands to targets

### Browser Context
- `create_browser_context()` - Create isolated browser context
- `dispose_browser_context()` - Remove browser context
- `get_browser_contexts()` - List browser contexts

## Target Types

Different types of targets can be managed:

### Page Targets
```python
# Create a new tab
page_target = await create_target(
    connection,
    url="https://example.com",
    width=1920,
    height=1080,
    browser_context_id=None  # Default context
)
```

### Popup Windows
```python
# Create a popup window
popup_target = await create_target(
    connection,
    url="https://popup.example.com",
    width=800,
    height=600,
    new_window=True
)
```

### Incognito Contexts
```python
# Create incognito browser context
incognito_context = await create_browser_context(connection)

# Create tab in incognito context
incognito_tab = await create_target(
    connection,
    url="https://private.example.com",
    browser_context_id=incognito_context.browser_context_id
)
```

!!! info "Headless vs Headed: how contexts show up"
    Browser contexts are isolated logical environments. In headed mode, the first page created inside a new context will usually open in a new OS window. In headless mode, no window is shown — the isolation remains purely logical (cookies, storage, cache and auth state are still separate per context). Prefer contexts in headless/CI pipelines for performance and clean isolation.

## Advanced Features

### Target Events
Target commands work with various target events:
- `Target.targetCreated` - New target created
- `Target.targetDestroyed` - Target closed
- `Target.targetInfoChanged` - Target information updated
- `Target.targetCrashed` - Target crashed

### Multi-Target Coordination
```python
# Manage multiple tabs
targets = await get_targets(connection)
page_targets = [t for t in targets if t.type == "page"]

for target in page_targets:
    # Perform operations on each tab
    await activate_target(connection, target_id=target.target_id)
    # ... do work in this tab
```

### Target Isolation
```python
# Create isolated browser context for testing
test_context = await create_browser_context(connection)

# All targets in this context are isolated
test_tab1 = await create_target(
    connection, 
    url="https://test1.com",
    browser_context_id=test_context.browser_context_id
)

test_tab2 = await create_target(
    connection,
    url="https://test2.com", 
    browser_context_id=test_context.browser_context_id
)
```

!!! note "Browser Integration"
    Target commands are primarily used internally by the `Chrome` and `Edge` browser classes. The high-level browser APIs provide more convenient methods for tab management. 

================================================
FILE: docs/en/api/connection/connection.md
================================================
# Connection Handler

::: pydoll.connection.connection_handler.ConnectionHandler
    options:
      show_root_heading: true
      show_source: false
      heading_level: 2

================================================
FILE: docs/en/api/connection/managers.md
================================================
# Connection Managers

## CommandsManager

::: pydoll.connection.managers.commands_manager.CommandsManager
    options:
      show_root_heading: true
      show_source: false
      heading_level: 3

## EventsManager

::: pydoll.connection.managers.events_manager.EventsManager
    options:
      show_root_heading: true
      show_source: false
      heading_level: 3 

================================================
FILE: docs/en/api/core/constants.md
================================================
# Constants

This section documents all constants, enums, and configuration values used throughout Pydoll.

::: pydoll.constants
    options:
      show_root_heading: true
      show_source: false
      heading_level: 2
      group_by_category: true
      members_order: source 

================================================
FILE: docs/en/api/core/exceptions.md
================================================
# Exceptions

This section documents all custom exceptions that can be raised by Pydoll operations.

::: pydoll.exceptions
    options:
      show_root_heading: true
      show_source: false
      heading_level: 2
      group_by_category: true
      members_order: source 

================================================
FILE: docs/en/api/core/utils.md
================================================
# Utilities

This section documents utility functions and helper classes used throughout Pydoll.

::: pydoll.utils
    options:
      show_root_heading: true
      show_source: false
      heading_level: 2
      group_by_category: true
      members_order: source 

================================================
FILE: docs/en/api/elements/mixins.md
================================================
# Element Mixins

The mixins module provides reusable functionality that can be mixed into element classes to extend their capabilities.

## Find Elements Mixin

The `FindElementsMixin` provides element finding capabilities to classes that include it.

::: pydoll.elements.mixins.find_elements_mixin
    options:
      show_root_heading: true
      show_source: false
      heading_level: 2
      filters:
        - "!^_"
        - "!^__"

## Usage

Mixins are typically used internally by the library to compose functionality. The `FindElementsMixin` is used by classes like `Tab` and `WebElement` to provide element finding methods:

```python
# These methods come from FindElementsMixin
element = await tab.find(id="username")
elements = await tab.find(class_name="item", find_all=True)
element = await tab.query("#submit-button")
```

## Available Methods

The `FindElementsMixin` provides several methods for finding elements:

- `find()` - Modern element finding with keyword arguments
- `query()` - CSS selector and XPath queries
- `find_element()` - Legacy element finding method
- `find_elements()` - Legacy method for finding multiple elements

!!! tip "Modern vs Legacy"
    The `find()` method is the modern, recommended approach for finding elements. The `find_element()` and `find_elements()` methods are maintained for backward compatibility. 

================================================
FILE: docs/en/api/elements/shadow_root.md
================================================
# ShadowRoot

::: pydoll.elements.shadow_root.ShadowRoot
    options:
      show_root_heading: true
      show_source: false
      heading_level: 2
      members_order: source
      group_by_category: true


================================================
FILE: docs/en/api/elements/web_element.md
================================================
# WebElement

::: pydoll.elements.web_element.WebElement
    options:
      show_root_heading: true
      show_source: false
      heading_level: 2
      members_order: source
      group_by_category: true 

================================================
FILE: docs/en/api/index.md
================================================
# API Reference

Welcome to the Pydoll API Reference! This section provides comprehensive documentation for all classes, methods, and functions available in the Pydoll library.

## Overview

Pydoll is organized into several key modules, each serving a specific purpose in browser automation:

### Browser Module
The browser module contains classes for managing browser instances and their lifecycle.

- **[Chrome](browser/chrome.md)** - Chrome browser automation
- **[Edge](browser/edge.md)** - Microsoft Edge browser automation  
- **[Options](browser/options.md)** - Browser configuration options
- **[Tab](browser/tab.md)** - Tab management and interaction
- **[Requests](browser/requests.md)** - HTTP requests within browser context
- **[Managers](browser/managers.md)** - Browser lifecycle managers

### Elements Module
The elements module provides classes for interacting with web page elements.

- **[WebElement](elements/web_element.md)** - Individual element interaction
- **[ShadowRoot](elements/shadow_root.md)** - Shadow DOM root access and element lookup
- **[Mixins](elements/mixins.md)** - Reusable element functionality

### Connection Module
The connection module handles communication with the browser through the Chrome DevTools Protocol.

- **[Connection Handler](connection/connection.md)** - WebSocket connection management
- **[Managers](connection/managers.md)** - Connection lifecycle managers

### Commands Module
The commands module provides low-level Chrome DevTools Protocol command implementations.

- **[Commands Overview](commands/index.md)** - CDP command implementations by domain

### Protocol Module
The protocol module implements the Chrome DevTools Protocol commands and events.

- **[Base Types](protocol/base.md)** - Base types for Chrome DevTools Protocol
- **[Browser](protocol/browser.md)** - Browser domain commands and events
- **[DOM](protocol/dom.md)** - DOM domain commands and events
- **[Fetch](protocol/fetch.md)** - Fetch domain commands and events
- **[Input](protocol/input.md)** - Input domain commands and events
- **[Network](protocol/network.md)** - Network domain commands and events
- **[Page](protocol/page.md)** - Page domain commands and events
- **[Runtime](protocol/runtime.md)** - Runtime domain commands and events
- **[Storage](protocol/storage.md)** - Storage domain commands and events
- **[Target](protocol/target.md)** - Target domain commands and events

### Core Module
The core module contains fundamental utilities, constants, and exceptions.

- **[Constants](core/constants.md)** - Library constants and enums
- **[Exceptions](core/exceptions.md)** - Custom exception classes
- **[Utils](core/utils.md)** - Utility functions

## Quick Navigation

### Most Common Classes

| Class | Purpose | Module |
|-------|---------|--------|
| `Chrome` | Chrome browser automation | `pydoll.browser.chromium` |
| `Edge` | Edge browser automation | `pydoll.browser.chromium` |
| `Tab` | Tab interaction and control | `pydoll.browser.tab` |
| `WebElement` | Element interaction | `pydoll.elements.web_element` |
| `ChromiumOptions` | Browser configuration | `pydoll.browser.options` |

### Key Enums and Constants

| Name | Purpose | Module |
|------|---------|--------|
| `By` | Element selector strategies | `pydoll.constants` |
| `Key` | Keyboard key constants | `pydoll.constants` |
| `PermissionType` | Browser permission types | `pydoll.constants` |

### Common Exceptions

| Exception | When Raised | Module |
|-----------|-------------|--------|
| `ElementNotFound` | Element not found in DOM | `pydoll.exceptions` |
| `WaitElementTimeout` | Element wait timeout | `pydoll.exceptions` |
| `BrowserNotStarted` | Browser not started | `pydoll.exceptions` |

## Usage Patterns

### Basic Browser Automation

```python
from pydoll.browser.chromium import Chrome

async with Chrome() as browser:
    tab = await browser.start()
    await tab.go_to("https://example.com")
    element = await tab.find(id="my-element")
    await element.click()
```

### Element Finding

```python
# Using the modern find() method
element = await tab.find(id="username")
element = await tab.find(tag_name="button", class_name="submit")

# Using CSS selectors or XPath
element = await tab.query("#username")
element = await tab.query("//button[@class='submit']")
```

### Event Handling

```python
async def handle_page_load(event):
    print("Page finished loading")

await tab.enable_page_events()
await tab.on('Page.loadEventFired', handle_page_load)
```

## Type Hints

Pydoll is fully typed and provides comprehensive type hints for better IDE support and code safety. All public APIs include proper type annotations.

```python
from typing import Optional, List
from pydoll.elements.web_element import WebElement

# Methods return properly typed objects
element: Optional[WebElement] = await tab.find(id="test", raise_exc=False)
elements: List[WebElement] = await tab.find(class_name="item", find_all=True)
```

## Async/Await Support

All Pydoll operations are asynchronous and must be used with `async`/`await`:

```python
import asyncio

from pydoll.browser.chromium import Chrome

async def main():
    # All Pydoll operations are async
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to("https://example.com")
        
asyncio.run(main())
```

Use the navigation menu, or the module links in the Overview above, to explore the complete API documentation for each module.

================================================
FILE: docs/en/api/protocol/base.md
================================================
# Protocol Base Types

Base types and structures for Chrome DevTools Protocol commands, responses, and events.

## Base Types

::: pydoll.protocol.base
    options:
      show_root_heading: true
      show_source: false
      heading_level: 3
      group_by_category: true
      members_order: source
      filters:
        - "!^__"

================================================
FILE: docs/en/api/protocol/browser.md
================================================
# Browser Protocol

Browser domain commands, events and types for Chrome DevTools Protocol.

## Methods

::: pydoll.protocol.browser.methods
    options:
      show_root_heading: true
      show_source: false
      heading_level: 2

## Events  

::: pydoll.protocol.browser.events
    options:
      show_root_heading: true
      show_source: false
      heading_level: 2

## Types

::: pydoll.protocol.browser.types
    options:
      show_root_heading: true
      show_source: false
      heading_level: 2

================================================
FILE: docs/en/api/protocol/dom.md
================================================
# DOM Protocol

DOM domain commands, events and types for Chrome DevTools Protocol.

## Methods

::: pydoll.protocol.dom.methods
    options:
      show_root_heading: true
      show_source: false
      heading_level: 2

## Events

::: pydoll.protocol.dom.events
    options:
      show_root_heading: true
      show_source: false
      heading_level: 2

## Types

::: pydoll.protocol.dom.types
    options:
      show_root_heading: true
      show_source: false
      heading_level: 2

================================================
FILE: docs/en/api/protocol/fetch.md
================================================
# Fetch Protocol

Fetch domain commands, events and types for Chrome DevTools Protocol.

## Methods

::: pydoll.protocol.fetch.methods
    options:
      show_root_heading: true
      show_source: false
      heading_level: 2

## Events

::: pydoll.protocol.fetch.events
    options:
      show_root_heading: true
      show_source: false
      heading_level: 2

## Types

::: pydoll.protocol.fetch.types
    options:
      show_root_heading: true
      show_source: false
      heading_level: 2

================================================
FILE: docs/en/api/protocol/input.md
================================================
# Input Protocol

Input domain commands, events and types for Chrome DevTools Protocol.

## Methods

::: pydoll.protocol.input.methods
    options:
      show_root_heading: true
      show_source: false
      heading_level: 2

## Events

::: pydoll.protocol.input.events
    options:
      show_root_heading: true
      show_source: false
      heading_level: 2

## Types

::: pydoll.protocol.input.types
    options:
      show_root_heading: true
      show_source: false
      heading_level: 2

================================================
FILE: docs/en/api/protocol/network.md
================================================
# Network Protocol

Network domain commands, events and types for Chrome DevTools Protocol.

## Methods

::: pydoll.protocol.network.methods
    options:
      show_root_heading: false
      show_source: false
      heading_level: 2

## Events

::: pydoll.protocol.network.events
    options:
      show_root_heading: false
      show_source: false
      heading_level: 2

## Types

::: pydoll.protocol.network.types
    options:
      show_root_heading: false
      show_source: false
      heading_level: 2

================================================
FILE: docs/en/api/protocol/page.md
================================================
# Page Protocol

Page domain commands, events and types for Chrome DevTools Protocol.

## Methods

::: pydoll.protocol.page.methods
    options:
      show_root_heading: true
      show_source: false
      heading_level: 2

## Events

::: pydoll.protocol.page.events
    options:
      show_root_heading: true
      show_source: false
      heading_level: 2

## Types

::: pydoll.protocol.page.types
    options:
      show_root_heading: true
      show_source: false
      heading_level: 2

================================================
FILE: docs/en/api/protocol/runtime.md
================================================
# Runtime Protocol

Runtime domain commands, events and types for Chrome DevTools Protocol.

## Methods

::: pydoll.protocol.runtime.methods
    options:
      show_root_heading: true
      show_source: false
      heading_level: 2

## Events

::: pydoll.protocol.runtime.events
    options:
      show_root_heading: true
      show_source: false
      heading_level: 2

## Types

::: pydoll.protocol.runtime.types
    options:
      show_root_heading: true
      show_source: false
      heading_level: 2

================================================
FILE: docs/en/api/protocol/storage.md
================================================
# Storage Protocol

Storage domain commands, events and types for Chrome DevTools Protocol.

## Methods

::: pydoll.protocol.storage.methods
    options:
      show_root_heading: true
      show_source: false
      heading_level: 2

## Events

::: pydoll.protocol.storage.events
    options:
      show_root_heading: true
      show_source: false
      heading_level: 2

## Types

::: pydoll.protocol.storage.types
    options:
      show_root_heading: true
      show_source: false
      heading_level: 2

================================================
FILE: docs/en/api/protocol/target.md
================================================
# Target Protocol

Target domain commands, events and types for Chrome DevTools Protocol.

## Methods

::: pydoll.protocol.target.methods
    options:
      show_root_heading: true
      show_source: false
      heading_level: 2

## Events

::: pydoll.protocol.target.events
    options:
      show_root_heading: true
      show_source: false
      heading_level: 2

## Types

::: pydoll.protocol.target.types
    options:
      show_root_heading: true
      show_source: false
      heading_level: 2

================================================
FILE: docs/en/deep-dive/architecture/browser-domain.md
================================================
# Browser Domain Architecture

The Browser domain represents the highest level of Pydoll's automation hierarchy, managing the browser process lifecycle, CDP connections, context isolation, and global browser operations. This document explores the internal architecture, design decisions, and technical implementation of browser-level control.

!!! info "Practical Usage Guide"
    For practical examples and usage patterns, see the [Browser Management](../features/browser-management/tabs.md) and [Browser Contexts](../features/browser-management/contexts.md) guides.

## Architectural Overview

The Browser domain sits at the intersection of process management, protocol communication, and resource coordination. It orchestrates multiple specialized components to provide a unified interface for browser automation:

```mermaid
graph LR
    Browser[Browser Instance]
    Browser --> ProcessManager[Process Manager]
    Browser --> ProxyManager[Proxy Manager]
    Browser --> TempDirManager[Temp Directory Manager]
    Browser --> TabRegistry[Tab Registry]
    Browser --> ConnectionHandler[Connection Handler]
    
    ProcessManager --> |Manages| BrowserProcess[Browser Process]
    ConnectionHandler <--> |WebSocket| CDP[Chrome DevTools Protocol]
    TabRegistry --> |Manages| Tabs[Tab Instances]
    CDP <--> BrowserProcess
```

### Hierarchy and Abstraction

The Browser domain is implemented as an **abstract base class** that defines the contract for all browser implementations:

```python
class Browser(ABC):
    """Abstract base class for browser automation via CDP."""
    
    @abstractmethod
    def _get_default_binary_location(self) -> str:
        """Subclasses must provide browser-specific executable path."""
        pass
    
    async def start(self, headless: bool = False) -> Tab:
        """Concrete implementation shared by all browsers."""
        # 1. Resolve binary location
        # 2. Setup user data directory
        # 3. Start browser process
        # 4. Verify CDP connection
        # 5. Configure proxy (if needed)
        # 6. Return initial tab
```

This design enables **polymorphism** - Chrome, Edge, and other Chromium-based browsers share 99% of their code, differing only in executable paths and minor flag variations.

## Component Architecture

The Browser class coordinates several specialized managers, each responsible for a specific aspect of browser automation. Understanding these components is key to understanding Pydoll's design.

### Connection Handler

The ConnectionHandler is the **communication bridge** between Pydoll and the browser process. It manages:

- **WebSocket lifecycle**: Connection establishment, keep-alive, reconnection
- **Command execution**: Sending CDP commands and awaiting responses
- **Event dispatching**: Routing CDP events to registered callbacks
- **Callback registry**: Maintaining event listeners per connection

```python
class Browser:
    def __init__(self, ...):
        # ConnectionHandler is initialized with port or WebSocket address
        self._connection_handler = ConnectionHandler(self._connection_port)
    
    async def _execute_command(self, command, timeout=10):
        """All CDP commands flow through the connection handler."""
        return await self._connection_handler.execute_command(command, timeout)
```

!!! info "Connection Layer Deep Dive"
    For detailed information on WebSocket communication, command/response flow, and async patterns, see [Connection Layer Architecture](./connection-layer.md).

### Process Manager

The BrowserProcessManager handles **operating system process lifecycle**:

```python
class BrowserProcessManager:
    def start_browser_process(self, binary, port, arguments):
        """
        1. Constructs command-line with binary path + arguments
        2. Spawns subprocess with proper stdio handling
        3. Monitors process startup
        4. Stores process handle for later termination
        """
        
    def stop_process(self):
        """
        1. Attempts graceful termination (SIGTERM)
        2. Waits for process exit
        3. Force-kills if timeout exceeded (SIGKILL)
        4. Cleans up process resources
        """
```

**Why separate process management?**

- **Testability**: Process manager can be mocked for unit tests
- **Cross-platform**: Encapsulates OS-specific process handling
- **Reliability**: Handles edge cases like zombie processes, orphaned children

### Tab Registry

The Browser maintains a **registry of Tab instances** to ensure singleton behavior per target:

```python
class Browser:
    def __init__(self, ...):
        self._tabs_opened: dict[str, Tab] = {}
    
    async def new_tab(self, url='', browser_context_id=None) -> Tab:
        # Create target via CDP
        response = await self._execute_command(
            TargetCommands.create_target(browser_context_id=browser_context_id)
        )
        target_id = response['result']['targetId']
        
        # Check if tab already exists in registry
        if target_id in self._tabs_opened:
            return self._tabs_opened[target_id]
        
        # Create new Tab instance and register it
        tab = Tab(self, target_id=target_id, ...)
        self._tabs_opened[target_id] = tab
        return tab
```

**Why singleton Tab instances?**

- **State consistency**: Multiple references to same tab share state (enabled domains, callbacks)
- **Memory efficiency**: Prevents duplicate Tab instances for same target
- **Event routing**: Ensures events route to correct Tab instance

### Proxy Authentication Architecture

Pydoll implements **automatic proxy authentication** via the Fetch domain to avoid exposing credentials in CDP commands. The implementation uses **two distinct mechanisms** depending on proxy scope:

#### Mechanism 1: Browser-Level Proxy Auth (Global Proxy)

When a proxy is configured via `ChromiumOptions` (applies to all tabs in the default context):

```python
# In Browser.start() -> _configure_proxy()
async def _configure_proxy(self, private_proxy, proxy_credentials):
    # Enable Fetch AT BROWSER LEVEL
    await self.enable_fetch_events(handle_auth_requests=True)
    
    # Register callbacks AT BROWSER LEVEL (affects ALL tabs)
    await self.on(FetchEvent.REQUEST_PAUSED, self._continue_request_callback, temporary=True)
    await self.on(FetchEvent.AUTH_REQUIRED, 
                  partial(self._continue_request_with_auth_callback,
                          proxy_username=proxy_credentials[0],
                          proxy_password=proxy_credentials[1]),
                  temporary=True)
```

**Scope:** Browser-wide WebSocket connection → affects **all tabs in default context**

#### Mechanism 2: Tab-Level Proxy Auth (Per-Context Proxy)

When a proxy is configured per-context via `create_browser_context(proxy_server=...)`:

```python
# Store credentials per context
async def create_browser_context(self, proxy_server, ...):
    sanitized_proxy, extracted_auth = self._sanitize_proxy_and_extract_auth(proxy_server)
    
    response = await self._execute_command(
        TargetCommands.create_browser_context(proxy_server=sanitized_proxy)
    )
    context_id = response['result']['browserContextId']
    
    if extracted_auth:
        self._context_proxy_auth[context_id] = extracted_auth  # Store per context
    
    return context_id

# Setup auth for EACH tab in that context
async def _setup_context_proxy_auth_for_tab(self, tab, browser_context_id):
    creds = self._context_proxy_auth.get(browser_context_id)
    if not creds:
        return
    
    # Enable Fetch ON THE TAB (tab-level WebSocket)
    await tab.enable_fetch_events(handle_auth=True)
    
    # Register callbacks ON THE TAB (affects only this tab)
    await tab.on(FetchEvent.REQUEST_PAUSED, 
                 partial(self._tab_continue_request_callback, tab=tab), 
                 temporary=True)
    await tab.on(FetchEvent.AUTH_REQUIRED,
                 partial(self._tab_continue_request_with_auth_callback,
                         tab=tab,
                         proxy_username=creds[0],
                         proxy_password=creds[1]),
                 temporary=True)
```

**Scope:** Tab-level WebSocket connection → affects **only that specific tab**

#### Why Two Mechanisms?

| Aspect | Browser-Level | Tab-Level |
|--------|---------------|-----------|
| **Trigger** | Proxy in `ChromiumOptions` | Proxy in `create_browser_context()` |
| **WebSocket** | Browser-level connection | Tab-level connection |
| **Scope** | All tabs in default context | Only tabs in that context |
| **Efficiency** | One listener for all tabs | One listener per tab |
| **Isolation** | No context separation | Each context has different credentials |

**Design rationale for tab-level auth:**

- **Context isolation**: Each context can have a **different proxy** with **different credentials**
- **CDP limitation**: Fetch domain cannot be scoped to a specific context at browser level
- **Tradeoff**: Slightly less efficient (one listener per tab), but necessary for per-context proxy support

This architecture ensures **credentials never appear in CDP logs** and authentication is handled transparently.

!!! warning "Fetch Domain Side Effects"
    - **Browser-level Fetch**: Temporarily pauses **all requests across all tabs** in the default context until auth completes
    - **Tab-level Fetch**: Temporarily pauses **all requests in that specific tab** until auth completes
    
    This is inherent to how CDP works: enabling the Fetch domain turns on request interception, so every request in scope is paused until a handler continues it. After authentication completes, Fetch is disabled to minimize overhead.

## Initialization and Lifecycle

### Constructor Design

The Browser constructor initializes all internal components but **does not start the browser process**. This separation allows configuration before launch:

```python
class Browser(ABC):
    def __init__(
        self,
        options_manager: BrowserOptionsManager,
        connection_port: Optional[int] = None,
    ):
        # 1. Validate parameters
        self._validate_connection_port(connection_port)
        
        # 2. Initialize options via manager
        self.options = options_manager.initialize_options()
        
        # 3. Determine CDP port (random if not specified)
        self._connection_port = connection_port or randint(9223, 9322)
        
        # 4. Initialize specialized managers
        self._proxy_manager = ProxyManager(self.options)
        self._browser_process_manager = BrowserProcessManager()
        self._temp_directory_manager = TempDirectoryManager()
        self._connection_handler = ConnectionHandler(self._connection_port)
        
        # 5. Initialize state tracking
        self._tabs_opened: dict[str, Tab] = {}
        self._context_proxy_auth: dict[str, tuple[str, str]] = {}
        self._ws_address: Optional[str] = None
```

**Key design decisions:**

- **Lazy process start**: Constructor is synchronous; `start()` is async
- **Port flexibility**: Random port prevents collisions in parallel automation
- **Options manager pattern**: Strategy pattern for browser-specific configuration
- **Component composition**: Specialized managers instead of monolithic class

### Start Sequence

The `start()` method orchestrates browser launch and connection:

```python
async def start(self, headless: bool = False) -> Tab:
    # 1. Resolve binary location
    binary_location = self.options.binary_location or self._get_default_binary_location()
    
    # 2. Setup user data directory (temp or persistent)
    self._setup_user_dir()
    
    # 3. Extract proxy credentials (if private proxy)
    proxy_config = self._proxy_manager.get_proxy_credentials()
    
    # 4. Start browser process with arguments
    self._browser_process_manager.start_browser_process(
        binary_location, self._connection_port, self.options.arguments
    )
    
    # 5. Verify CDP endpoint is responsive
    await self._verify_browser_running()
    
    # 6. Configure proxy authentication (via Fetch domain)
    await self._configure_proxy(proxy_config[0], proxy_config[1])
    
    # 7. Get first valid target and create Tab
    valid_tab_id = await self._get_valid_tab_id(await self.get_targets())
    tab = Tab(self, target_id=valid_tab_id, connection_port=self._connection_port)
    self._tabs_opened[valid_tab_id] = tab
    
    return tab
```

!!! tip "Why start() Returns a Tab"
    This is a **design compromise** for ergonomics. Ideally, `start()` would only launch the browser, and users would call `new_tab()` separately. However, returning the initial tab reduces boilerplate for the 90% use case (single-tab automation). The tradeoff: the initial tab cannot be avoided even in multi-tab scenarios.

### Context Manager Protocol

The Browser implements `__aenter__` and `__aexit__` for automatic cleanup:

```python
async def __aexit__(self, exc_type, exc_val, exc_tb):
    # 1. Restore backup preferences (if modified)
    if self._backup_preferences_dir:
        shutil.copy2(self._backup_preferences_dir, ...)
    
    # 2. Check if browser is still running
    if await self._is_browser_running(timeout=2):
        await self.stop()
    
    # 3. Close WebSocket connection
    await self._connection_handler.close()
```

This ensures proper cleanup even if exceptions occur during automation.

## Browser Context Architecture

Browser contexts are Pydoll's most sophisticated isolation mechanism, providing **complete browsing environment separation** within a single browser process. Understanding their architecture is essential for advanced automation.

### CDP Hierarchy: Browser, Context, Target

CDP organizes browser structure into three levels:

```mermaid
graph TB
    Browser[Browser Process]
    Browser --> DefaultContext[Default BrowserContext]
    Browser --> Context1[BrowserContext ID: abc-123]
    Browser --> Context2[BrowserContext ID: def-456]
    
    DefaultContext --> Target1[Target/Page ID: page-1]
    DefaultContext --> Target2[Target/Page ID: page-2]
    
    Context1 --> Target3[Target/Page ID: page-3]
    
    Context2 --> Target4[Target/Page ID: page-4]
    Context2 --> Target5[Target/Page ID: page-5]
```

**Key concepts:**

1. **Browser Process**: Single Chromium instance with one CDP endpoint
2. **BrowserContext**: Isolated storage/cache/permission boundary (similar to incognito mode)
3. **Target**: Individual page, popup, worker, or background target

### Context Isolation Boundaries

Each browser context maintains **strict isolation** for:

| Resource | Isolation Level | Implementation |
|----------|----------------|----------------|
| Cookies | Full | Separate cookie jar per context |
| localStorage | Full | Separate storage per origin per context |
| IndexedDB | Full | Separate database per origin per context |
| Cache | Full | Independent HTTP cache per context |
| Permissions | Full | Context-specific permission grants |
| Network proxy | Full | Per-context proxy configuration |
| Authentication | Full | Independent auth state per context |

!!! info "Why Contexts Are Lightweight"
    Unlike launching multiple browser processes, contexts share the **rendering engine, GPU process, and network stack**. Only storage and state are isolated. This makes contexts 10-100x faster to create than new browser instances.

### Context Creation and Target Binding

Creating a context and target involves two CDP commands:

```python
# Step 1: Create isolated browsing context
response = await self._execute_command(
    TargetCommands.create_browser_context(
        proxy_server='http://proxy.example.com:8080',
        proxy_bypass_list='localhost,127.0.0.1'
    )
)
context_id = response['result']['browserContextId']

# Step 2: Create target (page) within that context
response = await self._execute_command(
    TargetCommands.create_target(
        browser_context_id=context_id  # Binds target to context
    )
)
target_id = response['result']['targetId']
```

**Critical detail:** The `browser_context_id` parameter **binds the target to the context's isolation boundary**. Without it, the target is created in the default context.

### Window Materialization in Headed Mode

In **headed mode** (visible UI), browser contexts have an important physical constraint:

- A context initially exists only **in memory** (no window)
- The **first target** created in a context **must** open a top-level window
- **Subsequent targets** can open as tabs within that window

This is a **CDP/Chromium limitation**, not a Pydoll design choice:

```python
# First target in context: MUST create window
tab1 = await browser.new_tab(browser_context_id=context_id)  # Opens new window

# Subsequent targets: CAN open as tabs in existing window
tab2 = await browser.new_tab(browser_context_id=context_id)  # Opens as tab
```

**Why does this matter?**

- In **headless mode**: Completely irrelevant (no windows rendered)
- In **headed mode**: First target per context will open a visible window
- In **test environments**: Multiple contexts → multiple windows (can be confusing)

!!! tip "Headless Contexts Are Cleaner"
    For CI/CD, scraping, or batch automation, use headless mode. Context isolation works identically, but without window materialization overhead.

### Context Deletion and Cleanup

Deleting a context **immediately closes all targets** within it:

```python
await browser.delete_browser_context(context_id)
# All tabs in this context are now closed
# All storage for this context is cleared
# Context cannot be reused (ID is invalid)
```

**Cleanup sequence:**

1. Pydoll sends the `Target.disposeBrowserContext` CDP command
2. Browser closes all targets in that context
3. Browser clears all storage for that context
4. Browser invalidates the context ID
5. Pydoll removes context from internal registries

## Event System at Browser Level

The Browser domain supports **browser-wide event listeners** that operate across all tabs and contexts. This is distinct from tab-level events.

### Browser vs Tab Event Scope

```python
# Browser-level event: applies to ALL tabs
await browser.on('Target.targetCreated', handle_new_target)

# Tab-level event: applies to ONE tab
await tab.on('Page.loadEventFired', handle_page_load)
```

**Architectural difference:**

- **Browser events** use the **browser-level WebSocket connection** (port-based or `ws://host/devtools/browser/...`)
- **Tab events** use **tab-level WebSocket connections** (`ws://host/devtools/page/<target_id>`)

### Fetch Domain: Global Request Interception

The Fetch domain can be enabled at **both** browser and tab levels, with different scopes:

```python
# Browser-level Fetch: intercepts requests for ALL tabs
await browser.enable_fetch_events(handle_auth_requests=True)
await browser.on('Fetch.requestPaused', handle_request)

# Tab-level Fetch: intercepts requests for ONE tab
await tab.enable_fetch_events(handle_auth_requests=True)
await tab.on('Fetch.requestPaused', handle_request)
```

**When to use each:**

| Use Case | Level | Reason |
|----------|-------|--------|
| Proxy authentication | Browser | Applies globally to all contexts |
| Ad blocking | Browser | Block ads across all tabs |
| API mocking | Tab | Mock specific API for specific test |
| Request logging | Tab | Log only relevant tab's requests |

!!! warning "Fetch Performance Impact"
    Enabling Fetch at the browser level **pauses all requests** across all tabs until callbacks execute. This adds latency to every request. Use tab-level Fetch when possible to minimize impact.

### Command Routing

All CDP commands flow through the Browser's connection handler:

```python
async def _execute_command(self, command, timeout=10):
    """
    Routes command to appropriate connection:
    - Browser-level commands → browser WebSocket
    - Tab-level commands → delegated to Tab instance
    """
    return await self._connection_handler.execute_command(command, timeout)
```

This centralized routing enables:

- **Request/response correlation**: Match responses to requests via ID
- **Timeout management**: Cancel commands that exceed timeout
- **Error handling**: Convert CDP errors to Python exceptions

## Resource Management

### Cookie and Storage Operations

The Browser domain exposes **browser-wide** and **context-specific** storage operations:

```python
# Browser-level operations (all contexts)
await browser.set_cookies(cookies)
await browser.get_cookies()
await browser.delete_all_cookies()

# Context-specific operations
await browser.set_cookies(cookies, browser_context_id=context_id)
await browser.get_cookies(browser_context_id=context_id)
await browser.delete_all_cookies(browser_context_id=context_id)
```

These operations use the **Storage domain** under the hood:

- `Storage.getCookies`: Retrieve cookies for context or all contexts
- `Storage.setCookies`: Set cookies with domain/path/expiry
- `Storage.clearCookies`: Clear cookies for context or all contexts

!!! info "Browser vs Tab Storage Scope"
    - **Browser-level**: Operates on entire browser or specific context
    - **Tab-level**: Scoped to tab's current origin
    
    Use browser-level for global cookie management (e.g., setting session cookies for all domains). Use tab-level for origin-specific operations (e.g., clearing cookies after logout).

### Permission Grants

The Browser domain provides **programmatic permission control**, bypassing browser prompts:

```python
await browser.grant_permissions(
    [PermissionType.GEOLOCATION, PermissionType.NOTIFICATIONS],
    origin='https://example.com',
    browser_context_id=context_id
)
```

**Architecture:**

- Permissions are granted via the `Browser.grantPermissions` CDP command
- Permissions are **context-specific** (isolated per context)
- Grants override default prompt behavior
- `reset_permissions()` reverts to default behavior

### Download Management

Download behavior is configured via the `Browser.setDownloadBehavior` command:

```python
await browser.set_download_behavior(
    behavior=DownloadBehavior.ALLOW,
    download_path='/path/to/downloads',
    events_enabled=True,  # Emit download progress events
    browser_context_id=context_id
)
```

**Options:**

- `ALLOW`: Save to specified path
- `DENY`: Cancel all downloads
- `DEFAULT`: Show browser's default download UI

### Window Management

Window operations apply to the **physical OS window** of a target:

```python
window_id = await browser.get_window_id_for_target(target_id)
await browser.set_window_bounds({
    'left': 100, 'top': 100,
    'width': 1920, 'height': 1080,
    'windowState': 'normal'  # or 'minimized', 'maximized', 'fullscreen'
})
```

**Implementation details:**

- Uses `Browser.getWindowForTarget` to resolve window ID from target ID
- `Browser.setWindowBounds` modifies window geometry
- **Headless mode**: Window operations are no-ops (no physical windows exist)

## Architectural Insights and Design Tradeoffs

### Singleton Tab Registry: Why?

The tab registry pattern (`_tabs_opened: dict[str, Tab]`) ensures that:

1. **Event routing works correctly**: CDP events contain a `targetId` but no Tab reference. The registry maps `targetId` → `Tab` for correct callback dispatch.
2. **State consistency**: Multiple code paths that reference the same target get the **same Tab instance**, preventing state divergence.
3. **Memory efficiency**: Without the registry, `get_opened_tabs()` would create duplicate Tab instances on every call.

**Tradeoff:** Memory usage grows with tab count, but this is unavoidable for stateful Tab instances.

### Why start() Returns a Tab

This design decision sacrifices purity for **ergonomics**:

- **Downside**: Initial tab cannot be avoided, even in multi-tab automation
- **Upside**: 90% of users (single-tab scripts) don't need boilerplate:

```python
# With start() returning Tab
tab = await browser.start()

# Without (pure design)
await browser.start()
tab = await browser.new_tab()
```

**Alternative explored:** Auto-close initial tab in `new_tab()`. Rejected because it's surprising behavior (implicit side effects).

### Proxy Authentication: Two-Level Architecture Tradeoff

Pydoll's proxy authentication uses two different Fetch domain strategies:

**Browser-Level (Global Proxy):**
- **Security benefit**: Credentials never logged in CDP traces
- **Performance cost**: Fetch pauses **all requests across all tabs** until auth completes
- **Efficiency**: Single listener for all tabs in default context
- **Mitigation**: Fetch is disabled after first auth, minimizing overhead

**Tab-Level (Per-Context Proxy):**
- **Security benefit**: Credentials never logged in CDP traces
- **Performance cost**: Fetch pauses **all requests in that tab** until auth completes
- **Efficiency**: Separate listener per tab (less efficient, but necessary for isolation)
- **Isolation benefit**: Each context can have different proxy credentials
- **Mitigation**: Fetch is disabled after first auth per tab

**Why not use Browser.setProxyAuth?** This CDP command doesn't exist. Fetch is the only mechanism for programmatic auth.

**Why tab-level for contexts?** CDP's Fetch domain cannot be scoped to a specific BrowserContext. Since each context can have a different proxy with different credentials, Pydoll must handle auth at the tab level to respect context boundaries.

### Port Randomization Strategy

Random CDP ports (9223-9322) prevent collisions when running parallel browser instances:

```python
self._connection_port = connection_port or randint(9223, 9322)
```

**Why not increment from 9222?**

- Race conditions in multi-process environments (e.g., pytest-xdist)
- Collision with user's manual port selection

**Tradeoff:** Random ports are harder to debug (can't hardcode). Solution: `browser._connection_port` exposes the chosen port.

### Component Separation: Why Managers?

The Browser class delegates to specialized managers (ProcessManager, ProxyManager, TempDirManager, ConnectionHandler) for:

1. **Testability**: Managers can be mocked independently
2. **Reusability**: ProxyManager logic shared across Browser implementations
3. **Maintainability**: Each manager has single responsibility
4. **Cross-platform**: OS-specific logic isolated in ProcessManager

**Tradeoff:** More indirection, but significantly better code organization at scale.

## Key Takeaways

1. **Browser is a coordinator**, not a monolith. It orchestrates managers and handles CDP communication.
2. **Tab registry ensures singleton instances** per target, critical for event routing and state consistency.
3. **Browser contexts are lightweight isolation**, sharing browser process but separating storage/cache/auth.
4. **Proxy auth via Fetch** is a security tradeoff - hides credentials but adds latency.
5. **Event system has two levels**: Browser-wide and tab-specific, with different WebSocket connections.
6. **Component separation** (managers) improves testability and cross-platform support.

## Related Documentation

For deeper understanding of related architectural components:

- **[Connection Layer](./connection-layer.md)**: WebSocket communication, command/response flow, async patterns
- **[Event Architecture](./event-architecture.md)**: Event dispatch, callback management, domain enabling
- **[Tab Domain](./tab-domain.md)**: Tab-level operations, page navigation, element finding
- **[CDP Deep Dive](./cdp.md)**: Chrome DevTools Protocol fundamentals
- **[Proxy Architecture](./proxy-architecture.md)**: Network-level proxy concepts and implementation

For practical usage patterns:

- **[Tab Management](../features/browser-management/tabs.md)**: Multi-tab automation patterns
- **[Browser Contexts](../features/browser-management/contexts.md)**: Context isolation in practice
- **[Proxy Configuration](../features/configuration/proxy.md)**: Setting up proxies and authentication


================================================
FILE: docs/en/deep-dive/architecture/browser-requests-architecture.md
================================================
# Browser-Context Requests Architecture

This document explores the architectural design of Pydoll's browser-context HTTP request system, which enables making HTTP requests that seamlessly inherit the browser's session state, cookies, and authentication.

!!! info "Practical Guide Available"
    This is the architectural deep dive. For practical examples and use cases, see [HTTP Requests Guide](../features/network/http-requests.md).

## Architectural Overview

Browser-context requests solve a fundamental problem in hybrid automation: maintaining session continuity between UI interactions and API calls. Traditional approaches require manually extracting cookies and headers, creating fragile coupling between browser and HTTP client.

Pydoll's architecture eliminates this complexity by executing HTTP requests **inside** the browser's JavaScript context, while leveraging CDP network events to capture comprehensive metadata that JavaScript alone cannot provide.

### Why This Architecture?

| Traditional Approach | Pydoll Architecture |
|---------------------|---------------------|
| Separate HTTP client (requests, aiohttp) | Unified browser-based execution |
| Manual cookie extraction and sync | Automatic cookie inheritance |
| Two separate session states | Single session state |
| Limited CORS handling | Browser-native CORS enforcement |
| Complex authentication flows | Transparent auth preservation |


## Component Architecture

The browser-context request system consists of two primary classes that work together with Pydoll's event system:

```mermaid
classDiagram
    class Tab {
        +request: Request
        +enable_network_events()
        +disable_network_events()
        +get_network_response_body()
        +on(event_name, callback)
        +clear_callbacks()
    }
    
    class Request {
        -tab: Tab
        -_network_events_enabled: bool
        -_requests_sent: list
        -_requests_received: list
        +get(url, params, kwargs)
        +post(url, data, json, kwargs)
        +put(url, data, json, kwargs)
        +patch(url, data, json, kwargs)
        +delete(url, kwargs)
        +head(url, kwargs)
        +options(url, kwargs)
        -_execute_fetch_request()
        -_register_callbacks()
        -_extract_headers()
        -_extract_cookies()
    }
    
    class Response {
        -_status_code: int
        -_content: bytes
        -_text: str
        -_json: dict
        -_response_headers: list
        -_request_headers: list
        -_cookies: list
        -_url: str
        +ok: bool
        +status_code: int
        +text: str
        +content: bytes
        +url: str
        +headers: list
        +request_headers: list
        +cookies: list
        +json()
        +raise_for_status()
    }
    
    Tab *-- Request
    Request ..> Response : creates
    Request ..> Tab : uses events
```

### Request Class

The `Request` class serves as the interface layer, providing a familiar `requests`-like API while orchestrating the complex interaction between JavaScript execution and network event monitoring.

**Key Responsibilities:**

- Translate Python method calls to Fetch API JavaScript
- Manage temporary network event listeners
- Accumulate network events during request execution
- Extract metadata from CDP events
- Construct Response objects with complete information

### Response Class

The `Response` class provides a `requests.Response`-compatible interface, making migration from traditional HTTP clients seamless.

**Key Features:**

- Multiple content accessors (text, bytes, JSON)
- Lazy JSON parsing with caching
- Comprehensive header information (both sent and received)
- Cookie extraction from Set-Cookie headers
- Final URL after redirects

## Execution Flow

The request execution follows a six-phase pipeline:

```mermaid
flowchart TD
    Start([tab.request.get#40;url#41;]) --> Phase1[<b>1. Preparation</b><br/>Build URL + options]
    
    Phase1 --> Phase2[<b>2. Event Registration</b><br/>Enable network events<br/>Register callbacks]
    
    Phase2 --> Phase3[<b>3. JavaScript Execution</b><br/>Runtime.evaluate&#40;fetch&#41;]
    
    Phase3 --> Phase4{<b>4. Network Activity</b>}
    Phase4 -->|Request sent| Event1[REQUEST_WILL_BE_SENT]
    Phase4 -->|Response received| Event2[RESPONSE_RECEIVED]
    Phase4 -->|Extra info| Event3[*_EXTRA_INFO events]
    
    Event1 --> Collect[Collect metadata]
    Event2 --> Collect
    Event3 --> Collect
    
    Collect --> Phase5[<b>5. Construction</b><br/>Extract headers/cookies<br/>Build Response object]
    
    Phase5 --> Phase6[<b>6. Cleanup</b><br/>Clear callbacks<br/>Disable events]
    
    Phase6 --> End([Return Response])
```

### Phase Details

| Phase | Layer | Key Operations | Asynchronous |
|-------|-------|----------------|--------------|
| **1. Preparation** | Request | URL building, options formatting | No |
| **2. Event Registration** | Tab | Enable events, register callbacks | Yes |
| **3. JavaScript Execution** | CDP/Browser | Execute fetch() in browser context | Yes |
| **4. Network Activity** | Browser/CDP | HTTP request, emit CDP events | Yes (parallel) |
| **5. Construction** | Request | Parse events, build Response | No |
| **6. Cleanup** | Tab | Remove callbacks, disable events | Yes |

## Event System Integration

Browser-context requests are tightly integrated with Pydoll's event system architecture. Understanding this relationship is crucial.

### Temporary Event Lifecycle

```mermaid
stateDiagram-v2
    [*] --> NoEvents: Request starts
    NoEvents --> EventsEnabled: Enable network events
    EventsEnabled --> CallbacksRegistered: Register callbacks
    CallbacksRegistered --> ExecutingRequest: Execute fetch
    ExecutingRequest --> CapturingEvents: Events fire
    CapturingEvents --> ExecutingRequest: More events
    ExecutingRequest --> CleaningUp: Fetch completes
    CleaningUp --> CallbacksRemoved: Clear callbacks
    CallbacksRemoved --> EventsDisabled: Disable if needed
    EventsDisabled --> [*]: Request complete
```

### Why Both JavaScript and Events?

A common question: if JavaScript can execute the request, why use network events?

| Information Source | JavaScript (Fetch API) | Network Events (CDP) |
|-------------------|------------------------|----------------------|
| Response status | Available | Available |
| Response body | Available | Not available |
| Response headers | Partial (CORS restricted) | Complete |
| Request headers | Not accessible | Complete |
| Set-Cookie headers | Hidden by browser | Available |
| Timing information | Limited | Comprehensive |
| Redirect chain | Only final URL | Full chain |

**The Solution:** Combine both sources for complete information.

!!! tip "Complementary Technologies"
    JavaScript provides the response body and triggers the request in the browser's context (with cookies, auth). Network events provide the metadata that JavaScript security policies hide.

### CDP Network Event Types

The architecture uses four CDP event types to capture complete metadata:

| Event | Purpose | Key Information |
|-------|---------|----------------|
| `REQUEST_WILL_BE_SENT` | Main outgoing request | URL, method, standard headers |
| `REQUEST_WILL_BE_SENT_EXTRA_INFO` | Additional request metadata | Associated cookies, raw headers |
| `RESPONSE_RECEIVED` | Main response received | Status, headers, MIME type, timing |
| `RESPONSE_RECEIVED_EXTRA_INFO` | Additional response metadata | Set-Cookie headers, security info |

!!! info "Event Multiplicity"
    A single HTTP request generates multiple CDP events. The Request class accumulates all related events and extracts non-duplicate information during the construction phase.

## Header and Cookie Architecture

### Header Extraction Strategy

Headers exist in multiple CDP events with potential duplication. The architecture uses a deduplication strategy:

```mermaid
flowchart TD
    A[Network Events] --> B{Event Type}
    B -->|REQUEST events| C[Extract Sent Headers]
    B -->|RESPONSE events| D[Extract Received Headers]
    
    C --> E[Deduplicate by name+value]
    D --> F[Deduplicate by name+value]
    
    E --> G[Request Headers List]
    F --> H[Response Headers List]
    
    G --> I[Response Object]
    H --> I
```

**Deduplication Logic:**

1. Events are processed in order
2. Each header is identified by `(name, value)` tuple
3. Only first occurrence of each tuple is kept
4. Result: unique, non-redundant header list

### Cookie Parsing Architecture

Cookies require special handling because they come from `Set-Cookie` headers in `RESPONSE_RECEIVED_EXTRA_INFO` events:

```mermaid
flowchart TD
    A[RESPONSE_RECEIVED_EXTRA_INFO] --> B[Extract Set-Cookie headers]
    B --> C{Multi-line header?}
    C -->|Yes| D[Split by newline]
    C -->|No| E[Parse single cookie]
    D --> F[Parse each line]
    F --> G[Extract name=value]
    E --> G
    G --> H{Valid name?}
    H -->|Yes| I[Create CookieParam]
    H -->|No| J[Discard]
    I --> K[Add to cookie list]
    K --> L[Deduplicate]
    L --> M[Response Object]
```

**Cookie Extraction Principles:**

- Only `RESPONSE_RECEIVED_EXTRA_INFO` events contain `Set-Cookie` headers
- Cookie attributes (Path, Domain, Secure, HttpOnly) are ignored
- Browser manages cookie attributes internally
- Only name-value pairs are extracted for informational purposes

!!! warning "Cookie Scope"
    The `Response.cookies` property contains only **new or updated** cookies from this specific response. Existing browser cookies are managed automatically and not exposed through this interface.

## JavaScript Execution Context

The Fetch API execution happens in the browser's JavaScript context, which is key to the architecture's power:

### Fetch API Integration

The request is translated to JavaScript:

```javascript
// Simplified representation
(async () => {
    const response = await fetch(url, {
        method: 'GET',
        headers: {'X-Custom': 'value'},
        // Browser automatically adds:
        // - Cookie header
        // - Authorization if set
        // - Standard headers (User-Agent, Accept, etc.)
    });
    
    return {
        status: response.status,
        url: response.url,  // Final URL after redirects
        text: await response.text(),
        content: new Uint8Array(await response.arrayBuffer()),
        json: response.headers.get('Content-Type')?.includes('application/json')
            ? await response.clone().json()
            : null
    };
})()
```

### Browser Context Benefits

Executing in the browser context provides:

| Benefit | Description |
|---------|-------------|
| **Automatic Cookie Inclusion** | Browser sends all applicable cookies automatically |
| **Auth State Preservation** | Authentication headers maintained from browser session |
| **CORS Enforcement** | Browser applies same CORS policies as user interactions |
| **TLS/SSL Handling** | Browser's certificate validation and security policies apply |
| **Compression** | Automatic handling of gzip, br, deflate |
| **Redirects** | Browser follows redirects transparently |
| **Same Security Context** | Request appears identical to user-initiated requests |

!!! info "Anti-Bot Detection"
    Requests executed in the browser context are indistinguishable from user-initiated requests, making them effective against anti-bot systems that analyze request patterns.

## Performance Considerations

### Event Overhead

Network events add overhead to request execution:

| Scenario | Overhead | Recommendation |
|----------|----------|----------------|
| Single request | Low | Acceptable |
| Multiple sequential requests | Moderate | Enable events once |
| Bulk requests (100+) | High | Consider enabling events at tab level |
| Long-running automation | Memory concern | Disable when done |

### Optimization Pattern

```python
# Inefficient - events enabled/disabled repeatedly
for url in urls:
    response = await tab.request.get(url)

# Efficient - events enabled once
await tab.enable_network_events()
for url in urls:
    response = await tab.request.get(url)
await tab.disable_network_events()
```

!!! tip "Automatic Optimization"
    The Request class checks if network events are already enabled and skips redundant enable/disable operations automatically.

### JSON Parsing Strategy

Response JSON parsing uses lazy evaluation with caching:

1. First call to `response.json()`: Parse and cache
2. Subsequent calls: Return cached result
3. If JSON pre-parsed during construction: Use that

This prevents redundant parsing overhead.

## Security Architecture

### CORS Policy Enforcement

Browser-context requests respect CORS policies:

```mermaid
flowchart TD
    A[tab.request.get&#40;url&#41;] --> B{Same Origin?}
    B -->|Yes| C[Request Allowed]
    B -->|No| D{CORS Headers Present?}
    D -->|Yes| E[Request Allowed]
    D -->|No| F[Request Blocked]
    
    C --> G[Response Returned]
    E --> G
    F --> H[CORS Error]
```

**CORS Behavior:**

- Requests to same origin: Always allowed
- Cross-origin requests: Require CORS headers from server
- Opaque responses: May be blocked by browser

**Workaround for CORS Issues:**

Navigate to the domain first to establish same-origin context:

```python
await tab.go_to('https://different-domain.com')
response = await tab.request.get('https://different-domain.com/api')
```

### Cookie Security

Cookies with security flags (`HttpOnly`, `Secure`, `SameSite`) are handled by the browser:

- **HttpOnly cookies**: Sent automatically by the browser but not exposed to page JavaScript (e.g. `document.cookie`)
- **Secure cookies**: Only sent over HTTPS
- **SameSite cookies**: Browser enforces SameSite policies

The `Response.cookies` property may not show all cookies due to these security restrictions.

### TLS/SSL Validation

The browser validates SSL certificates. Self-signed or invalid certificates cause requests to fail unless certificate errors are explicitly ignored via a browser argument:

```python
options = ChromiumOptions()
options.add_argument('--ignore-certificate-errors')
browser = Chrome(options=options)
```

!!! warning "Security Trade-off"
    Disabling certificate validation reduces security. Only use in controlled environments.

## Limitations and Design Decisions

### Request Body Size

Very large request bodies (files, large datasets) have JavaScript memory constraints. For file uploads, use `WebElement.set_input_files()` or the file chooser interceptor instead.

### Binary Response Handling

Binary responses are converted through JavaScript's `ArrayBuffer` and `Uint8Array`, which adds some overhead for very large responses (>100MB).

### Redirect Transparency

The Fetch API follows redirects automatically. Only the final URL is captured. If you need the redirect chain, use network monitoring separately.

### Event Timing

Events must be registered **before** executing the fetch. The architecture ensures this through the registration phase, but manual event handling requires careful timing.

## Architectural Principles

The browser-context request architecture adheres to these principles:

1. **Session Continuity**: Never break the browser's session state
2. **Zero Manual Sync**: No cookie/header extraction required
3. **Complete Information**: Combine JavaScript + events for full metadata
4. **Automatic Cleanup**: Resources freed after each request
5. **Familiar Interface**: `requests`-compatible API for easy adoption
6. **Performance Conscious**: Optimize for common use cases
7. **Security Aware**: Respect browser security policies

## Integration with Other Systems

### Event System Dependency

Browser-context requests depend on the event system architecture:

- Leverages `Tab.on()` for callback registration
- Uses `Tab.clear_callbacks()` for cleanup
- Respects existing network event enablement
- Integrates with event lifecycle management

See [Event System Architecture](event-architecture.md) for details.

### Type System Integration

The architecture uses Python's type system extensively:

- `HeaderEntry` TypedDict for headers
- `CookieParam` TypedDict for cookies
- Event type definitions from `pydoll.protocol.network.events`
- Provides IDE autocomplete and type safety

See [Typing System](typing-system.md) for details.

## Further Reading

- **[HTTP Requests Guide](../features/network/http-requests.md)** - Practical examples and use cases
- **[Event System Architecture](event-architecture.md)** - Event system internal design
- **[Network Monitoring](../features/network/monitoring.md)** - Passive network observation
- **[Request Interception](../features/network/interception.md)** - Active request modification
- **[Typing System](typing-system.md)** - Type system integration

## Summary

Pydoll's browser-context request architecture achieves seamless HTTP communication by combining JavaScript Fetch API execution with CDP network event monitoring. This hybrid approach provides:

- **Complete metadata** from both JavaScript and CDP events
- **Automatic session continuity** through browser context execution  
- **Familiar interface** compatible with the requests library
- **Performance optimization** through event reuse
- **Security compliance** with browser policies

The architecture demonstrates how combining complementary technologies (JavaScript + CDP events) can solve complex problems elegantly, providing power and convenience without compromising on completeness or security.


================================================
FILE: docs/en/deep-dive/architecture/event-architecture.md
================================================
# Event System Architecture

This document explores the internal architecture of Pydoll's event system, covering WebSocket communication, event flow, callback management, and performance considerations.

!!! info "Practical Usage Guide"
    For practical examples and usage patterns, see the [Event System Guide](../features/advanced/event-system.md).

## WebSocket Communication and CDP

At the core of Pydoll's event system is the Chrome DevTools Protocol (CDP), which provides a structured way to interact with and monitor browser activities over WebSocket connections. This bidirectional communication channel allows your code to both send commands to the browser and receive events back.

```mermaid
sequenceDiagram
    participant Client as Pydoll Code
    participant Connection as ConnectionHandler
    participant WebSocket
    participant Browser
    
    Client->>Connection: Register callback for event
    Connection->>Connection: Store callback in registry
    
    Client->>Connection: Enable event domain
    Connection->>WebSocket: Send CDP command to enable domain
    WebSocket->>Browser: Forward command
    Browser-->>WebSocket: Acknowledge domain enabled
    WebSocket-->>Connection: Forward response
    Connection-->>Client: Domain enabled
    
    Browser->>WebSocket: Event occurs, sends CDP event message
    WebSocket->>Connection: Forward event message
    Connection->>Connection: Look up callbacks for this event
    Connection->>Client: Execute registered callback
```

### WebSocket Communication Model

The WebSocket connection between Pydoll and the browser follows this pattern:

1. **Connection Establishment**: When the browser starts, a WebSocket server is created, and Pydoll establishes a connection to it
2. **Bidirectional Messaging**: Both Pydoll and the browser can send messages at any time
3. **Message Types**:
   - **Commands**: Sent from Pydoll to the browser (e.g., navigation, DOM manipulation)
   - **Command Responses**: Sent from the browser to Pydoll in response to commands
   - **Events**: Sent from the browser to Pydoll when something happens (e.g., page load, network activity)

### Chrome DevTools Protocol Structure

CDP organizes its functionality into domains, each responsible for a specific area of browser functionality:

| Domain | Responsibility | Typical Events |
|--------|----------------|----------------|
| Page | Page lifecycle | Load events, navigation, dialogs |
| Network | Network activity | Request/response monitoring, WebSockets |
| DOM | Document structure | DOM changes, attribute modifications |
| Fetch | Request interception | Request paused, authentication required |
| Runtime | JavaScript execution | Console messages, exceptions |
| Browser | Browser management | Window creation, tabs, contexts |

Each domain must be explicitly enabled before it will emit events, which helps manage performance by only processing events that are actually needed.

## Domain Architecture

### The Enable/Disable Pattern

The explicit enable/disable pattern serves several important architectural purposes:

1. **Performance Optimization**: By only enabling domains you're interested in, you reduce the overhead of event processing
2. **Resource Management**: Some event domains (like Network or DOM monitoring) can generate large volumes of events that consume memory
3. **Protocol Compliance**: CDP requires explicit domain enabling before events are emitted
4. **Controlled Cleanup**: Explicitly disabling domains ensures proper cleanup when events are no longer needed

```mermaid
stateDiagram-v2
    [*] --> Disabled: Initial State
    Disabled --> Enabled: enable_xxx_events()
    Enabled --> Disabled: disable_xxx_events()
    Enabled --> [*]: Tab Closed
    Disabled --> [*]: Tab Closed
```

!!! warning "Event Leak Prevention"
    Failing to disable event domains when they're no longer needed can lead to memory leaks and performance degradation, especially in long-running automation. Always disable event domains when you're done with them, particularly for high-volume events like network monitoring.

### Domain-Specific Enabling Methods

Different domains are enabled through specific methods on the appropriate objects:

| Domain | Enable Method | Disable Method | Available On |
|--------|--------------|----------------|--------------|
| Page | `enable_page_events()` | `disable_page_events()` | Tab |
| Network | `enable_network_events()` | `disable_network_events()` | Tab |
| DOM | `enable_dom_events()` | `disable_dom_events()` | Tab |
| Fetch | `enable_fetch_events()` | `disable_fetch_events()` | Tab, Browser |
| File Chooser | `enable_intercept_file_chooser_dialog()` | `disable_intercept_file_chooser_dialog()` | Tab |

!!! info "Domain Ownership"
    Events belong to specific domains based on their functionality. Some domains are only available at certain levels - for instance, Page events are available on the Tab instance but not directly at the Browser level.

## Event Registration System

### The `on()` Method

The central method for subscribing to events is the `on()` method, available on both Tab and Browser instances:

```python
async def on(
    self, event_name: str, callback: callable, temporary: bool = False
) -> int:
    """
    Registers an event listener.

    Args:
        event_name (str): The event name to listen for.
        callback (callable): The callback function to execute when the
            event is triggered.
        temporary (bool): If True, the callback will be removed after it's
            triggered once. Defaults to False.

    Returns:
        int: The ID of the registered callback.
    """
```

This method returns a callback ID that can be used to remove the callback later if needed.

### Callback Registry

Internally, the `ConnectionHandler` maintains a callback registry keyed by callback ID:

```python
{
    1: {'event': 'Page.loadEventFired', 'callback': callback_function_1, 'temporary': False},
    2: {'event': 'Page.loadEventFired', 'callback': callback_function_2, 'temporary': True},
    3: {'event': 'Network.requestWillBeSent', 'callback': callback_function_3, 'temporary': False},
}
```

When an event arrives via WebSocket:

1. The event name is extracted from the message
2. The registry is queried for matching callbacks
3. Each callback is executed with the event data
4. Temporary callbacks are removed after execution

### Async Callback Handling

Callbacks can be either synchronous or asynchronous. The event system handles both:

```python
async def _trigger_callbacks(self, event_name: str, event_data: dict):
    for cb_id, cb_data in self._event_callbacks.items():
        if cb_data['event'] == event_name:
            if asyncio.iscoroutinefunction(cb_data['callback']):
                await cb_data['callback'](event_data)
            else:
                cb_data['callback'](event_data)
```

Asynchronous callbacks are awaited sequentially. This means each callback completes before the next one executes, which is important for:

- **Predictable Execution Order**: Callbacks execute in registration order
- **Error Handling**: Exceptions in one callback don't prevent others from executing
- **State Consistency**: Callbacks can rely on sequential state changes

!!! info "Sequential vs Concurrent Execution"
    Callbacks execute sequentially within the same event. However, different events can be processed concurrently since the event loop handles multiple connections simultaneously.

## Event Flow and Lifecycle

The event lifecycle follows these steps:

```mermaid
flowchart TD
    A[Browser Activity] -->|Generates| B[CDP Event]
    B -->|Sent via WebSocket| C[ConnectionHandler]
    C -->|Filters by Event Name| D{Registered Callbacks?}
    D -->|Yes| E[Process Event]
    D -->|No| F[Discard Event]
    E -->|For Each Callback| G[Execute Callback]
    G -->|If Temporary| H[Remove Callback]
    G -->|If Permanent| I[Retain for Future Events]
```

### Detailed Flow

1. **Browser Activity**: Something happens in the browser (page loads, request sent, DOM changes)
2. **CDP Event Generation**: Browser generates a CDP event message
3. **WebSocket Transmission**: Message is sent over WebSocket to Pydoll
4. **Event Reception**: The ConnectionHandler receives the event
5. **Callback Lookup**: ConnectionHandler checks its registry for callbacks matching the event name
6. **Callback Execution**: If callbacks exist, each is executed with the event data
7. **Temporary Removal**: If a callback was registered as temporary, it's removed after execution

## Browser-Level vs. Tab-Level Events

Pydoll's event system operates at both the browser and tab levels, with important distinctions:

```mermaid
graph TD
    Browser[Browser Instance] -->|"Global Events (e.g., Target events)"| BrowserCallbacks[Browser-Level Callbacks]
    Browser -->|"Creates"| Tab1[Tab Instance 1]
    Browser -->|"Creates"| Tab2[Tab Instance 2]
    Tab1 -->|"Tab-Specific Events"| Tab1Callbacks[Tab 1 Callbacks]
    Tab2 -->|"Tab-Specific Events"| Tab2Callbacks[Tab 2 Callbacks]
```

### Browser-Level Events

Browser-level events operate globally across all tabs. These are limited to specific domains like:

- **Target Events**: Tab creation, destruction, crash
- **Browser Events**: Window management, download coordination

```python
# Browser-level event registration
await browser.on('Target.targetCreated', handle_new_target)
```

Browser-level event domains are limited, and trying to use tab-specific events will raise an exception.

### Tab-Level Events

Tab-level events are specific to an individual tab:

```python
# Each tab has its own event context
tab1 = await browser.start()
tab2 = await browser.new_tab()

await tab1.enable_page_events()
await tab1.on(PageEvent.LOAD_EVENT_FIRED, handle_tab1_load)

await tab2.enable_page_events()
await tab2.on(PageEvent.LOAD_EVENT_FIRED, handle_tab2_load)
```

This architecture allows for:

- **Isolated Event Handling**: Events in one tab don't affect others
- **Per-Tab Configuration**: Different tabs can monitor different event types
- **Resource Efficiency**: Only enable events on tabs that need them

!!! info "Domain-Specific Scope"
    Not all event domains are available at both levels:
    
    - **Fetch Events**: Available at both browser and tab levels
    - **Page Events**: Available only at the tab level
    - **Target Events**: Available only at the browser level

## Performance Architecture

### Event System Overhead

The event system adds overhead to browser automation, especially for high-frequency events:

| Event Domain | Typical Event Volume | Performance Impact |
|--------------|---------------------|-------------------|
| Page | Low | Minimal |
| Network | High | Moderate to High |
| DOM | Very High | High |
| Fetch | Moderate | Moderate (higher if intercepting) |

### Performance Optimization Strategies

1. **Selective Domain Enabling**: Only enable event domains you're actively using
2. **Strategic Scoping**: Use browser-level events only for truly browser-wide concerns
3. **Timely Disabling**: Always disable event domains when you're finished with them
4. **Early Filtering**: In callbacks, filter out irrelevant events as early as possible
5. **Temporary Callbacks**: Use the `temporary=True` flag for one-time events

### Memory Management

The event system manages memory through several mechanisms:

1. **Callback Registry Cleanup**: Removing callbacks frees their references
2. **Temporary Auto-Removal**: Temporary callbacks are automatically cleaned up
3. **Domain Disabling**: Disabling a domain stops event generation
4. **Tab Closure**: When a tab closes, all its callbacks are automatically removed

!!! warning "Memory Leak Prevention"
    In long-running automation, always clean up callbacks and disable domains when done. High-frequency events (especially DOM) can accumulate significant memory if left enabled.

## Connection Handler Architecture

The `ConnectionHandler` is the central component managing WebSocket communication and event dispatching.

### Key Responsibilities

1. **WebSocket Management**: Establishing and maintaining the WebSocket connection
2. **Message Routing**: Distinguishing between command responses and events
3. **Callback Registry**: Maintaining the mapping of event names to callbacks
4. **Event Dispatching**: Executing registered callbacks when events arrive
5. **Cleanup**: Removing callbacks and closing connections

### Internal Structure

```python
class ConnectionHandler:
    def __init__(self, ...):
        self._events_handler = EventsManager()
        self._websocket = None
        # ... other attributes
    
    async def register_callback(self, event_name, callback, temporary):
        return self._events_handler.register_callback(event_name, callback, temporary)

class EventsManager:
    def __init__(self):
        self._event_callbacks = {}  # Callback ID -> callback data
        self._callback_id = 0
    
    def register_callback(self, event_name, callback, temporary):
        self._callback_id += 1
        self._event_callbacks[self._callback_id] = {
            'event': event_name,
            'callback': callback,
            'temporary': temporary
        }
        return self._callback_id
    
    async def _trigger_callbacks(self, event_name, event_data):
        callbacks_to_remove = []
        
        for cb_id, cb_data in self._event_callbacks.items():
            if cb_data['event'] == event_name:
                # Execute callback (await if async, call directly if sync)
                if asyncio.iscoroutinefunction(cb_data['callback']):
                    await cb_data['callback'](event_data)
                else:
                    cb_data['callback'](event_data)
                
                # Mark temporary callbacks for removal
                if cb_data['temporary']:
                    callbacks_to_remove.append(cb_id)
        
        # Remove temporary callbacks after all callbacks executed
        for cb_id in callbacks_to_remove:
            self.remove_callback(cb_id)
```

This architecture ensures:

- **Simple Lookup**: Callbacks are stored by ID and matched against the event name at dispatch time
- **Minimal Overhead**: Only registered events are processed
- **Automatic Cleanup**: Temporary callbacks are removed after execution
- **Async Safety**: Operations are safe to use from `asyncio` coroutines

## Event Message Format

CDP events follow a standardized message format:

```json
{
    "method": "Network.requestWillBeSent",
    "params": {
        "requestId": "1234.56",
        "loaderId": "7890.12",
        "documentURL": "https://example.com",
        "request": {
            "url": "https://api.example.com/data",
            "method": "GET",
            "headers": {...}
        },
        "timestamp": 123456.789,
        "wallTime": 1234567890.123,
        "initiator": {...},
        "type": "XHR"
    }
}
```

Key components:

- **`method`**: The event name in `Domain.eventName` format
- **`params`**: Event-specific data, varies by event type
- **No `id` field**: Unlike commands, events don't have request IDs

The event system extracts the `method` field to route to the appropriate callbacks, passing the entire message to each callback.

## Multi-Tab Event Coordination

Pydoll's architecture supports sophisticated multi-tab event coordination:

### Independent Tab Contexts

Each tab maintains its own:

- Event domain enablement state
- Callback registry
- Event communication channel
- Network logs (if network events enabled)

!!! info "Communication Architecture"
    Each tab has its own event communication channel to the browser. For technical details on how WebSocket connections and target IDs work at the protocol level, see [Browser Domain Architecture](./browser-domain.md).

### Shared Browser Context

Multiple tabs can share:

- Browser-level event listeners
- Cookie storage
- Cache
- Browser process

This architecture allows for:

1. **Parallel Event Processing**: Multiple tabs can process events simultaneously
2. **Isolated Failures**: Issues in one tab don't affect others
3. **Resource Sharing**: Common browser features are shared efficiently
4. **Coordinated Actions**: Browser-level events can coordinate cross-tab activities

## Conclusion

Pydoll's event system architecture is designed for:

- **Performance**: Minimal overhead through selective domain enabling and efficient callback dispatch
- **Flexibility**: Support for both browser-level and tab-level events
- **Scalability**: Handle multiple tabs with independent event contexts
- **Reliability**: Automatic cleanup and memory management

Understanding this architecture helps you:

- **Optimize Performance**: Know which domains have high overhead
- **Debug Issues**: Understand the event flow when things don't work as expected
- **Design Better Automation**: Leverage the architecture for efficient event-driven workflows
- **Avoid Pitfalls**: Prevent memory leaks and performance degradation

For practical usage patterns and examples, see the [Event System Guide](../features/advanced/event-system.md).


================================================
FILE: docs/en/deep-dive/architecture/find-elements-mixin.md
================================================
# FindElements Mixin Architecture

The FindElementsMixin represents a critical architectural decision in Pydoll: using a **mixin** (a small, capability-only class) to share element-finding capabilities between `Tab` and `WebElement` without forcing them into a common domain base class. This document explores the mixin pattern, its implementation, and the internal mechanics of element location.

!!! info "Practical Usage Guide"
    For practical examples and usage patterns, see the [Element Finding Guide](../features/automation/element-finding.md) and [Selectors Guide](./selectors-guide.md).

## Mixin Pattern: Design Philosophy

### What is a Mixin?

A mixin is a class designed to **provide methods to other classes** without being a base class in a traditional inheritance hierarchy. Unlike standard inheritance (which models "is-a" relationships), mixins model **"can-do" capabilities**.

```python
# Traditional inheritance: "is-a"
class Animal:
    def breathe(self): ...

class Dog(Animal):  # Dog IS-A Animal
    def bark(self): ...

# Mixin pattern: "can-do"
class FlyableMixin:
    def fly(self): ...

class Bird(Animal, FlyableMixin):  # Bird IS-A Animal, CAN fly
    pass
```

### Why Mixins Over Inheritance?

Pydoll faces a specific architectural challenge:

- **`Tab`** needs to find elements in the **document context**
- **`WebElement`** needs to find elements **relative to itself** (child elements)
- Both need **identical selector logic** (CSS, XPath, attribute building)

**Option 1: Shared Base Class**

```python
class ElementLocator:
    def find(...): ...

class Tab(ElementLocator):
    pass

class WebElement(ElementLocator):
    pass
```

**Problems:**

- Tight coupling: `Tab` and `WebElement` now share inheritance hierarchy
- Violates Single Responsibility: `Tab` shouldn't inherit from same class as `WebElement`
- Hard to extend: Adding new capabilities requires modifying base class

**Option 2: Mixin Pattern (Chosen Approach)**

```python
class FindElementsMixin:
    def find(...): ...
    def query(...): ...

class Tab(FindElementsMixin):
    # Tab-specific logic
    pass

class WebElement(FindElementsMixin):
    # WebElement-specific logic
    pass
```

**Benefits:**

- **Decoupling**: `Tab` and `WebElement` remain independent
- **Reusability**: Same element-finding logic in both classes
- **Composability**: Can add other mixins without conflicts
- **Testability**: Mixin can be tested in isolation

!!! tip "Mixin Characteristics"
    1. **Stateless**: Mixins don't maintain their own state (no `__init__`)
    2. **Dependency Injection**: Assumes consuming class provides dependencies (e.g., `_connection_handler`)
    3. **Single Purpose**: Each mixin provides one cohesive capability
    4. **Not Instantiable**: Never create `FindElementsMixin()` directly

## Mixin Implementation in Pydoll

### Class Structure

The FindElementsMixin uses **dependency injection** to work with any class that provides a `_connection_handler`:

```python
class FindElementsMixin:
    """
    Mixin providing element finding capabilities.
    
    Assumes the consuming class has:
    - _connection_handler: ConnectionHandler instance for CDP commands
    - _object_id: Optional[str] for context-relative searches (WebElement only)
    """
    
    if TYPE_CHECKING:
        _connection_handler: ConnectionHandler  # Type hint, not actual attribute
    
    async def find(self, ...):
        # Implementation uses self._connection_handler
        # Checks for self._object_id to determine context
```

**Key insight:** The mixin doesn't define `_connection_handler` or `_object_id`. It **assumes** they exist via duck typing.

### How Tab and WebElement Use the Mixin

```python
# Tab: Document-level searches
class Tab(FindElementsMixin):
    def __init__(self, browser, target_id, connection_port):
        self._connection_handler = ConnectionHandler(connection_port)
        # No _object_id → searches from document root

# WebElement: Element-relative searches
class WebElement(FindElementsMixin):
    def __init__(self, object_id, connection_handler, ...):
        self._object_id = object_id  # CDP object ID
        self._connection_handler = connection_handler
        # Has _object_id → searches relative to this element
```

**Critical distinction:**

- **Tab**: `hasattr(self, '_object_id')` → `False` → uses `RuntimeCommands.evaluate()` (document context)
- **WebElement**: `hasattr(self, '_object_id')` → `True` → uses `RuntimeCommands.call_function_on()` (element context)

### Context Detection

The mixin dynamically detects search context:

```python
async def _find_element(self, by, value, raise_exc=True):
    if hasattr(self, '_object_id'):
        # Relative search: call JavaScript function on THIS element
        command = self._get_find_element_command(by, value, self._object_id)
    else:
        # Document search: evaluate JavaScript in global context
        command = self._get_find_element_command(by, value)
    
    response = await self._execute_command(command)
    # ...
```

This single implementation handles both:

- `tab.find(id='submit')` → searches entire document
- `form_element.find(id='submit')` → searches within `form_element`

!!! warning "Mixin Dependency Coupling"
    The mixin is **tightly coupled** to CDP's object model. It assumes:
    
    - Elements are represented by `objectId` strings
    - `Runtime.evaluate()` for document searches
    - `Runtime.callFunctionOn()` for element-relative searches
    
    This is acceptable because Pydoll is **CDP-specific**. A more generic design would require abstraction layers.

## Public API Design

The mixin exposes two high-level methods with distinct design philosophies:

### find(): Attribute-Based Selection

```python
@overload
async def find(self, find_all: Literal[False], ...) -> WebElement: ...

@overload
async def find(self, find_all: Literal[True], ...) -> list[WebElement]: ...

async def find(
    self,
    id: Optional[str] = None,
    class_name: Optional[str] = None,
    name: Optional[str] = None,
    tag_name: Optional[str] = None,
    text: Optional[str] = None,
    timeout: int = 0,
    find_all: bool = False,
    raise_exc: bool = True,
    **attributes,
) -> Union[WebElement, list[WebElement], None]:
```

**Design decisions:**

1. **Kwargs over positional By enum**:
   ```python
   # Pydoll (intuitive)
   await tab.find(id='submit', class_name='primary')
   
   # Selenium (verbose)
   driver.find_element(By.ID, 'submit')  # Can't combine attributes easily
   ```

2. **Auto-resolution to optimal selector**:
   - Single attribute → uses `By.ID`, `By.CLASS_NAME`, etc. (fastest)
   - Multiple attributes → builds XPath (flexible but slower)

3. **`**attributes` for extensibility**:
   ```python
   await tab.find(data_testid='submit-btn', aria_label='Submit form')
   # Builds: //*[@data-testid='submit-btn' and @aria-label='Submit form']
   ```

### query(): Expression-Based Selection

```python
@overload
async def query(self, expression, find_all: Literal[False], ...) -> WebElement: ...

@overload
async def query(self, expression, find_all: Literal[True], ...) -> list[WebElement]: ...

async def query(
    self, 
    expression: str, 
    timeout: int = 0, 
    find_all: bool = False, 
    raise_exc: bool = True
) -> Union[WebElement, list[WebElement], None]:
```

**Design decisions:**

1. **Auto-detect CSS vs XPath**:
   ```python
   # XPath detection (starts with /, ./ or (/)
   await tab.query("//div[@id='content']")
   
   # CSS detection (default)
   await tab.query("div#content > p.intro")
   ```

2. **Single expression parameter** (unlike `find()`):
   - Assumes user knows selector syntax
   - No abstraction overhead

3. **Direct passthrough to browser**:
   - `querySelector()` / `querySelectorAll()` for CSS
   - `document.evaluate()` for XPath

### Overload Pattern for Type Safety

Both methods use `@overload` to provide **precise return types**:

```python
# IDE knows return type is WebElement
element = await tab.find(id='submit')

# IDE knows return type is list[WebElement]
elements = await tab.find(class_name='item', find_all=True)

# IDE knows return type is Optional[WebElement]
maybe_element = await tab.find(id='optional', raise_exc=False)
```

This is critical for IDE autocomplete and type checking. See [Type System Deep Dive](./typing-system.md) for details.

## Selector Resolution Architecture

The mixin converts user input into CDP commands through a resolution pipeline:

| Stage | Input | Output | Key Decision |
|-------|-------|--------|-------------|
| **1. Method Selection** | `find()` kwargs or `query()` expression | Selector strategy | Attribute-based vs expression-based |
| **2. Strategy Resolution** | Attributes or expression | `By` enum + value | Single attr → native method, Multiple → XPath |
| **3. Context Detection** | `By` + value + `hasattr(_object_id)` | CDP command type | Document vs element-relative search |
| **4. Command Generation** | CDP command type + selector | JavaScript + CDP method | `evaluate()` vs `callFunctionOn()` |
| **5. Execution** | CDP command | `objectId` or array of `objectId`s | Via ConnectionHandler |
| **6. WebElement Creation** | `objectId` + attributes | `WebElement` instance(s) | Factory function to avoid circular imports |

### Key Architectural Decisions

**1. Single vs Multiple Attributes**

```python
# Single attribute → Direct selector (fast)
await tab.find(id='username')  # Uses By.ID → getElementById()

# Multiple attributes → XPath (flexible)
await tab.find(tag_name='input', type='password', name='pwd')
# → //input[@type='password' and @name='pwd']
```

**Why this matters:**

- Native methods (`getElementById`, `getElementsByClassName`) are 10-50% faster than XPath
- XPath overhead is acceptable when combining attributes (no alternative)

**2. Auto-Detection of Selector Type**

```python
await tab.query("//div")       # Starts with / → XPath
await tab.query("#login")      # Default → CSS
```

**Implementation:**
```python
if expression.startswith(('./', '/', '(/')):
    return By.XPATH
return By.CSS_SELECTOR
```

The heuristic is **unambiguous**: a valid CSS selector cannot start with `/`, `./`, or `(/`.

**3. XPath Relative Path Adjustment**

For element-relative searches, absolute XPath must be converted:

```python
# User provides: //div
# For WebElement: .//div (relative to element, not document)

def _ensure_relative_xpath(xpath):
    return f'.{xpath}' if not xpath.startswith('.') else xpath
```

Without this, `element.find()` would search from document root.

## CDP Command Generation

The mixin routes to different CDP methods based on search context:

| Context | Selector Type | CDP Method | JavaScript Equivalent |
|---------|--------------|------------|---------------------|
| Document | CSS | `Runtime.evaluate` | `document.querySelector()` |
| Document | XPath | `Runtime.evaluate` | `document.evaluate()` |
| Element | CSS | `Runtime.callFunctionOn` | `this.querySelector()` |
| Element | XPath | `Runtime.callFunctionOn` | `document.evaluate(..., this)` |

**Key insight:** `Runtime.callFunctionOn` requires an `objectId` (the element to call on), while `Runtime.evaluate` executes in global scope.

### JavaScript Templates

Pydoll uses pre-defined templates for consistency and performance:

```python
# CSS selectors
Scripts.QUERY_SELECTOR = 'document.querySelector("{selector}")'
Scripts.RELATIVE_QUERY_SELECTOR = 'this.querySelector("{selector}")'

# XPath expressions
Scripts.FIND_XPATH_ELEMENT = '''
    document.evaluate("{escaped_value}", document, null,
                      XPathResult.FIRST_ORDERED_NODE_TYPE, null).singleNodeValue
'''
```

Templates avoid runtime string concatenation and centralize JavaScript code.

## Object ID Resolution and WebElement Creation

CDP represents DOM nodes as **`objectId` strings**. The mixin abstracts this:

**Single element flow:**

1. Execute CDP command → Extract `objectId` from response
2. Call `DOM.describeNode(objectId)` → Get attributes, tag name
3. Create `WebElement(objectId, connection_handler, attributes)`

**Multiple elements flow:**

1. Execute CDP command → Returns **array as single remote object**
2. Call `Runtime.getProperties(array_objectId)` → Enumerate array indices
3. Extract individual `objectId` for each element
4. Describe and create `WebElement` for each

**Why `Runtime.getProperties`?** CDP doesn't return arrays directly - it returns a **reference to an array object**. We must enumerate its properties to extract individual elements.

## Architectural Insights and Design Tradeoffs

### Why Kwargs Instead of By Enum?

**Pydoll's choice:**
```python
await tab.find(id='submit', class_name='primary')
```

**Selenium's approach:**
```python
driver.find_element(By.ID, 'submit')  # Can't combine attributes
```

**Rationale:**

- **Discoverability**: IDE autocomplete shows all available parameters
- **Composability**: Can combine multiple attributes in one call
- **Readability**: `id='submit'` is more intuitive than `(By.ID, 'submit')`

**Tradeoff:** Kwargs are less explicit about selector strategy. Solved by documentation and logging.

### Why Auto-Detect CSS vs XPath?

The `_get_expression_type()` heuristic eliminates user burden:

```python
await tab.query("//div")       # Auto: XPath
await tab.query("#login")      # Auto: CSS
await tab.query("div > p")     # Auto: CSS
```

**Benefits:**

- **Ergonomics**: Users don't need to specify selector type
- **Correctness**: Impossible to misuse (XPath with CSS method, vice versa)

**Limitation:** No way to force CSS interpretation of ambiguous selectors (rare edge case).

### Circular Import Prevention: create_web_element()

The mixin uses a **factory function** to avoid circular imports:

```python
def create_web_element(*args, **kwargs):
    """Dynamically import WebElement at runtime."""
    from pydoll.elements.web_element import WebElement  # Late import
    return WebElement(*args, **kwargs)
```

**Why needed?**

- `FindElementsMixin` → needs to create `WebElement`
- `WebElement` → inherits from `FindElementsMixin`
- Circular dependency!

**Solution:** Late import inside factory function. Import only executes when function is called, breaking the cycle.

### hasattr() for Context Detection: Elegant or Hacky?

The mixin uses `hasattr(self, '_object_id')` to detect Tab vs WebElement:

```python
if hasattr(self, '_object_id'):
    # WebElement: element-relative search
else:
    # Tab: document-level search
```

**Is this "hacky"?**

- **No**: It's **duck typing** (Pythonic idiom)
- Mixin doesn't need to know class hierarchy
- Both Tab and WebElement provide `_connection_handler`
- WebElement additionally provides `_object_id`

**Alternative approaches:**

1. **Type checking**: `if isinstance(self, WebElement)` → Couples mixin to WebElement
2. **Abstract method**: Requires Tab/WebElement to implement `get_search_context()` → More boilerplate
3. **Dependency injection**: Pass context as parameter → Breaks API ergonomics

**Verdict:** `hasattr()` is the best solution for this use case.

## Key Takeaways

1. **Mixins enable code sharing** without coupling `Tab` and `WebElement` through inheritance
2. **Context detection via duck typing** (`hasattr`) keeps mixin decoupled from class hierarchy
3. **Auto-resolution optimizes performance** by using native methods for single attributes
4. **XPath building provides composability** for multi-attribute queries
5. **Polling-based waiting** trades CPU cycles for implementation simplicity
6. **CDP object model complexity** is hidden behind WebElement abstraction
7. **Type safety via overloads** provides precise return types for IDE support

## Related Documentation

For deeper understanding of related architectural components:

- **[Type System](./typing-system.md)**: Overload pattern, TypedDict, Generic types
- **[WebElement Domain](./webelement-domain.md)**: WebElement architecture and interaction methods
- **[Selectors Guide](./selectors-guide.md)**: CSS vs XPath syntax and best practices
- **[Tab Domain](./tab-domain.md)**: Tab-level operations and context management

For practical usage patterns:

- **[Element Finding Guide](../features/automation/element-finding.md)**: Practical examples and patterns
- **[Human-Like Interactions](../features/automation/human-interactions.md)**: Realistic element interaction

================================================
FILE: docs/en/deep-dive/architecture/index.md
================================================
# Internal Architecture

**Understand the design, then break the rules intentionally.**

Most documentation shows you **what** a framework does. This section reveals **how** and **why** Pydoll is architected the way it is: the design patterns, architectural decisions, and tradeoffs that shape every line of code.

## Why Architecture Matters

You can use Pydoll effectively without understanding its internal architecture. But when you need to:

- **Debug** complex issues that span multiple components
- **Optimize** performance bottlenecks in large-scale automation
- **Extend** Pydoll with custom functionality
- **Contribute** improvements to the codebase
- **Build** similar tools for different use cases

...architectural knowledge becomes **indispensable**.

!!! quote "Architecture as Language"
    **"Architecture is frozen music."** - Johann Wolfgang von Goethe
    
    Good architecture isn't just about making code work; it's about making code **understandable**, **maintainable**, and **extensible**. Understanding Pydoll's architecture teaches you patterns you'll apply to every project.

## The Six Architectural Domains

Pydoll's architecture is organized into **six cohesive domains**, each with clear responsibilities and interfaces:

### 1. Browser Domain
**[→ Explore Browser Architecture](./browser-domain.md)**

**The orchestrator: managing processes, contexts, and global state.**

The Browser domain sits at the top of the hierarchy, coordinating:

- **Process management**: Launching/terminating browser executables
- **Browser contexts**: Isolated environments (like incognito windows)
- **Tab registry**: Singleton pattern for Tab instances
- **Proxy authentication**: Automatic auth via Fetch domain
- **Global operations**: Downloads, permissions, window management

**Key architectural patterns**:

- **Abstract base class** for Chrome/Edge/other Chromium browsers
- **Manager pattern** (ProcessManager, ProxyManager, TempDirManager)
- **Singleton registry** for Tab instances (prevents duplicates)
- **Context manager protocol** for automatic cleanup

**Critical insight**: The Browser doesn't directly manipulate pages; it **coordinates** lower-level components. This separation of concerns enables multi-browser support and concurrent tab operations.

---

### 2. Tab Domain
**[→ Explore Tab Architecture](./tab-domain.md)**

**The workhorse: executing commands, managing state, coordinating automation.**

The Tab domain is Pydoll's primary interface, handling:

- **Navigation**: Page loading with configurable wait states
- **Element finding**: Delegated to FindElementsMixin
- **JavaScript execution**: Both page and element contexts
- **Event coordination**: Tab-specific event listeners
- **Network monitoring**: Request/response capture and analysis
- **IFrame handling**: Nested context management

**Key architectural patterns**:

- **Façade pattern**: Simplified interface to complex CDP operations
- **Mixin composition**: FindElementsMixin for element location
- **Per-tab WebSocket**: Independent connections for parallelism
- **State flags**: Track enabled domains (network_events_enabled, etc.)
- **Lazy initialization**: Request object created on first access

**Critical insight**: Each Tab owns its **own ConnectionHandler**, enabling true parallel operations across tabs without contention or state leakage.

---

### 3. WebElement Domain
**[→ Explore WebElement Architecture](./webelement-domain.md)**

**The interactor: bridging Python code and DOM elements.**

The WebElement domain represents **individual DOM elements**, providing:

- **Interaction methods**: Click, type, scroll, select
- **Property access**: Text, HTML, bounds, attributes
- **State queries**: Visibility, enabled status, value
- **Screenshots**: Element-specific image capture
- **Child finding**: Relative element location (also via FindElementsMixin)

**Key architectural patterns**:

- **Proxy pattern**: Python object representing remote browser element
- **Object ID abstraction**: CDP's objectId hidden behind Python API
- **Hybrid properties**: Sync (attributes) vs async (dynamic state)
- **Command pattern**: Interaction methods wrap CDP commands
- **Fallback strategies**: Multiple approaches for robustness

**Critical insight**: WebElement maintains **both cached attributes** (from creation) and **dynamic state** (fetched on demand), balancing performance with freshness.

---

### 4. FindElements Mixin
**[→ Explore FindElements Architecture](./find-elements-mixin.md)**

**The locator: translating selectors into DOM queries.**

The FindElementsMixin provides element-finding capabilities to both Tab and WebElement as a shared **mixin**, rather than through a deep inheritance hierarchy:

- **Attribute-based finding**: `find(id='submit', class_name='btn')`
- **Expression-based querying**: `query('div.container > p')`
- **Strategy resolution**: Optimal selector for single vs. multiple attributes
- **Waiting mechanisms**: Polling with configurable timeouts
- **Context detection**: Document vs. element-relative searches

**Key architectural patterns**:

- **Mixin pattern**: Shared capability without inheritance hierarchy
- **Strategy pattern**: Different selector strategies based on input
- **Template method**: Common flow, strategy-specific implementation
- **Factory function**: Late import to avoid circular dependencies
- **Overload pattern**: Type-safe return types (WebElement vs list)

**Critical insight**: The mixin uses **duck typing** (`hasattr(self, '_object_id')`) to detect Tab vs WebElement, enabling code reuse without tight coupling.

---

### 5. Event Architecture
**[→ Explore Event Architecture](./event-architecture.md)**

**The dispatcher: routing browser events to Python callbacks.**

The Event Architecture enables reactive automation through:

- **Event registration**: `on()` method for subscribing to CDP events
- **Callback dispatch**: Async execution without blocking
- **Domain management**: Explicit enable/disable for performance
- **Temporary callbacks**: Auto-removal after first invocation
- **Multi-level scope**: Browser-wide vs tab-specific events

**Key architectural patterns**:

- **Observer pattern**: Subscribe/notify for event-driven code
- **Registry pattern**: Event name → callback list mapping
- **Wrapper pattern**: Auto-wrap sync callbacks for async execution
- **Cleanup protocol**: Automatic callback removal on tab close
- **Scope isolation**: Independent event contexts per tab

**Critical insight**: Events are **push-based** (browser notifies Python), not poll-based, enabling low-latency reactive automation without busy-waiting.

---

### 6. Browser Requests Architecture
**[→ Explore Requests Architecture](./browser-requests-architecture.md)**

**The hybrid: HTTP requests with browser session state.**

The Browser Requests system bridges HTTP and browser automation:

- **Session continuity**: Cookies and auth automatically included
- **Dual data sources**: JavaScript Fetch API + CDP network events
- **Complete metadata**: Headers, cookies, timing (not all available via JavaScript)
- **`requests`-like API**: Familiar interface with browser power

**Key architectural patterns**:

- **Hybrid execution**: JavaScript for body, CDP for metadata
- **Temporary event registration**: Enable/capture/disable pattern
- **Lazy property initialization**: Request object created on first use
- **Adapter pattern**: Requests-compatible interface to browser fetch

**Critical insight**: Browser requests combine **two information sources** (JavaScript and CDP events). JavaScript provides the response body, CDP provides headers and cookies that JavaScript security policies hide.

---

## Architectural Principles

These six domains follow consistent principles:

### 1. Separation of Concerns
Each domain has a **single, well-defined responsibility**:

- Browser → Process/context management
- Tab → Command execution and state
- WebElement → Element interaction
- FindElements → Element location
- Events → Reactive dispatch
- Requests → HTTP in browser context

**Benefit**: Changes in one domain rarely require changes in others.

### 2. Composition Over Inheritance
Instead of deep inheritance hierarchies, Pydoll uses:

- **Mixins** (FindElementsMixin shared by Tab and WebElement)
- **Managers** (ProcessManager, ProxyManager, TempDirManager)
- **Dependency injection** (ConnectionHandler passed to components)

**Benefit**: Flexible component reuse without tight coupling.

### 3. Async by Default
All I/O operations are `async def` and must be `await`ed:

- WebSocket communication
- CDP command execution
- Event callback dispatch
- Network requests

**Benefit**: Enables true concurrency with multiple tabs, parallel operations, and non-blocking I/O.

### 4. Type Safety
Every public API has type annotations:

- Function parameters and return types
- CDP responses as `TypedDict`
- Event types for callback parameters
- Overloads for polymorphic methods

**Benefit**: IDE autocomplete, static type checking, self-documenting code.

### 5. Resource Management
Context managers ensure cleanup:

- `async with Browser()` → closes browser on exit
- `async with tab.expect_file_chooser()` → disables interceptor
- `async with tab.expect_download()` → cleans temp files

**Benefit**: Automatic resource cleanup, prevents leaks even on exceptions.

## Component Interaction

Understanding how domains interact is key:

```mermaid
graph TB
    User[Your Python Code]
    
    User --> Browser[Browser Domain]
    User --> Tab[Tab Domain]
    User --> Element[WebElement Domain]
    
    Browser --> ProcessMgr[Process Manager]
    Browser --> ContextMgr[Context Manager]
    Browser --> TabRegistry[Tab Registry]
    
    Tab --> ConnHandler[Connection Handler]
    Tab --> FindMixin[FindElements Mixin]
    Tab --> EventSystem[Event System]
    Tab --> RequestSystem[Request System]
    
    Element --> ConnHandler2[Connection Handler]
    Element --> FindMixin2[FindElements Mixin]
    
    ConnHandler --> WebSocket[WebSocket to CDP]
    ConnHandler2 --> WebSocket
    EventSystem --> ConnHandler
    RequestSystem --> ConnHandler
    RequestSystem --> EventSystem
    
    WebSocket --> Chrome[Chrome Browser]
```

**Key interactions**:

1. **Browser creates Tabs** → Tabs stored in registry
2. **Tab and WebElement both use FindElementsMixin** → Shared element location
3. **Each Tab owns a ConnectionHandler** → Independent WebSocket connections
4. **Request system uses Event system** → Network events capture metadata
5. **All components use ConnectionHandler** → Centralized CDP communication

## Prerequisites

To fully benefit from this section:

- **[Core Fundamentals](../fundamentals/cdp.md)** - Understand CDP, async, and types
- **Python design patterns** - Familiarity with common patterns
- **OOP concepts** - Classes, inheritance, composition, interfaces
- **Async Python** - Comfortable with `async def` and `await`

**If you haven't read Fundamentals**, start there first. Architecture builds on those concepts.

## Beyond Architecture

After mastering internal architecture, you'll be ready for:

- **Contributing code**: Understand where new features fit
- **Performance optimization**: Identify bottlenecks and inefficiencies
- **Custom extensions**: Build on Pydoll's patterns
- **Similar tools**: Apply these patterns to other projects

## Philosophy of Design

Good architecture is **invisible**: it shouldn't get in your way. Pydoll's architecture prioritizes:

1. **Simplicity**: Each component does one thing well
2. **Consistency**: Similar operations have similar patterns
3. **Explicitness**: No magic, no hidden behavior
4. **Type safety**: Catch errors at design time, not runtime
5. **Performance**: Async by default, parallelism without locks

These aren't arbitrary choices; they're **battle-tested principles** from decades of software engineering.

---

## Ready to Understand the Design?

Start with **[Browser Domain](./browser-domain.md)** to understand how process management and context isolation work, then progress through the domains in order.

**This is where usage becomes mastery.**

---

!!! success "After Completing Architecture"
    Once you understand these patterns, you'll see them everywhere in software engineering, not just Pydoll. These are **universal patterns** applied to browser automation:
    
    - Façade (Tab simplifies CDP complexity)
    - Observer (Event system for reactive code)
    - Mixin (FindElementsMixin for code reuse)
    - Registry (Browser tracks Tab instances)
    - Strategy (FindElements resolves optimal selectors)
    
    Good architecture is **timeless knowledge**.


================================================
FILE: docs/en/deep-dive/architecture/shadow-dom.md
================================================
# Shadow DOM Architecture

The Shadow DOM is one of the most challenging aspects of modern web automation. Elements inside shadow trees are invisible to regular DOM queries, which breaks traditional automation approaches. This document explains how Shadow DOM works at the browser level, why conventional tools fail with closed shadow roots, and how Pydoll bypasses these restrictions through direct CDP access.

!!! info "Practical Usage Guide"
    For usage examples and quick-start patterns, see the [Element Finding Guide — Shadow DOM section](../../features/element-finding.md#shadow-dom-support).

## What is Shadow DOM?

Shadow DOM is a web standard that enables **DOM encapsulation**. It allows a component to have its own isolated DOM tree (the "shadow tree") attached to a regular DOM element (the "shadow host"). Elements inside a shadow tree are hidden from the main document's queries.

```mermaid
graph TB
    subgraph "Main DOM (Light DOM)"
        Document["document"]
        Host["div#my-component\n(shadow host)"]
        Other["p.normal-content"]
    end

    subgraph "Shadow Tree (Encapsulated)"
        SR["#shadow-root (open)"]
        Style["style"]
        Button["button.internal"]
        Input["input.private"]
    end

    Document --> Host
    Document --> Other
    Host -.->|"attachShadow()"| SR
    SR --> Style
    SR --> Button
    SR --> Input
```

### Shadow Root Modes

When a component creates a shadow root via `attachShadow()`, it specifies a **mode**:

| Mode | JavaScript Access | CDP Access | Common Usage |
|------|-------------------|------------|--------------|
| `open` | `element.shadowRoot` returns the root | Full access via `backendNodeId` | Custom web components (Lit, Stencil) |
| `closed` | `element.shadowRoot` returns `null` | Full access via `backendNodeId` | Security-sensitive components, payment forms |
| `user-agent` | Not accessible via JS | Limited access | Browser-internal UI (input placeholders, video controls) |

This distinction is critical: **JavaScript-level access is restricted by mode, but CDP-level access is not.**

### Why Regular Automation Fails

Traditional automation tools rely on JavaScript execution in the page context:

```javascript
// WebDriver / Selenium approach
document.querySelector('#my-component')        // ✓ Finds the host
document.querySelector('#my-component button') // ✗ Cannot cross shadow boundary
element.shadowRoot                             // ✗ Returns null for closed roots
```

The shadow boundary is enforced by the browser's JavaScript engine. Any automation tool that executes JavaScript to find elements will hit this wall. This includes Selenium, Playwright's `page.evaluate()`, and any tool using `Runtime.evaluate()` with `document.querySelector()` at the document level.

## How Pydoll Bypasses Shadow Boundaries

Pydoll's approach works at a layer **below JavaScript**: the Chrome DevTools Protocol. CDP has direct access to the browser's internal DOM representation, which ignores shadow mode restrictions entirely.

### The CDP Advantage

```mermaid
sequenceDiagram
    participant User as User Code
    participant SR as ShadowRoot
    participant CH as ConnectionHandler
    participant CDP as Chrome CDP
    participant DOM as Browser DOM

    User->>SR: shadow_root.query('.btn')
    SR->>SR: _get_find_element_command(object_id)
    SR->>CH: execute_command(Runtime.callFunctionOn)
    CH->>CDP: WebSocket send
    CDP->>DOM: Execute querySelector on shadow root object
    DOM-->>CDP: Element result
    CDP-->>CH: Response with objectId
    CH-->>SR: Element data
    SR-->>User: WebElement instance
```

The key insight is in **how the shadow root object is obtained** and **how queries are executed against it**:

1. **Discovery**: `DOM.describeNode` with `pierce=true` returns shadow root nodes with their `backendNodeId`, regardless of mode
2. **Resolution**: `DOM.resolveNode` converts a `backendNodeId` to a JavaScript `objectId` that references the shadow root directly
3. **Querying**: `Runtime.callFunctionOn` executes `this.querySelector()` on the shadow root's `objectId`; this works because the call is made **on the shadow root object itself**, not from the document context

### Step-by-Step: Shadow Root Access

```mermaid
flowchart TD
    A["WebElement\n(shadow host)"]
    B["shadowRoots[] with\nbackendNodeId"]
    C["JavaScript objectId\nfor shadow root"]
    D["ShadowRoot instance"]
    E["WebElement\n(inside shadow)"]

    A -->|"DOM.describeNode\ndepth=1, pierce=true"| B
    B -->|"DOM.resolveNode\nbackendNodeId"| C
    C -->|"Create ShadowRoot\nwith objectId"| D
    D -->|"query()\nvia callFunctionOn"| E
```

#### Step 1: Describe the Host Node

```python
# Pydoll sends this CDP command:
{
    "method": "DOM.describeNode",
    "params": {
        "objectId": "<host-element-object-id>",
        "depth": 1,
        "pierce": true  # ← This is the key flag
    }
}
```

The `pierce` parameter tells CDP to traverse shadow boundaries when describing the node. The response includes shadow root information regardless of the shadow root mode:

```json
{
    "result": {
        "node": {
            "nodeName": "DIV",
            "shadowRoots": [
                {
                    "nodeId": 0,
                    "backendNodeId": 5,
                    "shadowRootType": "closed",
                    "childNodeCount": 4
                }
            ]
        }
    }
}
```

!!! warning "nodeId vs backendNodeId"
    When the DOM domain is not explicitly enabled (which is Pydoll's default to minimize overhead), `nodeId` is always `0`. The `backendNodeId` is the stable, always-available identifier. Pydoll uses `backendNodeId` exclusively for shadow root resolution, which is why it works without requiring `DOM.enable()`.

#### Step 2: Resolve to JavaScript Object

```python
# Convert backendNodeId to a usable objectId:
{
    "method": "DOM.resolveNode",
    "params": {
        "backendNodeId": 5
    }
}
```

The response provides an `objectId`, a handle to the shadow root in JavaScript's object space:

```json
{
    "result": {
        "object": {
            "objectId": "-2296764575741119861.1.3"
        }
    }
}
```

#### Step 3: Query Within the Shadow Root

With the shadow root's `objectId`, Pydoll leverages `FindElementsMixin`'s existing relative search mechanism:

```python
# When ShadowRoot.query('.btn') is called:
{
    "method": "Runtime.callFunctionOn",
    "params": {
        "functionDeclaration": "function() { return this.querySelector(\".btn\"); }",
        "objectId": "-2296764575741119861.1.3"
    }
}
```

The function runs with `this` bound to the shadow root object. Since shadow roots implement the `querySelector()` and `querySelectorAll()` interfaces natively, CSS selectors work naturally within the shadow boundary.

## ShadowRoot Architecture

### Design Decision: Reuse FindElementsMixin

The most critical architectural decision was making `ShadowRoot` inherit from `FindElementsMixin`:

```python
class ShadowRoot(FindElementsMixin):
    def __init__(self, object_id, connection_handler, mode, host_element):
        self._object_id = object_id               # Shadow root CDP reference
        self._connection_handler = connection_handler  # For CDP communication
        self._mode = mode                          # ShadowRootType enum
        self._host_element = host_element          # Back-reference to host
```

**Why this works**: `FindElementsMixin._find_element()` checks `hasattr(self, '_object_id')`. When present, it uses `RELATIVE_QUERY_SELECTOR`, which calls `this.querySelector()` on the referenced object. Since shadow roots support `querySelector()` natively, `query()` with CSS selectors works automatically without any shadow-specific code.

```python
# This single line in FindElementsMixin enables shadow root searches:
elif hasattr(self, '_object_id'):
    command = self._get_find_element_command(by, value, self._object_id)
```

`ShadowRoot` inherits `query()` and `find_or_wait_element()` from `FindElementsMixin`. However, `find()` and XPath-based `query()` are explicitly **blocked** on `ShadowRoot` (via the `_css_only` class flag) because shadow roots only support `querySelector()` / `querySelectorAll()` — XPath does not work inside shadow boundaries.

!!! tip "Architectural Consistency"
    This is the same mechanism that makes `WebElement.find()` search within an element's children: the `_object_id` attribute signals "search relative to me" rather than "search the whole document." `ShadowRoot`, `WebElement`, and `Tab` all share element-finding behavior through `FindElementsMixin`, with `ShadowRoot` restricted to CSS selectors only.

### Class Relationships

| Class | Has `_object_id` | Has `_connection_handler` | Find Scope |
|-------|:-:|:-:|---|
| `Tab` | No | Yes | Entire document |
| `WebElement` | Yes | Yes | Within element's subtree |
| `ShadowRoot` | Yes | Yes | Within shadow tree |

All three inherit from `FindElementsMixin`. The presence or absence of `_object_id` determines whether searches are document-global or scoped to a specific node.

### Resolving Shadow Roots: backendNodeId Strategy

Pydoll deliberately uses `backendNodeId` instead of `nodeId` for shadow root resolution:

| Property | `nodeId` | `backendNodeId` |
|----------|----------|-----------------|
| Requires `DOM.enable()` | Yes | No |
| Stable across describe calls | No (0 when DOM not enabled) | Yes |
| Works for shadow root resolution | Only when DOM enabled | Always |
| Performance overhead | Higher (DOM domain tracking) | None |

By relying on `backendNodeId`, Pydoll avoids the overhead of enabling the DOM domain while maintaining reliable shadow root access. This is a pragmatic choice: most automation scenarios don't need the DOM domain's event stream, and enabling it adds memory and processing overhead for tracking every DOM mutation.

## Closed Shadow Roots: Why CDP Access Works

This is the most commonly asked question: **if `element.shadowRoot` returns `null` for closed shadow roots in JavaScript, how can CDP access them?**

The answer lies in understanding the browser's architecture:

```mermaid
graph TB
    subgraph "JavaScript Runtime"
        JS["JavaScript Code"]
        API["Web APIs\n(shadowRoot property)"]
    end

    subgraph "Browser Internals"
        CDP_Layer["CDP Protocol Layer"]
        DOM_Internal["Internal DOM Tree"]
    end

    JS -->|"element.shadowRoot"| API
    API -->|"mode == 'closed'\n→ return null"| JS
    CDP_Layer -->|"DOM.describeNode\npierce=true"| DOM_Internal
    DOM_Internal -->|"Always returns\nfull shadow tree"| CDP_Layer
```

**JavaScript access** goes through the Web API layer, which enforces the shadow mode restriction. When `mode='closed'`, the API returns `null`; this is an intentional access control boundary for web page code.

**CDP access** operates below the Web API layer. It communicates directly with the browser's internal DOM representation. The `closed` mode restriction is a **JavaScript-level policy**, not a **DOM-level restriction**. The shadow tree still exists in the DOM; it's just hidden from JavaScript's view.

!!! info "Security Implications"
    This is by design in the DevTools Protocol. CDP is intended for debugging and automation tools that need full DOM access. The `closed` mode protects shadow contents from other scripts on the same page (e.g., third-party scripts), not from the browser's debugging interface. This is the same reason browser DevTools can inspect closed shadow roots in the Elements panel.

### Practical Verification

You can verify this behavior yourself:

```python
import asyncio
from pydoll.browser.chromium import Chrome
from pydoll.protocol.dom.types import ShadowRootType

async def verify_closed_access():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('about:blank')

        # Create a closed shadow root via JavaScript
        await tab.execute_script("""
            const host = document.createElement('div');
            host.id = 'test-host';
            document.body.appendChild(host);
            const shadow = host.attachShadow({ mode: 'closed' });
            shadow.innerHTML = '<p class="secret">Hidden content</p>';
        """)

        # JavaScript cannot access it:
        result = await tab.execute_script(
            "return document.getElementById('test-host').shadowRoot",
            return_by_value=True,
        )
        js_value = result['result']['result'].get('value')
        print(f"JS shadowRoot: {js_value}")  # None

        # But Pydoll can:
        host = await tab.find(id='test-host')
        shadow = await host.get_shadow_root()
        print(f"Shadow mode: {shadow.mode}")  # ShadowRootType.CLOSED

        secret = await shadow.query('.secret')
        text = await secret.text
        print(f"Content: {text}")  # "Hidden content"

asyncio.run(verify_closed_access())
```

## Nested Shadow Roots

Web components frequently compose other web components, creating multi-level shadow trees:

```mermaid
graph TB
    subgraph "Light DOM"
        Host1["outer-component\n(shadow host)"]
    end

    subgraph "Outer Shadow Tree"
        SR1["#shadow-root (open)"]
        Host2["inner-component\n(shadow host)"]
        P1["p.outer-text"]
    end

    subgraph "Inner Shadow Tree"
        SR2["#shadow-root (closed)"]
        Button["button.deep-btn"]
        P2["p.inner-text"]
    end

    Host1 -.-> SR1
    SR1 --> P1
    SR1 --> Host2
    Host2 -.-> SR2
    SR2 --> P2
    SR2 --> Button
```

Pydoll handles this naturally by chaining `get_shadow_root()` calls. Each `ShadowRoot` produces `WebElement` instances that can themselves have shadow roots:

```python
outer_host = await tab.find(tag_name='outer-component')
outer_shadow = await outer_host.get_shadow_root()        # open

inner_host = await outer_shadow.query('inner-component')
inner_shadow = await inner_host.get_shadow_root()        # closed, still works

deep_button = await inner_shadow.query('.deep-btn')
await deep_button.click()
```

Each level follows the same CDP resolution flow: `describeNode` then `resolveNode` then `ShadowRoot` with `_object_id` then `querySelector` via `callFunctionOn`.

## Shadow Roots Inside IFrames

A common real-world scenario involves shadow roots inside cross-origin iframes — for example, Cloudflare Turnstile captchas. This combines two isolation mechanisms: the iframe boundary and the shadow boundary.

```mermaid
graph TB
    subgraph "Main Page"
        Host["div.widget\n(shadow host)"]
    end

    subgraph "Shadow Tree"
        SR1["#shadow-root"]
        IFrame["iframe\n(cross-origin)"]
    end

    subgraph "IFrame (OOPIF)"
        Body["body"]
    end

    subgraph "IFrame Shadow Tree"
        SR2["#shadow-root"]
        Button["label.checkbox"]
    end

    Host -.-> SR1
    SR1 --> IFrame
    IFrame -.->|"separate process"| Body
    Body -.-> SR2
    SR2 --> Button
```

Pydoll handles this transparently through **iframe context propagation**. When a `ShadowRoot` is created, it inherits the iframe routing context from its host element:

```python
# The full chain: main page → shadow root → iframe → shadow root → element
shadow_host = await tab.find(id='widget-container')
first_shadow = await shadow_host.get_shadow_root()

iframe = await first_shadow.query('iframe')
body = await iframe.find(tag_name='body')
second_shadow = await body.get_shadow_root()

# click() works correctly — mouse events route through the OOPIF session
button = await second_shadow.query('label.checkbox')
await button.click()
```

### How Context Propagation Works

Cross-origin iframes run in a separate browser process (Out-of-Process IFrame, or OOPIF). CDP commands for these iframes must be routed through a dedicated `sessionId`. Pydoll propagates this routing context automatically through the entire chain:

1. **IFrame resolves its context**: `iframe.find()` establishes an `IFrameContext` with `session_id` and `session_handler` for the OOPIF
2. **Child elements inherit context**: Elements found inside the iframe receive the `IFrameContext`
3. **Shadow roots inherit from host**: `ShadowRoot` copies its host element's `_iframe_context`
4. **Elements in shadow inherit from shadow root**: Elements found via `shadow.query()` receive the propagated context
5. **Commands route correctly**: `_execute_command()` detects the inherited context and routes CDP commands (including `Input.dispatchMouseEvent` for `click()`) through the OOPIF session

This means coordinates from `DOM.getBoxModel` (which are relative to the iframe viewport) are correctly paired with mouse events dispatched to the same OOPIF session.

## Finding Shadow Roots: find_shadow_roots()

`Tab.find_shadow_roots()` traverses the entire DOM tree to collect all shadow roots found on the page.

### How It Works

```
Tab.find_shadow_roots()
  ├─ DOM.getDocument(depth=-1, pierce=true)
  │   └─ Returns full DOM tree with shadowRoots arrays
  ├─ Recursive tree walk: _collect_shadow_roots_from_tree()
  │   ├─ Collects shadowRoots entries with host backendNodeId
  │   ├─ Traverses children recursively
  │   └─ Traverses contentDocument (same-origin iframes)
  ├─ For each shadow root entry:
  │   ├─ DOM.resolveNode(backendNodeId) → objectId
  │   └─ Resolve host element (best-effort)
  └─ Returns list[ShadowRoot] with host references
```

### Timeout: Waiting for Shadow Roots

Shadow hosts are often injected asynchronously. `Tab.find_shadow_roots()` accepts a `timeout` parameter that polls every 0.5s until at least one shadow root is found; if the timeout expires first, it raises `WaitElementTimeout`. `WebElement.get_shadow_root()` supports the same `timeout` parameter for waiting on a specific element's shadow root:

```python
# Wait up to 10 seconds for shadow roots to appear
shadow_roots = await tab.find_shadow_roots(timeout=10)

# Wait for a shadow root on a specific element
shadow = await element.get_shadow_root(timeout=5)
```

### Key Details

- **`pierce=True`** in `DOM.getDocument` causes the browser to include `shadowRoots` arrays in node descriptions, allowing discovery of all shadow roots without navigating to each host individually.
- **Same-origin iframe content** is included in the tree via `contentDocument` nodes. The traversal handles these.
- Each returned `ShadowRoot` has a reference to its `host_element` (resolved best-effort via `DOM.resolveNode`).

### Deep Traversal: Cross-Origin IFrames (OOPIFs)

By default, cross-origin iframes (OOPIFs) are **not** included in the DOM tree — their content lives in a separate browser process. Pass `deep=True` to also discover shadow roots inside OOPIFs:

```python
shadow_roots = await tab.find_shadow_roots(deep=True, timeout=10)
```

When `deep=True` is set, the method performs additional steps:

```
Tab.find_shadow_roots(deep=True)
  ├─ ... (main document traversal as above) ...
  └─ _collect_oopif_shadow_roots()
      ├─ Browser-level ConnectionHandler (no page_id → browser endpoint)
      ├─ Target.getTargets() → filter type='iframe'
      └─ For each iframe target:
          ├─ Target.attachToTarget(targetId, flatten=True) → sessionId
          ├─ DOM.getDocument(depth=-1, pierce=True) with sessionId
          ├─ _collect_shadow_roots_from_tree() on OOPIF DOM
          └─ For each shadow root found:
              ├─ DOM.resolveNode(backendNodeId) with sessionId
              ├─ Resolve host element (best-effort) with sessionId
              ├─ Create IFrameContext(frame_id, session_handler, session_id)
              └─ Set IFrameContext on host element (or ShadowRoot directly)
```

The returned `ShadowRoot` objects carry the OOPIF routing context (`IFrameContext`), so elements found via `shadow_root.query()` will automatically route CDP commands through the correct OOPIF session. This is critical for scenarios like Cloudflare Turnstile captchas, where the checkbox lives inside a closed shadow root within a cross-origin iframe.

## Limitations and Edge Cases

### Selector Strategies Inside Shadow Roots

!!! warning "CSS Selectors Only Inside Shadow Roots"
    `find()` and XPath are **not supported** on `ShadowRoot` and will raise `NotImplementedError`. Always use `query()` with CSS selectors to search inside shadow roots.

Shadow roots natively implement `querySelector()` and `querySelectorAll()`, but **not** XPath evaluation. Pydoll enforces this by blocking `find()` (which may generate XPath internally) and XPath-based `query()` on `ShadowRoot`:

| Method | Inside Shadow Root | Notes |
|--------|:--:|---|
| `query('css-selector')` | Supported | The only supported approach |
| `find(...)` | Not supported | Raises `NotImplementedError` |
| `query('//xpath')` | Not supported | Raises `NotImplementedError` |

```python
shadow = await host.get_shadow_root()

# Supported: query() with CSS selectors
button = await shadow.query('button.submit')
email = await shadow.query('#email-input')
items = await shadow.query('.item', find_all=True)

# Not supported: find() and XPath raise NotImplementedError
# shadow.find(id='email-input')       # NotImplementedError
# shadow.query('.//button')            # NotImplementedError
```

### XPath Cannot Cross Shadow Boundaries

XPath expressions from the document root cannot traverse shadow boundaries. This is a fundamental limitation of XPath, which was designed before Shadow DOM existed:

```python
# Won't find shadow content: document-level XPath cannot cross the boundary
element = await tab.find(xpath='//div[@id="host"]//button')
```

### User-Agent Shadow Roots

Browser-internal shadow roots (e.g., `<input>` placeholder styling, `<video>` controls) are of type `user-agent`. These are accessible via CDP but their internal structure varies across browser versions and is not part of any web standard.

```python
input_element = await tab.find(tag_name='input')
try:
    ua_shadow = await input_element.get_shadow_root()
    # ua_shadow.mode == ShadowRootType.USER_AGENT
    # Internal structure is browser-specific
except ShadowRootNotFound:
    pass  # Not all inputs have user-agent shadow roots
```

!!! warning "User-Agent Shadow Root Stability"
    Do not build automation logic that depends on the internal structure of user-agent shadow roots. Their DOM structure is an implementation detail that can change between browser versions without notice.

### Stale Shadow Root References

If the host element is removed from the DOM and re-added (common in single-page applications), the shadow root's `objectId` becomes stale. The solution is to re-acquire the shadow root:

```python
# After a page navigation or DOM rebuild:
host = await tab.find(id='my-component', timeout=5)  # Re-find the host
shadow = await host.get_shadow_root()                 # Fresh shadow root
```

## Key Takeaways

- **Shadow DOM encapsulation** hides elements from document-level `querySelector()`, breaking traditional automation
- **CDP operates below the JavaScript API layer**, bypassing shadow mode restrictions entirely
- **`backendNodeId`** is the stable identifier used for shadow root resolution, avoiding the need to enable the DOM domain
- **`ShadowRoot` inherits `FindElementsMixin`**, gaining `query()` with CSS selectors through the `_object_id` mechanism (`find()` and XPath are blocked)
- **Closed shadow roots** are fully accessible because the `closed` mode is a JavaScript-level policy, not a DOM-level restriction
- **Nested shadow roots** work naturally by chaining `get_shadow_root()` calls at each level
- **Shadow roots inside iframes** work transparently through automatic iframe context propagation
- **Use `query()` with CSS selectors** inside shadow roots; `find()` and XPath raise `NotImplementedError`
- **`find_shadow_roots()`** discovers all shadow roots on the page; supports `timeout` for polling and `deep=True` for cross-origin iframes (OOPIFs)
- **`get_shadow_root(timeout)`** waits for a shadow root to appear on a specific element

## Related Documentation

- **[Element Finding Guide](../../features/element-finding.md)**: Practical usage of `find()`, `query()`, and shadow root access
- **[IFrames & Contexts](../fundamentals/iframes-and-contexts.md)**: How Pydoll resolves and routes commands to iframes, including OOPIF handling
- **[FindElements Mixin Architecture](./find-elements-mixin.md)**: How the `_object_id` mechanism enables scoped searches
- **[WebElement Domain](./webelement-domain.md)**: How elements interact with CDP
- **[Connection Layer](../fundamentals/connection-layer.md)**: WebSocket communication with the browser


================================================
FILE: docs/en/deep-dive/architecture/tab-domain.md
================================================
# Tab Domain Architecture

The Tab domain is Pydoll's primary interface for browser automation, acting as an orchestration layer that integrates multiple CDP domains into a cohesive API. This document explores its internal architecture, design patterns, and the engineering decisions that shape its behavior.

!!! info "Practical Usage"
    For usage examples and practical patterns, see the [Tab Management Guide](../../features/automation/tabs.md).

## Architectural Overview

The `Tab` class serves as a **façade** over Chrome DevTools Protocol, abstracting the complexity of multi-domain coordination into a unified interface.

### Component Structure

| Component | Relationship | Purpose |
|-----------|-------------|---------|
| **Tab** | Core class | Primary automation interface |
| ↳ **ConnectionHandler** | Composition (owned) | WebSocket communication with CDP |
| ↳ **Browser** | Reference (parent) | Access to browser-level state and configuration |
| ↳ **FindElementsMixin** | Inheritance | Element location capabilities |
| ↳ **WebElement** | Factory (creates) | Individual DOM element representations |

### CDP Domain Integration

The `ConnectionHandler` routes Tab operations to multiple CDP domains:

```
Tab Methods                CDP Domain          Purpose
━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━
go_to(), refresh()     →   Page            →  Navigation & lifecycle
execute_script()       →   Runtime         →  JavaScript execution
find(), query()        →   Runtime/DOM     →  Element location
get_cookies()          →   Storage         →  Session state
enable_network_events()→   Network         →  Traffic monitoring
enable_fetch_events()  →   Fetch           →  Request interception
```

### Core Responsibilities

1. **CDP Command Routing**: Translates high-level operations into domain-specific CDP commands
2. **State Management**: Tracks enabled domains, active callbacks, and session state
3. **Event Coordination**: Bridges CDP events to user-defined callbacks
4. **Element Factory**: Creates `WebElement` instances from CDP `objectId` strings
5. **Lifecycle Management**: Handles cleanup and resource deallocation

## Composition vs Inheritance: The FindElementsMixin

A key architectural decision in the Tab domain is **inheriting from `FindElementsMixin`** rather than using composition:

```python
class Tab(FindElementsMixin):
    def __init__(self, ...):
        self._connection_handler = ConnectionHandler(...)
        # Mixin methods now available on Tab
```

**Why inheritance here?**

| Approach | Pros | Cons | Pydoll's Choice |
|----------|------|------|-----------------|
| **Inheritance** | Clean API (`tab.find()`), type compatibility | Tight coupling | Used |
| Composition | Loose coupling, flexible | Verbose (`tab.finder.find()`), wrapper overhead | Not used |

**Rationale:** The mixin pattern is justified because:

- Element finding is **core to Tab identity** (every tab can find elements)
- The mixin is **stateless** - it only requires `_connection_handler` (dependency injection via duck typing)
- API ergonomics matter - `tab.find()` is more intuitive than `tab.elements.find()`

See [FindElements Mixin Deep Dive](./find-elements-mixin.md) for architectural details.

## State Management Architecture

The Tab class manages **multiple layers of state**:

### 1. Domain Enablement Flags

```python
class Tab:
    def __init__(self, ...):
        self._page_events_enabled = False
        self._network_events_enabled = False
        self._fetch_events_enabled = False
        self._dom_events_enabled = False
        self._runtime_events_enabled = False
        self._intercept_file_chooser_dialog_enabled = False
```

**Why explicit flags?**

- **Idempotency**: Calling `enable_page_events()` twice doesn't double-register
- **State inspection**: Properties like `tab.page_events_enabled` expose current state
- **Cleanup tracking**: Know which domains need disabling on tab close

**Alternative (not used):** Query CDP for enabled domains on each check → Too slow, adds latency.

### 2. Target Identity

```python
self._target_id: str              # Unique CDP identifier
self._browser_context_id: Optional[str]  # Isolation context
self._connection_port: int        # WebSocket port
```

**Design decision:** `target_id` is the **primary identifier**, not the Tab instance itself. This enables:

- **Browser-level Tab registry**: `Browser._tabs_opened[target_id] = tab`
- **Singleton pattern**: Same `target_id` always returns same `Tab` instance
- **Connection reuse**: Multiple operations on same tab share WebSocket

### 3. Feature-Specific State

```python
self._cloudflare_captcha_callback_id: Optional[int] = None  # For cleanup
self._request: Optional[Request] = None  # Lazy initialization
```

**Lazy initialization pattern:** `Request` is only created when `tab.request` is accessed:

```python
@property
def request(self) -> Request:
    if self._request is None:
        self._request = Request(self)
    return self._request
```

**Why lazy?** Most automations don't use browser-context HTTP requests. Saves memory and initialization time.


## JavaScript Execution: Dual Context Architecture

The `execute_script()` method implements **context polymorphism** - same interface, different CDP commands:

| Context | CDP Method | Use Case |
|---------|-----------|----------|
| Global (no element) | `Runtime.evaluate` | `document.title`, global scripts |
| Element-bound | `Runtime.callFunctionOn` | Element-specific operations |

**Key architectural decision:** Auto-detect execution mode based on `element` parameter presence, eliminating separate APIs (`evaluate()` vs `call_function_on()`).

**Script transformation pipeline:**

1. Replace `argument` → `this` (Selenium compatibility)
2. Detect if script is already wrapped in `function() { }`
3. Wrap if needed: `script` → `function() { script }`
4. Route to appropriate CDP command

**Why `argument` keyword?** Migration path for Selenium users, API familiarity.

!!! info "Practical Usage"
    See [Human-Like Interactions](../../features/automation/human-interactions.md) for real-world script execution patterns.

## Event System Integration

The Tab acts as a **thin wrapper** over ConnectionHandler's event system, but adds an important layer: **non-blocking callback execution**.

```python
async def on(self, event_name: str, callback: Callable, temporary: bool = False) -> int:
    # Wrap async callbacks to execute in background
    async def callback_wrapper(event):
        asyncio.create_task(callback(event))
    
    if asyncio.iscoroutinefunction(callback):
        function_to_register = callback_wrapper  # Non-blocking wrapper
    else:
        function_to_register = callback  # Sync callbacks execute directly
    
    # Delegate registration to ConnectionHandler
    return await self._connection_handler.register_callback(
        event_name, function_to_register, temporary
    )
```

**Architectural role:** Tab provides tab-scoped event registration with non-blocking execution semantics, while ConnectionHandler handles WebSocket plumbing and sequential callback invocation.

**Key features:**

- **Background execution** via `asyncio.create_task()` for async callbacks (fire-and-forget)
- **Sync/async callback auto-detection**
- **Temporary callbacks** for one-shot handlers
- **Callback ID** for explicit removal

**Execution model:**

| Layer | Behavior | Purpose |
|-------|----------|---------|
| **User callback** | Runs in background task | Never blocks other callbacks or CDP commands |
| **Tab wrapper** | `create_task(callback())` | Launches background task, returns immediately |
| **EventsManager** | `await wrapper()` | Sequentially invokes wrappers for the same event |

**Why the wrapper?** Without it, a slow async callback would block other callbacks for the same event. The `create_task` wrapper ensures all callbacks start "simultaneously" (in separate tasks), preventing one slow callback from delaying others.

!!! info "Detailed Architecture"
    See [Event Architecture Deep Dive](./event-architecture.md) for internal event routing mechanisms and EventsManager's sequential invocation pattern.
    
    **Practical usage:** [Event System Guide](../../features/advanced/event-system.md)

## Session State: Cookie Management

**Architectural separation:** Cookies route to **Storage domain** (manipulation), not Network domain (observation).

```python
async def set_cookies(self, cookies: list[CookieParam]):
    return await self._execute_command(
        StorageCommands.set_cookies(cookies, self._browser_context_id)
    )
```

**Context-aware design:** `browser_context_id` parameter ensures cookie isolation, enabling multi-account automation.

!!! info "Practical Cookie Management"
    See [Cookies & Sessions Guide](../../features/browser-management/cookies-sessions.md) for usage patterns and anti-detection strategies.

## Content Capture: CDP Target Restrictions

**Critical limitation:** `Page.captureScreenshot` only works on **top-level targets**. Iframe tabs fail silently (no `data` field in response).

```python
try:
    screenshot_data = response['result']['data']
except KeyError:
    raise TopLevelTargetRequired(...)  # Guide users to WebElement.take_screenshot()
```

**Design implication:** Historically, Pydoll created dedicated Tab instances for iframes. The new model keeps iframe interaction inside `WebElement`, so screenshots and other helpers should target elements within the frame (for example, `await (await iframe_element.find(...)).take_screenshot()`; note that the element lookup must be awaited before calling a method on its result).

**PDF Generation:** `Page.printToPDF` returns base64-encoded data. Pydoll abstracts file I/O, but underlying data is always base64 (CDP spec).

!!! info "Practical Usage"
    See [Screenshots & PDFs Guide](../../features/automation/screenshots-and-pdfs.md) for parameters, formats, and real-world examples.

## Network Monitoring: Stateful Design

**Architectural principle:** Network methods require **enabled state** - runtime checks prevent accessing nonexistent data.

**Storage separation:**

- **Logs**: Buffered in `ConnectionHandler` (receives all CDP events)
- **Tab**: Queries handler, no duplicate storage
- **Response bodies**: Retrieved on-demand via `Network.getResponseBody(requestId)`

**Critical timing constraint:** Response bodies must be fetched **within ~30s** after response (browser garbage collection).

!!! info "Network Monitoring in Practice"
    See [Network Monitoring Guide](../../features/network/monitoring.md) for comprehensive event tracking and analysis patterns.
    
    **Request interception:** [Request Interception Guide](../../features/network/interception.md)

## Dialog Management: Event Capture Pattern

**Critical CDP behavior:** JavaScript dialogs **block all CDP commands** until handled.

**Architectural solution:** `ConnectionHandler` captures `Page.javascriptDialogOpening` events immediately, preventing automation hangs.

```python
# Handler stores dialog event before user code runs
self._connection_handler.dialog  # Captured by handler
# Tab queries stored event
async def has_dialog(self) -> bool:
    return bool(self._connection_handler.dialog)
```

**Why this design?** Event fires before user callbacks execute. Without immediate capture, automation would deadlock waiting for blocked CDP responses.

## IFrame Architecture: Tab Reuse Pattern

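**Key insight:** IFrames are **first-class CDP targets** → Represented as `Tab` instances.

!!! note "Legacy model"
    This section describes the original Tab-per-iframe design. As noted under *Content Capture* above, the newer model keeps iframe interaction inside `WebElement`; read the algorithm below as background on how iframe targets are resolved rather than as the recommended usage pattern.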

**Target resolution algorithm:**

1. Extract `src` attribute from iframe element
2. Query all CDP targets via `Target.getTargets()`
3. Match iframe URL to target `targetId`
4. Check singleton registry (`Browser._tabs_opened`)
5. Return existing instance or create + register new Tab

**Design tradeoff:** IFrame tabs inherit all Tab methods, but some fail (e.g., `take_screenshot()`). Alternative (dedicated `IFrame` class) would duplicate 90% of API for minimal benefit.

!!! info "Working with IFrames"
    See [IFrame Interaction Guide](../../features/automation/iframes.md) for practical patterns, nested frames, and common pitfalls.

## Context Managers: Automatic Resource Cleanup

**Architectural pattern:** State restoration + optimistic resource acquisition.

### Key Context Managers

| Manager | Pattern | Key Feature |
|---------|---------|-------------|
| `expect_file_chooser()` | State restoration | Restores domain enablement after exit |
| `expect_download()` | Temporary resources | Auto-cleanup temp directories |

**File Chooser Design:**

- Enable required domains (`Page`, file chooser interception)
- Register **temporary callback** (auto-removes after first fire)
- Restore original state on exit (if domains were disabled before, disable again)

**Download Handling Design:**

- Create temporary directory (or use provided path)
- Use `asyncio.Future` for coordination (`will_begin_future`, `done_future`)
- Browser-level configuration (downloads are per-context, not per-tab)
- Guaranteed cleanup via `finally` block

!!! info "Practical File Operations"
    See [File Operations Guide](../../features/automation/file-operations.md) for upload patterns, file chooser usage, and download handling.

## Lifecycle: Tab Closure and Invalidation

**Tab closure cascade:**

1. CDP closes browser tab (`Page.close`)
2. Tab unregisters from `Browser._tabs_opened`
3. WebSocket auto-closes (CDP target destroyed)
4. Event callbacks garbage-collected

**Post-closure behavior:** Tab instance becomes **invalid** - further operations fail (closed WebSocket).

**Design decision:** No explicit `_closed` flag. Users manage lifecycle. Alternative (state tracking) adds overhead for marginal safety benefit.

## Key Architectural Decisions

### Per-Tab WebSocket Strategy

**Chosen design:** Each Tab creates its own ConnectionHandler with a dedicated WebSocket connection to `ws://localhost:port/devtools/page/{targetId}`.

**Rationale:**

CDP supports **two connection models**:

1. **Browser-level**: Single connection to `ws://localhost:port/devtools/browser/...` (used by Browser instance)
2. **Tab-level**: Per-tab connections to `ws://localhost:port/devtools/page/{targetId}` (used by Tab instances)

Pydoll uses **both**:

- **Browser** has its own ConnectionHandler for browser-wide operations (contexts, downloads, browser-level events)
- **Each Tab** has its own ConnectionHandler for tab-specific operations (navigation, element finding, tab events)

**Benefits of per-tab WebSockets:**

- **True parallelism**: Multiple tabs can execute CDP commands simultaneously without waiting
- **Independent event streams**: Each tab receives only its own events (no filtering needed)
- **Isolated failures**: Connection issues in one tab don't affect others
- **Simplified routing**: No need to demultiplex messages by targetId

**Tradeoff:** More open connections (one per tab), but CDP and browsers handle this efficiently. For 10 tabs, this is 11 connections total (1 browser + 10 tabs), which is negligible compared to the HTTP connections the tabs themselves create.

!!! info "Browser vs Tab Communication"
    See [Browser Domain Architecture](./browser-domain.md) for details on the browser-level ConnectionHandler and how Browser/Tab coordination works.

### Browser Reference Necessity

**Why Tab stores `_browser` reference:**

- Context queries (`browser_context_id` for cookies)
- Browser-level operations (download behavior, iframe registry)
- Configuration access (`browser.options.page_load_state`)

### API Design Choices

| Choice | Rationale |
|--------|-----------|
| **Async properties** (`current_url`, `page_source`) | Signal live data + CDP cost |
| **Separate `enable`/`disable` methods** | Explicit over implicit, matches CDP naming |
| **No `_closed` flag** | Users manage lifecycle, reduces overhead |
| **`argument` keyword in scripts** | Selenium compatibility, migration path |

## Relationship to Other Domains

The Tab domain sits at the **center** of Pydoll's architecture:

```mermaid
graph TD
    Browser[Browser Domain<br/>Lifecycle & Process] -->|creates| Tab[Tab Domain<br/>Automation Interface]
    Tab -->|uses| ConnectionHandler[ConnectionHandler<br/>CDP Communication]
    Tab -->|creates| WebElement[WebElement Domain<br/>Element Interaction]
    Tab -->|inherits| FindMixin[FindElementsMixin<br/>Locator Strategies]
    Tab -->|uses| Commands[CDP Commands<br/>Typed Protocol]
    
    ConnectionHandler -->|dispatches| Events[Event System]
    Tab -.->|references| Browser
    WebElement -.->|references| ConnectionHandler
```

**Key relationships:**

1. **Browser → Tab**: Parent-child. Browser manages Tab lifecycle and shared state.
2. **Tab → ConnectionHandler**: Composition. Tab delegates CDP communication.
3. **Tab → WebElement**: Factory. Tab creates elements from `objectId` strings.
4. **Tab ← FindElementsMixin**: Inheritance. Tab gains element location methods.
5. **Tab ↔ Browser**: Bidirectional reference. Tab queries browser for context info.

## Summary: Design Philosophy

The Tab domain prioritizes **API ergonomics** and **correctness** over micro-optimizations:

- **Façade pattern** abstracts CDP complexity
- **State management** via explicit flags prevents double-enabling
- **Resource management** through context managers
- **Event coordination** with background execution (non-blocking)

**Core tradeoffs:**

| Decision | Benefit | Cost | Verdict |
|----------|---------|------|---------|
| Per-tab WebSocket | True parallelism | More connections | Justified |
| Inherit FindElementsMixin | Clean API | Tight coupling | Justified |
| Lazy Request init | Memory efficiency | Property overhead | Justified |

## Further Reading

**Practical guides:**

- [Tab Management](../../features/automation/tabs.md) - Multi-tab patterns, lifecycle, concurrency
- [Element Finding](../../features/element-finding.md) - Selectors and DOM traversal
- [Event System](../../features/advanced/event-system.md) - Real-time browser monitoring

**Architectural deep-dives:**

- [Event Architecture](./event-architecture.md) - WebSocket plumbing and event routing
- [FindElements Mixin](./find-elements-mixin.md) - Selector resolution algorithms
- [Browser Domain](./browser-domain.md) - Process management and contexts


================================================
FILE: docs/en/deep-dive/architecture/webelement-domain.md
================================================
# WebElement Domain Architecture

The WebElement domain bridges high-level automation code and low-level DOM interaction through Chrome DevTools Protocol. This document explores its internal architecture, design patterns, and engineering decisions.

!!! info "Practical Usage"
    For usage examples and interaction patterns, see:
    
    - [Element Finding Guide](../../features/element-finding.md)
    - [Human-Like Interactions](../../features/automation/human-interactions.md)
    - [File Operations](../../features/automation/file-operations.md)

## Architectural Overview

WebElement represents a **remote object reference** to a DOM element via CDP's `objectId` mechanism:

```
User Code → WebElement → ConnectionHandler → CDP Runtime → Browser DOM
```

**Key characteristics:**

- **Async by design**: All operations follow Python's async/await pattern
- **Remote reference**: Maintains CDP `objectId` for browser-side element
- **Mixin inheritance**: Inherits `FindElementsMixin` for child element searches
- **Hybrid state**: Combines cached attributes with live DOM queries

### Core State

```python
class WebElement(FindElementsMixin):
    def __init__(self, object_id: str, connection_handler: ConnectionHandler, ...):
        self._object_id = object_id              # CDP remote object reference
        self._connection_handler = connection_handler  # WebSocket communication
        self._attributes: dict[str, str] = {}    # Cached HTML attributes
        self._search_method = method             # How element was found (debug)
        self._selector = selector                # Original selector (debug)
```

**Why cache attributes?** Initial element location returns HTML attributes. Caching provides fast, synchronous access to common properties (`id`, `class_name`, `tag_name`) without additional CDP calls.

## Design Patterns

### 1. Command Pattern

All element interactions translate to CDP commands:

| User Operation | CDP Domain | Command |
|----------------|-----------|---------|
| `element.click()` | Input | `Input.dispatchMouseEvent` |
| `element.text` | Runtime | `Runtime.callFunctionOn` |
| `element.bounds` | DOM | `DOM.getBoxModel` |
| `element.take_screenshot()` | Page | `Page.captureScreenshot` |

### 2. Bridge Pattern

WebElement abstracts CDP protocol complexity:

```python
async def click(self, x_offset=0, y_offset=0, hold_time=0.1):
    # High-level API
    
    # → Translates to low-level CDP commands:
    # 1. DOM.getBoxModel (get position)
    # 2. Input.dispatchMouseEvent (press)
    # 3. Input.dispatchMouseEvent (release)
```

### 3. Mixin Inheritance for Child Searches

**Why inherit FindElementsMixin?** Enables element-relative searches:

```python
form = await tab.find(id='login-form')
username = await form.find(name='username')  # Search within form
```

**Design decision:** Composition (`form.finder.find()`) would be more flexible but less ergonomic. Inheritance chosen for API simplicity.

## Hybrid Property System

**Architectural innovation:** WebElement combines sync and async property access.

### Synchronous Properties (Cached Attributes)

```python
@property
def id(self) -> str:
    return self._attributes.get('id')  # From cached HTML attributes

@property  
def class_name(self) -> str:
    return self._attributes.get('class_name')  # 'class' → 'class_name' (Python keyword)
```

**Source:** Flat list from CDP element location response, parsed during `__init__`.

### Asynchronous Properties (Live DOM State)

```python
@property
async def text(self) -> str:
    outer_html = await self.inner_html  # CDP call
    soup = BeautifulSoup(outer_html, 'html.parser')
    return soup.get_text(strip=True)

@property
async def bounds(self) -> dict:
    response = await self._execute_command(DomCommands.get_box_model(self._object_id))
    # Parse and return bounds
```

**Rationale:** Text and bounds are **dynamic** - they change as the page updates. Attributes are **static** - captured at location time.

| Property Type | Access | Source | Use Case |
|--------------|--------|--------|----------|
| Sync | `element.id` | Cached attributes | Fast access, static data |
| Async | `await element.text` | Live CDP query | Current state, dynamic data |

## Click Implementation: Multi-Stage Pipeline

Click operations follow a sophisticated pipeline to ensure reliability:

### 1. Special Element Detection

```python
async def click(self, x_offset=0, y_offset=0, hold_time=0.1):
    # Stage 1: Handle special elements
    if self._is_option_tag():
        return await self.click_option_tag()  # <option> needs JavaScript select
```

**Why special handling?** `<option>` elements inside `<select>` don't respond to mouse events. Selecting one requires setting `selected = true` via JavaScript.

### 2. Visibility Check

```python
    # Stage 2: Verify element is visible
    if not await self.is_visible():
        raise ElementNotVisible()
```

**Why check?** CDP mouse events target coordinates. Hidden elements would receive clicks at wrong positions or fail silently.

### 3. Position Calculation

```python
    # Stage 3: Scroll into view and get position
    await self.scroll_into_view()
    bounds = await self.bounds
    
    # Stage 4: Calculate click coordinates
    position_to_click = (
        bounds['x'] + bounds['width'] / 2 + x_offset,
        bounds['y'] + bounds['height'] / 2 + y_offset,
    )
```

**Offset support:** Enables varied click positions for human-like behavior (anti-detection).

### 4. Mouse Event Dispatch

```python
    # Stage 5: Send CDP mouse events
    await self._execute_command(InputCommands.mouse_press(*position_to_click))
    await asyncio.sleep(hold_time)  # Configurable hold (default 0.1s)
    await self._execute_command(InputCommands.mouse_release(*position_to_click))
```

**Why two commands?** Simulates real mouse behavior (press → hold → release). Some sites detect instant clicks as bots.

### Click Fallback: JavaScript Alternative

```python
async def click_using_js(self):
    """Fallback for elements that can't be clicked via mouse events."""
    await self.execute_script('this.click()')
```

**When to use:**

- Hidden elements (e.g., file inputs styled with CSS)
- Elements behind overlays
- Performance-critical scenarios (skips visibility/position checks)

!!! info "Mouse vs JavaScript Clicks"
    See [Human-Like Interactions](../features/automation/human-interactions.md) for when to use each approach and detection implications.

## Screenshot Architecture: Clip Regions

**Key mechanism:** `Page.captureScreenshot` with `clip` parameter.

```python
async def take_screenshot(self, path: str, quality: int = 100):
    # 1. Get element bounds (position + dimensions)
    bounds = await self.get_bounds_using_js()
    
    # 2. Create clip region
    clip = Viewport(x=bounds['x'], y=bounds['y'], 
                    width=bounds['width'], height=bounds['height'], scale=1)
    
    # 3. Capture only clipped region
    screenshot = await self._execute_command(
        PageCommands.capture_screenshot(format=ScreenshotFormat.JPEG, clip=clip, quality=quality)
    )
```

**Why JavaScript bounds?** `DOM.getBoxModel` can fail for certain elements. JavaScript `getBoundingClientRect()` is a more reliable fallback.

**Format limitation:** Element screenshots always use JPEG (CDP restriction with clip regions).

!!! info "Screenshot Capabilities"
    See [Screenshots & PDFs](../features/automation/screenshots-and-pdfs.md) for full-page vs element screenshots comparison.

## JavaScript Execution Context

**Critical CDP feature:** `Runtime.callFunctionOn(objectId, ...)` executes JavaScript **in element context** (`this` = element).

```python
async def execute_script(self, script: str, return_by_value=False):
    return await self._execute_command(
        RuntimeCommands.call_function_on(self._object_id, script, return_by_value)
    )
```

**Use cases:**

- Visibility checks: `await element.is_visible()` → JavaScript checks computed styles
- Style manipulation: `await element.execute_script("this.style.border = '2px solid red'")`
- Attribute access: Some properties require JavaScript (e.g., `value` for inputs)

**Alternative (not used):** Execute global script with element selector → Slower, risks stale references.

## State Verification Pipeline

**Reliability strategy:** Pre-check element state before interactions to prevent failures.

| Check | Purpose | Implementation |
|-------|---------|----------------|
| `is_visible()` | Element in viewport, not hidden | JavaScript: `offsetWidth > 0 && offsetHeight > 0` |
| `is_on_top()` | No overlays blocking element | JavaScript: `document.elementFromPoint(x, y) === this` |
| `is_interactable()` | Visible + on top | Combines both checks |

**Why JavaScript for visibility?** CSS `display: none`, `visibility: hidden`, `opacity: 0` all affect visibility differently. JavaScript provides unified check.

## Performance Strategies

### 1. Operation-Specific Optimization

**Principle:** Choose the fastest approach for each operation type.

| Operation | Primary Approach | Rationale |
|-----------|-----------------|-----------|
| Text extraction | BeautifulSoup parsing | More accurate than JavaScript `innerText` |
| Visibility check | JavaScript | Single CDP call vs multiple DOM queries |
| Click | CDP mouse events | Most realistic, required for anti-detection |
| Bounds | `DOM.getBoxModel` | Faster than JavaScript, with JS fallback |

### 2. Local Computation

**Minimize CDP round-trips** by computing locally when possible:

```python
# Good: Single bounds query, local calculation
bounds = await element.bounds
click_x = bounds['x'] + bounds['width'] / 2 + offset_x
click_y = bounds['y'] + bounds['height'] / 2 + offset_y

# Bad: Multiple CDP calls for simple math
click_x = await element.execute_script('return this.offsetLeft + this.offsetWidth / 2')
click_y = await element.execute_script('return this.offsetTop + this.offsetHeight / 2')
```

### 3. Cached Attributes

**Design decision:** Cache static attributes at creation time:

```python
# Fast synchronous access (no CDP call)
element_id = element.id
element_class = element.class_name
```

**Tradeoff:** Attributes won't reflect runtime changes. For dynamic properties, use async: `await element.text`.

## Key Architectural Decisions

| Decision | Rationale |
|----------|-----------|
| **Inherit FindElementsMixin** | Enables child searches, maintains API consistency |
| **Hybrid sync/async properties** | Balances performance (sync) with freshness (async) |
| **JavaScript fallbacks** | Reliability over performance for critical operations |
| **Special element detection** | `<option>`, `<input type="file">` require unique handling |
| **Pre-click visibility checks** | Fail fast with clear errors vs silent failures |

## Summary

The WebElement domain bridges Python automation code and browser DOM through:

- **Remote object references** via CDP `objectId`
- **Hybrid property system** balancing sync attributes and async state
- **Multi-stage interaction pipelines** ensuring reliability
- **Specialized handling** for element type variations

**Core tradeoffs:**

| Decision | Benefit | Cost | Verdict |
|----------|---------|------|---------|
| Mixin inheritance | Clean API | Tight coupling | Justified |
| Cached attributes | Fast sync access | Stale data risk | Justified |
| JavaScript fallbacks | Reliability | Performance hit | Justified |
| Visibility pre-checks | Clear errors | Extra CDP calls | Justified |

## Further Reading

**Practical guides:**

- [Element Finding](../features/element-finding.md) - Locating elements, selectors
- [Human-Like Interactions](../features/automation/human-interactions.md) - Clicking, typing, realism
- [File Operations](../features/automation/file-operations.md) - File uploads and downloads

**Architectural deep-dives:**

- [FindElements Mixin](./find-elements-mixin.md) - Selector resolution pipeline
- [Tab Domain](./tab-domain.md) - Tab as element factory
- [Connection Layer](./connection-layer.md) - WebSocket communication 

================================================
FILE: docs/en/deep-dive/fingerprinting/behavioral-fingerprinting.md
================================================
# Behavioral Fingerprinting

Behavioral fingerprinting analyzes how users interact with web applications rather than what tools they use. While network and browser fingerprints can be spoofed by setting the right values, human behavior follows biomechanical patterns that are difficult to replicate convincingly. Detection systems collect mouse movements, keystroke timing, scroll behavior, and interaction sequences, then use statistical models to distinguish humans from automation.

This document covers the detection techniques, the science behind them, and how Pydoll's humanization features address each vector.

!!! info "Module Navigation"
    - [Network Fingerprinting](./network-fingerprinting.md): TCP/IP, TLS, HTTP/2 protocol fingerprinting
    - [Browser Fingerprinting](./browser-fingerprinting.md): Canvas, WebGL, navigator properties
    - [Evasion Techniques](./evasion-techniques.md): Practical countermeasures

## Mouse Movement Analysis

Mouse movement is one of the most powerful behavioral indicators because human motor control follows biomechanical laws that simple automation cannot replicate. Detection systems collect `mousemove` events (each containing x, y coordinates and a timestamp) and analyze the trajectory for properties that distinguish organic movement from programmatic cursor teleportation.

### Fitts's Law

Fitts's Law describes the time required to move a pointer to a target. The Shannon formulation (MacKenzie, 1992), which is the most widely used version, states:

```
T = a + b * log2(D/W + 1)
```

Where `T` is the movement time, `a` is a constant representing reaction/start time, `b` is a constant representing the inherent speed of the input device, `D` is the distance to the target, and `W` is the width (size) of the target. The logarithmic relationship means that, when the distance is large relative to the target width, doubling the distance adds a roughly fixed amount of time, while halving the target size adds approximately the same amount.

The implications for bot detection are significant. Humans take longer to reach small, distant targets and reach large, nearby targets quickly. They accelerate at the start of a movement, reach peak velocity roughly mid-path, and decelerate as they approach the target. Bots that move the cursor in constant time regardless of distance and target size violate Fitts's Law and are trivially detectable.

Detection systems measure the movement time for each click event, compute the expected time from the distance and target size, and flag movements that are significantly faster than Fitts's Law predicts or that show no correlation between distance/size and movement time.

### Trajectory Shape

Human hand movements between two points are not straight lines. Research by Abend, Bizzi, and Morasso (1982) showed that hand paths are typically curved due to biomechanical constraints of the arm's joints and muscles. Flash and Hogan (1985) demonstrated that human reaching movements follow minimum-jerk trajectories, where the trajectory minimizes the integral of squared jerk (the derivative of acceleration) over the movement duration. The resulting position is described by a quintic (5th degree) polynomial, whose derivative gives a bell-shaped velocity profile:

```
x(t) = x0 + (xf - x0) * (10t^3 - 15t^4 + 6t^5)
```

where `t` is normalized time from 0 to 1, and `x0`/`xf` are the start and end positions. This produces smooth acceleration from rest, peak velocity at approximately mid-path, and smooth deceleration back to rest.

Detection systems analyze trajectory curvature, velocity profiles, and acceleration patterns. The specific signals they look for include:

**Straight-line detection.** A perfectly straight path between two points (zero curvature at every sample) is the most obvious bot signal. Human paths always have some curvature due to the arm's rotational joints.

**Constant velocity.** Humans show a bell-shaped velocity profile (accelerate, peak, decelerate). A constant velocity throughout the movement indicates linear interpolation, which is the default behavior of most automation tools.

**Absence of sub-movements.** Long movements are composed of multiple overlapping sub-movements (Meyer et al., 1988), each with its own velocity peak. A movement covering 500+ pixels with a single smooth velocity peak is suspicious; real movements of that distance typically show 2-4 velocity peaks.

**No overshoot.** Humans frequently overshoot the target slightly (by 5-15 pixels) and make a small correction back. Perfectly precise movements that land exactly on target every time are statistically improbable.

### Movement Entropy

Entropy, in this context, measures the unpredictability of the mouse path. Detection systems divide the trajectory into segments, measure the direction change at each point, and compute Shannon entropy over the distribution of direction changes. A straight line has zero entropy (every segment points the same direction). A random walk has maximum entropy. Human movement has moderate-to-high entropy, reflecting the combination of intentional direction and involuntary variability.

Low entropy across many mouse movements in a session is a strong bot signal, even if individual movements have plausible curvature.

### Pydoll's Mouse Humanization

Pydoll implements comprehensive mouse humanization through the `humanize=True` parameter on click operations. When enabled, the mouse module generates movements that address each of the detection vectors described above:

The path follows a cubic Bezier curve with randomized control points, producing natural curvature rather than straight lines. Progress along the path follows a minimum-jerk profile (`10t^3 - 15t^4 + 6t^5`), producing the bell-shaped velocity curve characteristic of human reaching movements. Movement duration is calculated using Fitts's Law with configurable constants (`a=0.070`, `b=0.150` by default).

Physiological tremor is simulated by adding Gaussian noise to cursor positions, with amplitude scaled inversely to velocity (tremor is more visible when the hand moves slowly, which matches real physiology). Overshoot occurs with 70% probability, overshooting the target by 3-12% of the total distance before making a correction movement. Micro-pauses (15-40ms) occur with 3% probability during the movement, simulating brief hesitations.

```python
# Basic humanized click
await element.click(humanize=True)

# The Mouse class can also be used directly for more control
from pydoll.interactions.mouse import Mouse

mouse = Mouse(connection_handler)
await mouse.click(500, 300, humanize=True)
```

!!! note "What Pydoll Does Not Do"
    Pydoll's mouse humanization does not currently model sub-movements for very long distances (the path is a single Bezier segment). For most web interactions, where distances are under 500 pixels, this is sufficient. Extremely long movements (full-screen diagonal traversals) may benefit from future multi-segment support.

## Keystroke Dynamics

Keystroke dynamics analyzes the timing patterns of keyboard input. The technique dates back to telegraph operators in the 1850s, who could identify each other by their Morse code "fist" (characteristic timing pattern). Modern systems measure timing at millisecond precision through `keydown` and `keyup` events.

### Timing Features

The two fundamental measurements are dwell time (the duration between `keydown` and `keyup` for a single key, typically 50-200ms for humans) and flight time (the duration between releasing one key and pressing the next, typically 80-400ms). The combination of dwell and flight times for consecutive key pairs is called a digraph latency.

Digraph latencies are not uniform. They depend on the specific key pair (bigram) being typed, because typing is a motor skill where common sequences are stored as procedural memory. The key biomechanical factors are:

**Hand alternation.** Bigrams typed with alternating hands (like "th", where "t" is left hand and "h" is right hand on QWERTY) are generally faster than same-hand bigrams (like "de", where both keys are on the left hand). The alternating hand can begin its movement while the first hand is still completing its keystroke.

**Finger distance.** Home-row to home-row transitions are fastest. Reaching to the top or bottom row adds time proportional to the physical distance the finger must travel.

**Finger independence.** Ring finger and pinky combinations on the same hand are slower than index and middle finger combinations, because the ring and pinky fingers share tendons and have less independent motor control.

**Frequency effects.** Frequently typed bigrams (like "th", "er", "in" in English) are executed faster due to motor memory, regardless of their physical layout.

### Detection Signals

Detection systems look for several signals that distinguish human typing from automation:

**Zero or constant dwell time.** Many automation tools dispatch `keydown` and `keyup` events with zero or near-zero delay between them (under 5ms). Real key presses have measurable dwell times. Constant dwell time across all keys is equally suspicious.

**Uniform flight time.** Setting a fixed interval between keystrokes (such as `type_text("hello", interval=0.1)`) produces perfectly regular timing that is trivially detectable. Human flight times vary by bigram, fatigue, and cognitive load.

**No typing errors.** In extended text input (50+ characters), the complete absence of backspace or delete presses is unusual. Humans make mistakes at a rate of roughly 1-5% depending on typing proficiency and text complexity.

**Superhuman speed.** Sustained typing above 150 WPM is beyond the capability of all but elite competitive typists. Automation tools that dispatch characters faster than this are immediately flagged.

### Pydoll's Keyboard Humanization

Pydoll's `type_text(humanize=True)` addresses each detection vector with configurable parameters:

Keystroke delays are drawn from a uniform distribution (30-120ms by default) rather than a fixed interval. Punctuation characters (`.!?;:,`) receive additional delay (80-180ms), simulating the pause that occurs when a typist considers sentence structure. Thinking pauses (300-700ms) occur with 2% probability, simulating brief moments of thought. Distraction pauses (500-1200ms) occur with 0.5% probability, simulating the typist looking away or being briefly interrupted.

Realistic typos occur with approximately 2% probability per character, with five distinct error types weighted by their real-world frequency: adjacent key errors (55%, pressing a neighboring key on QWERTY), transpositions (20%, swapping two consecutive characters), double presses (12%, hitting a key twice), skipped characters (8%, hesitating before typing correctly), and missed spaces (5%, forgetting a space between words). Each error type includes a realistic recovery sequence (pause, backspace, correction) with appropriate timing.

```python
# Humanized typing
await element.type_text("Hello, world!", humanize=True)

# With custom timing configuration
from pydoll.interactions.keyboard import Keyboard, TimingConfig, TypoConfig

config = TimingConfig(
    keystroke_min=0.04,
    keystroke_max=0.15,
    thinking_probability=0.03,
)
keyboard = Keyboard(connection_handler, timing_config=config)
await keyboard.type_text("Custom timing example", humanize=True)
```

!!! note "What Pydoll Does Not Do"
    Pydoll's keyboard humanization uses uniform random delays rather than bigram-aware timing. It does not model per-key dwell time variation or hand-alternation speed differences. For most automation scenarios (form filling, search queries), uniform variation is sufficient to pass behavioral detection. Applications requiring authentication-level keystroke biometric evasion would need custom timing models.

## Scroll Behavior Analysis

Scroll fingerprinting analyzes how users navigate vertically (and horizontally) through page content. The distinction between human and automated scrolling is stark: programmatic `window.scrollTo()` calls produce instant, discrete jumps, while human scrolling via mouse wheel, trackpad, or touch produces a stream of small incremental events with momentum and deceleration.

### Physical Scroll Characteristics

Mouse wheel scrolling produces discrete `wheel` events with consistent delta values (typically 100 or 120 pixels per notch, depending on OS and browser). The events arrive at irregular intervals reflecting how quickly the user turns the wheel. Trackpad scrolling produces many small events with decreasing deltas, simulating physical momentum. Touch scrolling is similar to trackpad but with larger initial deltas and longer deceleration tails.

Detection systems analyze the delta distribution, inter-event timing, and deceleration curve. A `scrollTo(0, 5000)` call produces a single jump with no intermediate events, which is fundamentally different from the hundreds of incremental events that a human scroll generates.

### Detection Signals

**Instant scrolling.** Using `window.scrollTo()` or `window.scrollBy()` with large values produces zero intermediate scroll events. Detection systems that listen for `scroll` events see the scroll position change in a single frame.

**Uniform deltas.** Programmatic scroll simulation that dispatches wheel events with constant delta values (e.g., always 100 pixels) lacks the natural variation in human scrolling, where delta values fluctuate by 10-30% due to inconsistent finger pressure.

**No deceleration.** Human scrolling, especially on trackpads, has a momentum phase where the scroll continues after the user lifts their finger, with exponentially decreasing velocity. Automated scrolling that stops abruptly lacks this deceleration tail.

**Absence of direction changes.** Humans frequently over-scroll and scroll back slightly, or pause partway down a page to read content. Automated scrolling that moves in one direction at constant speed without pauses or reversals is suspicious.

### Pydoll's Scroll Humanization

Pydoll's scroll module implements humanized scrolling through `scroll.by(position, distance, humanize=True)`:

The scroll follows a cubic Bezier easing curve (control points `0.645, 0.045, 0.355, 1.0` by default), producing natural acceleration and deceleration. Per-frame jitter of ±3 pixels adds variation to delta values. Micro-pauses (20-50ms) occur with 5% probability, simulating brief reading stops. Overshoot occurs with 15% probability, scrolling 2-8% past the target and correcting back. For large distances, the scroll is broken into multiple "flick" gestures (100-1200 pixels each), simulating how a real user scrolls through a long page with repeated swipes rather than a single continuous motion.

```python
from pydoll.interactions.scroll import Scroll, ScrollPosition

scroll = Scroll(connection_handler)

# Humanized scroll down by 800 pixels
await scroll.by(ScrollPosition.Y, 800, humanize=True)

# Scroll to top/bottom uses multiple human-like flicks
await scroll.to_bottom(humanize=True)
```

## Additional Detection Vectors

Beyond mouse, keyboard, and scroll analysis, sophisticated detection systems monitor several other behavioral signals.

### Focus and Visibility

The Page Visibility API (`document.visibilityState`) and focus events (`window.onfocus`, `window.onblur`) reveal whether the user is actively viewing the page. A real user's session includes tab switches, window minimizations, and periods of inactivity. An automation script that maintains continuous focus for hours without a single blur event is behaviorally anomalous. Similarly, `document.hasFocus()` returning `true` continuously for extended periods is unusual.

### Idle Patterns

Real users have natural idle periods: reading content, thinking before acting, being distracted. Detection systems measure the distribution of idle times between interactions. A session where every action follows the previous one within 100-500ms with no longer pauses follows a pattern that is statistically distinct from human browsing, where idle periods of 2-30 seconds between actions are normal.

### Event Sequence Integrity

Browsers generate specific event sequences for user interactions. A mouse click produces `pointerdown`, `mousedown`, `pointerup`, `mouseup`, `click` in that order, preceded by `pointermove`/`mousemove` events showing the cursor approaching the click target. Automation tools that dispatch a bare `click` event without the preceding movement and pointer events are detectable through event sequence analysis.

Pydoll's CDP-based event dispatch generates complete event sequences because it uses Chrome's input simulation, which produces the same event chain as real user input.

## Machine Learning Detection

Modern anti-bot systems (DataDome, Akamai Bot Manager, Cloudflare Bot Management, PerimeterX/HUMAN Security) do not use simple threshold rules. They train machine learning models on millions of real user sessions and millions of known bot sessions, learning to distinguish humans from automation based on 50+ features simultaneously.

These models capture statistical properties that are hard to enumerate as individual rules: the joint distribution of movement speed and curvature, the correlation between typing speed and error rate, the relationship between scroll depth and reading time, and the overall "rhythm" of a browsing session. A system that passes every individual check but has subtly wrong correlations between features can still be flagged by a well-trained model.

The practical implication is that behavioral evasion must be consistent across all interaction types, not just individually plausible. Pydoll's `humanize=True` parameter provides a coherent humanization layer across mouse, keyboard, and scroll interactions, but the developer is still responsible for higher-level behavioral plausibility: adding reading delays between page loads, varying the pace of a multi-page workflow, and including natural idle periods.

## References

- Fitts, P. M. (1954). The Information Capacity of the Human Motor System in Controlling the Amplitude of Movement. Journal of Experimental Psychology.
- MacKenzie, I. S. (1992). Fitts' Law as a Research and Design Tool in Human-Computer Interaction. Human-Computer Interaction.
- Flash, T., & Hogan, N. (1985). The Coordination of Arm Movements: An Experimentally Confirmed Mathematical Model. Journal of Neuroscience.
- Abend, W., Bizzi, E., & Morasso, P. (1982). Human Arm Trajectory Formation. Brain.
- Meyer, D. E., Abrams, R. A., Kornblum, S., Wright, C. E., & Smith, J. E. K. (1988). Optimality in Human Motor Performance. Psychological Review.
- Ahmed, A. A. E., & Traore, I. (2007). A New Biometric Technology Based on Mouse Dynamics. IEEE TDSC.


================================================
FILE: docs/en/deep-dive/fingerprinting/browser-fingerprinting.md
================================================
# Browser Fingerprinting

Browser fingerprinting identifies clients by analyzing properties exposed through JavaScript APIs, HTTP headers, and rendering engines. Unlike network fingerprinting, which examines protocol-level signals from the OS kernel and TLS library, browser fingerprinting targets the application layer: the specific browser, its version, its configuration, and the hardware it runs on. These signals are accessible to any website through standard web APIs, and the combination of enough properties creates a fingerprint that is often unique across millions of visitors.

!!! info "Module Navigation"
    - [Network Fingerprinting](./network-fingerprinting.md): TCP/IP, TLS, HTTP/2 protocol fingerprinting
    - [Behavioral Fingerprinting](./behavioral-fingerprinting.md): Mouse, keyboard, scroll analysis
    - [Evasion Techniques](./evasion-techniques.md): Practical countermeasures

## JavaScript Navigator Properties

The `navigator` object is the richest single source of browser fingerprinting data. It exposes dozens of properties that reveal the browser, its capabilities, and the system it runs on. Detection systems collect these properties, cross-reference them against each other and against HTTP headers, and flag inconsistencies.

The following JavaScript collects the core set of properties that fingerprinting systems typically examine:

```javascript
const fingerprint = {
    // Identity
    userAgent: navigator.userAgent,
    platform: navigator.platform,
    vendor: navigator.vendor,

    // Language and locale
    language: navigator.language,
    languages: navigator.languages,

    // Hardware
    hardwareConcurrency: navigator.hardwareConcurrency,
    deviceMemory: navigator.deviceMemory,
    maxTouchPoints: navigator.maxTouchPoints,

    // Features
    cookieEnabled: navigator.cookieEnabled,
    doNotTrack: navigator.doNotTrack,
    webdriver: navigator.webdriver,

    // Screen
    screenWidth: screen.width,
    screenHeight: screen.height,
    colorDepth: screen.colorDepth,
    devicePixelRatio: window.devicePixelRatio,

    // Window chrome (toolbar, scrollbar dimensions)
    chromeHeight: window.outerHeight - window.innerHeight,
    chromeWidth: window.outerWidth - window.innerWidth,

    // Timezone
    timezone: Intl.DateTimeFormat().resolvedOptions().timeZone,
    timezoneOffset: new Date().getTimezoneOffset(),
};
```

Several of these properties deserve individual attention because they carry more fingerprinting weight or are more commonly misconfigured by automation tools.

### Platform and User-Agent Consistency

The `navigator.platform` property returns a string like `Win32`, `MacIntel`, or `Linux x86_64`. Detection systems compare this against the User-Agent header. If the HTTP User-Agent claims `Windows NT 10.0` but `navigator.platform` returns `Linux x86_64`, the mismatch is a strong signal. This is one of the most common mistakes in automation: setting a custom User-Agent via `--user-agent=` without also overriding the platform.

### Hardware Properties

`navigator.hardwareConcurrency` returns the number of logical CPU cores. A value of 1 or 2 suggests a minimal VM or container rather than a real user's machine. `navigator.deviceMemory` reports approximate RAM in gigabytes (0.25, 0.5, 1, 2, 4, 8). This property is only available in Chromium browsers; Firefox and Safari return `undefined`. Both values should be consistent with the claimed device: a User-Agent claiming a modern desktop but reporting 1 core and 0.5 GB of RAM is suspicious.

### WebDriver Property

The `navigator.webdriver` property is `true` when the browser is controlled by WebDriver-based automation (Selenium, Playwright in WebDriver mode). This is the single most obvious automation indicator. Pydoll uses CDP (Chrome DevTools Protocol) directly, which does not set this flag. In a Pydoll-controlled browser, `navigator.webdriver` is `false` (`undefined` on older Chrome releases), matching the behavior of a normal user session.

### Plugins

The `navigator.plugins` property was historically a strong fingerprinting vector because different browsers and OS configurations exposed different plugin lists. Modern Chromium browsers (Chrome 90+) return a fixed list of five PDF-related plugins regardless of actual plugin state:

```javascript
// Modern Chrome always returns these 5 plugins:
// 1. PDF Viewer
// 2. Chrome PDF Viewer
// 3. Chromium PDF Viewer
// 4. Microsoft Edge PDF Viewer
// 5. WebKit built-in PDF
console.log(navigator.plugins.length); // 5
```

A common misconception is that modern browsers return an empty array for `navigator.plugins`. This is incorrect. Returning an empty array is itself a detection signal that suggests headless mode or a non-browser HTTP client.

### Screen and Window Dimensions

The gap between `window.outerWidth`/`outerHeight` and `window.innerWidth`/`innerHeight` represents the browser chrome (toolbars, scrollbars, window frame). Headless browsers often report zero difference because they have no visible UI. Detection systems flag clients where `outerWidth` equals `innerWidth` as potentially headless. Similarly, `screen.width` matching `innerWidth` exactly suggests a maximized headless window rather than a normal desktop session.

The `devicePixelRatio` varies by display: standard monitors report `1.0`, MacBook Retina displays report `2.0`, and smartphones report `2.0` to `3.0`. This value should be consistent with the claimed device in the User-Agent.

## User-Agent Client Hints

Modern Chromium browsers (Chrome, Edge, Opera) supplement the traditional User-Agent string with Client Hints headers: `Sec-CH-UA`, `Sec-CH-UA-Platform`, `Sec-CH-UA-Mobile`, and (on request) higher-entropy values like `Sec-CH-UA-Full-Version-List`, `Sec-CH-UA-Arch`, and `Sec-CH-UA-Bitness`.

```http
Sec-CH-UA: "Chromium";v="120", "Google Chrome";v="120", "Not:A-Brand";v="99"
Sec-CH-UA-Mobile: ?0
Sec-CH-UA-Platform: "Windows"
```

Client Hints provide structured, machine-readable data that is harder to spoof inconsistently. A server can compare the `Sec-CH-UA-Platform` header against `navigator.platform`, the User-Agent string, and the TCP/IP fingerprint. Any inconsistency across these layers is a detection signal.

The JavaScript-side equivalent is `navigator.userAgentData`, which exposes `brands`, `mobile`, and `platform` as low-entropy values, and `getHighEntropyValues()` for detailed version, architecture, and bitness information:

```javascript
// Low-entropy (always available, no permission needed)
console.log(navigator.userAgentData.brands);
// [{brand: "Chromium", version: "120"}, {brand: "Google Chrome", version: "120"}, ...]
console.log(navigator.userAgentData.platform); // "Windows"
console.log(navigator.userAgentData.mobile);   // false

// High-entropy (requires promise, may require permission)
const highEntropy = await navigator.userAgentData.getHighEntropyValues([
    'architecture', 'bitness', 'platformVersion', 'uaFullVersion'
]);
// {architecture: "x86", bitness: "64", platformVersion: "15.0.0", ...}
```

!!! warning "Browser Support"
    Client Hints are a Chromium-only feature. Firefox and Safari do not send `Sec-CH-UA` headers and do not expose `navigator.userAgentData`. If the User-Agent claims Firefox but the server receives Client Hints headers, the client is not Firefox.

## Canvas Fingerprinting

Canvas fingerprinting exploits the fact that the HTML5 Canvas API produces subtly different pixel output across different combinations of GPU, graphics driver, OS, and browser. The variation comes from differences in font rasterization (sub-pixel rendering, hinting, anti-aliasing), GPU-specific shader execution, floating-point precision in the graphics pipeline, and OS-level text rendering libraries (DirectWrite on Windows, Core Text on macOS, FreeType on Linux).

The technique draws text, shapes, and gradients onto a hidden canvas, extracts the pixel data, and hashes it:

```javascript
function generateCanvasFingerprint() {
    const canvas = document.createElement('canvas');
    canvas.width = 220;
    canvas.height = 30;
    const ctx = canvas.getContext('2d');

    // Colored rectangle (exposes blending differences)
    ctx.fillStyle = '#f60';
    ctx.fillRect(125, 1, 62, 20);

    // Text with emoji (maximizes rendering variation)
    ctx.font = '14px Arial';
    ctx.textBaseline = 'alphabetic';
    ctx.fillStyle = '#069';
    ctx.fillText('Cwm fjordbank glyphs vext quiz, 😃', 2, 15);

    // Semi-transparent overlay (exposes alpha compositing differences)
    ctx.fillStyle = 'rgba(102, 204, 0, 0.7)';
    ctx.fillText('Cwm fjordbank glyphs vext quiz, 😃', 4, 17);

    return canvas.toDataURL();
}
```

The pangram "Cwm fjordbank glyphs vext quiz" is chosen because it uses unusual character combinations that stress font rendering. The emoji adds another dimension because emoji rendering varies significantly across operating systems. The semi-transparent overlay tests alpha compositing, which differs across GPU implementations.

Canvas fingerprinting is effective for distinguishing broad categories of devices, but its uniqueness is sometimes overstated. Research by Laperdrix et al. (2016) found that canvas fingerprints alone provide moderate distinguishing power, and their real value comes from combining with other signals (WebGL, navigator properties, timezone) to achieve high uniqueness.

!!! note "Canvas Noise Injection"
    Some privacy tools inject random noise into canvas output to break fingerprinting. Detection systems counter this by requesting the canvas fingerprint multiple times in the same session. If the hash changes between requests, noise injection is present, which is itself a detection signal. Randomizing canvas output is therefore counterproductive: it does not prevent identification and it reveals the use of anti-fingerprinting tools.

Since Pydoll controls a real Chrome instance with actual GPU rendering, the canvas fingerprint is authentic and consistent across repeated reads. No injection or spoofing is needed.

## WebGL Fingerprinting

WebGL fingerprinting extends canvas fingerprinting into the 3D rendering pipeline. It is more powerful because it directly exposes hardware identifiers that are difficult to spoof.

The most distinctive data comes from the `WEBGL_debug_renderer_info` extension, which reveals the GPU vendor and model:

```javascript
function getWebGLFingerprint() {
    const canvas = document.createElement('canvas');
    const gl = canvas.getContext('webgl');
    if (!gl) return null;

    // GPU identification (most distinctive)
    const debugInfo = gl.getExtension('WEBGL_debug_renderer_info');
    const vendor = debugInfo
        ? gl.getParameter(debugInfo.UNMASKED_VENDOR_WEBGL)
        : gl.getParameter(gl.VENDOR);
    const renderer = debugInfo
        ? gl.getParameter(debugInfo.UNMASKED_RENDERER_WEBGL)
        : gl.getParameter(gl.RENDERER);

    return {
        vendor,    // e.g. "Google Inc. (NVIDIA)"
        renderer,  // e.g. "ANGLE (NVIDIA, NVIDIA GeForce RTX 3080 Direct3D11 vs_5_0 ps_5_0)"
        version: gl.getParameter(gl.VERSION),
        shadingLanguageVersion: gl.getParameter(gl.SHADING_LANGUAGE_VERSION),
        maxTextureSize: gl.getParameter(gl.MAX_TEXTURE_SIZE),
        extensions: gl.getSupportedExtensions(),
    };
}
```

The renderer string directly names the GPU hardware. A client claiming to be a mobile device but reporting a desktop GPU is obviously inconsistent. Virtual machines often report software renderers like "SwiftShader" or "llvmpipe", which real users almost never have.

Beyond metadata, WebGL can render a 3D scene (a gradient triangle, for instance) and hash the pixel output, producing a render fingerprint analogous to canvas fingerprinting but in the 3D pipeline. The combination of GPU identifiers, supported extensions, parameter limits (`MAX_TEXTURE_SIZE`, `MAX_VIEWPORT_DIMS`), and shader precision formats creates a detailed fingerprint of the graphics stack.

## AudioContext Fingerprinting

The Web Audio API generates fingerprints by processing audio and measuring the output. The standard technique creates an `OscillatorNode`, routes it through a `DynamicsCompressorNode`, and reads the resulting audio samples from an `AnalyserNode` or `OfflineAudioContext`. Differences in audio processing implementations across browsers and OS audio stacks produce distinct output.

```javascript
function getAudioFingerprint() {
    const ctx = new OfflineAudioContext(1, 44100, 44100);
    const oscillator = ctx.createOscillator();
    oscillator.type = 'triangle';
    oscillator.frequency.setValueAtTime(10000, ctx.currentTime);

    const compressor = ctx.createDynamicsCompressor();
    compressor.threshold.setValueAtTime(-50, ctx.currentTime);
    compressor.knee.setValueAtTime(40, ctx.currentTime);
    compressor.ratio.setValueAtTime(12, ctx.currentTime);
    compressor.attack.setValueAtTime(0, ctx.currentTime);
    compressor.release.setValueAtTime(0.25, ctx.currentTime);

    oscillator.connect(compressor);
    compressor.connect(ctx.destination);
    oscillator.start(0);

    return ctx.startRendering().then(buffer => {
        const data = buffer.getChannelData(0);
        // Hash a subset of the audio samples
        let hash = 0;
        for (let i = 4500; i < 5000; i++) {
            hash += Math.abs(data[i]);
        }
        return hash;
    });
}
```

AudioContext fingerprinting is less widely deployed than canvas or WebGL fingerprinting, but it adds another dimension to the overall fingerprint. The signal is particularly useful for distinguishing browsers on the same OS, since audio processing varies more across browser engines than across OS versions.

## Battery Status API

The Battery Status API (`navigator.getBattery()`) exposes the device's battery level, charging status, and estimated charge/discharge times. These values create a short-lived but unique fingerprint for the duration of a session.

This API is only available in Chromium browsers. Firefox removed it in version 52 (2017) citing privacy concerns, and Safari has never implemented it. Detection systems that see Battery API results from a client claiming to be Firefox or Safari know the client is misrepresenting its identity.

## HTTP Header Fingerprinting

Beyond JavaScript APIs, HTTP headers provide fingerprinting signals visible to the server before any JavaScript executes.

### Header Order

Browsers send HTTP headers in a consistent, version-specific order. Chrome places `Sec-CH-UA` headers early, before `User-Agent`. Firefox leads with `User-Agent` followed by `Accept` and `Accept-Language`. Automated HTTP libraries like Python's `requests` or `httpx` send headers in yet another order, typically starting with `Host` and `Connection`.

Detection systems record the order of the first 10-15 headers and compare against known browser signatures. Even if all individual header values are correct, sending them in the wrong order reveals that the request was not generated by the claimed browser. Since Pydoll controls a real Chrome instance, the header order is authentic.

### Accept-Encoding

Modern browsers support Brotli compression (`br`) in addition to `gzip` and `deflate`. Chrome also supports `zstd`. The `Accept-Encoding` header for modern Chrome looks like `gzip, deflate, br, zstd`. A client claiming to be Chrome but missing Brotli is either outdated or automated.

### Accept-Language Consistency

The `Accept-Language` header should be consistent with `navigator.language`, `navigator.languages`, the timezone, and the IP geolocation. A request with `Accept-Language: en-US` from an IP in Tokyo with timezone `Asia/Tokyo` is plausible for a traveler but suspicious in combination with other signals. A request with `Accept-Language: zh-CN` and timezone `America/New_York` from a Chinese datacenter IP is a strong proxy indicator.

## Implications for Pydoll

Because Pydoll drives a real Chromium browser through CDP, all browser-level fingerprints are authentic by default. The canvas, WebGL, and AudioContext fingerprints come from actual GPU and audio hardware. The navigator properties, plugins, and screen dimensions reflect the real browser state. HTTP headers, including their order, are generated by Chrome's networking stack.

The main risk in automation is inconsistency across layers. Setting a custom User-Agent without synchronizing related properties creates trivially detectable mismatches. Pydoll handles this automatically: when it detects `--user-agent=` in the browser arguments, it uses `Emulation.setUserAgentOverride` to synchronize the User-Agent string, platform, and full Client Hints metadata across all layers. It also injects `navigator.vendor` and `navigator.appVersion` overrides via `Page.addScriptToEvaluateOnNewDocument` to ensure consistency in newly opened tabs.

For timezone and geolocation consistency (to match a proxy IP's location), JavaScript overrides can set `Intl.DateTimeFormat().resolvedOptions().timeZone` and `Date.prototype.getTimezoneOffset`. The `--lang` flag and `set_accept_languages()` configure language headers. The `webrtc_leak_protection` option prevents WebRTC from exposing the real IP behind a proxy.

The general principle is that Pydoll provides the authentic browser fingerprint as a baseline, and the developer only needs to ensure that the configurable layers (User-Agent, timezone, language, geolocation) are consistent with each other and with the proxy's characteristics.

## References

- Laperdrix, P., Rudametkin, W., & Baudry, B. (2016). Beauty and the Beast: Diverting Modern Web Browsers to Build Unique Browser Fingerprints. IEEE S&P.
- Mowery, K., & Shacham, H. (2012). Pixel Perfect: Fingerprinting Canvas in HTML5. USENIX Security.
- Eckersley, P. (2010). How Unique Is Your Web Browser? Privacy Enhancing Technologies Symposium.
- WICG Client Hints Infrastructure: https://wicg.github.io/client-hints-infrastructure/
- BrowserLeaks: https://browserleaks.com/
- CreepJS: https://abrahamjuliot.github.io/creepjs/


================================================
FILE: docs/en/deep-dive/fingerprinting/evasion-techniques.md
================================================
# Evasion Techniques

This document covers practical techniques for evading fingerprinting detection using Pydoll. The previous sections described how detection works at each layer: [network fingerprinting](./network-fingerprinting.md) (TCP/IP, TLS, HTTP/2), [browser fingerprinting](./browser-fingerprinting.md) (Canvas, WebGL, navigator properties), and [behavioral fingerprinting](./behavioral-fingerprinting.md) (mouse, keyboard, scroll). This section focuses on countermeasures.

The core principle is consistency across layers. Passing one detection layer while failing another still results in a flag. A residential IP with a mismatched TCP fingerprint, or a perfect browser fingerprint with robotic mouse movements, will be caught by any system that correlates signals.

!!! info "Module Navigation"
    - [Network Fingerprinting](./network-fingerprinting.md): Protocol-level identification
    - [Browser Fingerprinting](./browser-fingerprinting.md): Application-layer detection
    - [Behavioral Fingerprinting](./behavioral-fingerprinting.md): Human behavior analysis

## What Pydoll Provides by Default

Before configuring anything, it helps to understand what Pydoll gives you for free by using a real Chrome instance via CDP.

**Authentic network fingerprints.** Chrome's TCP/IP stack, TLS implementation (BoringSSL), and HTTP/2 stack produce genuine fingerprints. The TLS ClientHello, HTTP/2 SETTINGS frame, pseudo-header order, and stream priorities all match a real Chrome browser. Tools that construct HTTP requests programmatically (requests, httpx, curl) produce non-browser fingerprints at these layers. With Pydoll, they are authentic by default.

**Authentic browser fingerprints.** Canvas, WebGL, and AudioContext fingerprints come from real GPU and audio hardware. Navigator properties, plugins (the standard 5 PDF plugins), and MIME types reflect genuine browser state. There is nothing to configure here.

**No `navigator.webdriver`.** Selenium, Playwright, and Puppeteer set `navigator.webdriver` to `true`. Pydoll uses CDP directly, which does not set this flag. The property is `false` (`undefined` on older Chrome releases), matching a normal user session.

**Complete event sequences.** When Pydoll dispatches input events through CDP's Input domain, Chrome generates the full event chain (pointermove, pointerdown, mousedown, pointerup, mouseup, click) exactly as it would for real user input.

## User-Agent Consistency

The most common fingerprinting inconsistency in automation is a mismatch between the HTTP `User-Agent` header, `navigator.userAgent` in JavaScript, `navigator.platform`, and Client Hints headers (`Sec-CH-UA`, `Sec-CH-UA-Platform`). Setting `--user-agent=` as a Chrome flag only changes the HTTP header, leaving JavaScript properties and Client Hints unchanged.

Pydoll solves this automatically. When it detects `--user-agent=` in the browser arguments, it:

1. Parses the UA string to extract browser name, version, and OS.
2. Calls `Emulation.setUserAgentOverride` via CDP with the full `userAgent`, the correct `platform` value (e.g., `Win32` for Windows), and complete `userAgentMetadata` (Client Hints data including `Sec-CH-UA`, `Sec-CH-UA-Platform`, `Sec-CH-UA-Full-Version-List`).
3. Injects `navigator.vendor` and `navigator.appVersion` overrides via `Page.addScriptToEvaluateOnNewDocument`, ensuring consistency even in newly opened tabs.

```python
from pydoll.browser.chromium import Chrome
from pydoll.browser.options import ChromiumOptions

options = ChromiumOptions()
options.add_argument(
    '--user-agent=Mozilla/5.0 (Windows NT 10.0; Win64; x64) '
    'AppleWebKit/537.36 (KHTML, like Gecko) '
    'Chrome/120.0.6099.109 Safari/537.36'
)

async with Chrome(options=options) as browser:
    tab = await browser.start()
    # All layers are now consistent:
    # - HTTP User-Agent header
    # - navigator.userAgent / navigator.platform / navigator.appVersion
    # - Sec-CH-UA / Sec-CH-UA-Platform / Sec-CH-UA-Full-Version-List
    # - navigator.userAgentData.brands / .platform
    await tab.go_to('https://example.com')
```

This override is applied automatically to the initial tab, new tabs from `browser.new_tab()`, and any tabs discovered via `browser.get_opened_tabs()`.

!!! note "Supported Platforms"
    The UA parser handles Chrome and Edge User-Agent strings for Windows (NT 6.1 through 10.0), macOS, Linux, Android, iOS, and Chrome OS. It generates proper GREASE brand values following the Chromium specification.

## Timezone and Locale Consistency

When using a proxy, the browser's timezone and language should match the proxy IP's geographic location. An IP geolocated to Tokyo with a browser timezone of `America/New_York` and `Accept-Language: en-US` is a detectable inconsistency.

### Language Configuration

Language is configured through Chrome flags and Pydoll's options API:

```python
options = ChromiumOptions()
options.add_argument('--lang=ja-JP')
options.set_accept_languages('ja-JP,ja;q=0.9,en;q=0.8')
```

This sets both the `Accept-Language` HTTP header and `navigator.language` / `navigator.languages`.

### Timezone Override

Pydoll does not currently wrap CDP's `Emulation.setTimezoneOverride` command, so timezone override requires JavaScript injection. The critical APIs to override are `Intl.DateTimeFormat().resolvedOptions().timeZone` and `Date.prototype.getTimezoneOffset()`:

```python
async def set_timezone(tab, timezone_id: str, offset_minutes: int):
    """
    Override timezone via JavaScript.

    Args:
        timezone_id: IANA timezone name (e.g., 'Asia/Tokyo')
        offset_minutes: Value that Date.prototype.getTimezoneOffset() should
            return, i.e. UTC minus local time in minutes (e.g., -540 for
            JST, which is UTC+9)
    """
    script = f'''
        const _origDTF = Intl.DateTimeFormat;
        Intl.DateTimeFormat = function(...args) {{
            const opts = args[1] || {{}};
            opts.timeZone = '{timezone_id}';
            return new _origDTF(args[0], opts);
        }};
        Object.defineProperty(Intl.DateTimeFormat, 'prototype', {{
            value: _origDTF.prototype
        }});
        Date.prototype.getTimezoneOffset = function() {{ return {offset_minutes}; }};
    '''
    await tab.execute_script(script)
```

!!! warning "`execute_script` vs `addScriptToEvaluateOnNewDocument`"
    `tab.execute_script()` runs JavaScript in the current page context. If the page navigates, the override is lost. For overrides that must persist across navigations, use CDP's `Page.addScriptToEvaluateOnNewDocument`, which injects the script before any page JavaScript runs on every new document load. Pydoll uses this internally for User-Agent overrides. For timezone, you can send the CDP command directly:

    ```python
    await tab._connection_handler.execute_command(
        'Page.addScriptToEvaluateOnNewDocument',
        {'source': script}
    )
    ```

### Geolocation Override

For sites that request geolocation permission, the Geolocation API can be overridden via JavaScript:

```python
async def set_geolocation(tab, latitude: float, longitude: float):
    script = f'''
        navigator.geolocation.getCurrentPosition = function(success) {{
            success({{
                coords: {{
                    latitude: {latitude}, longitude: {longitude},
                    accuracy: 1, altitude: null, altitudeAccuracy: null,
                    heading: null, speed: null
                }},
                timestamp: Date.now()
            }});
        }};
        navigator.geolocation.watchPosition = function(success) {{
            return navigator.geolocation.getCurrentPosition(success);
        }};
    '''
    await tab.execute_script(script)
```

## WebRTC Leak Protection

WebRTC can expose the client's real IP address even when using a proxy, through STUN/TURN server requests that bypass the proxy tunnel. Pydoll provides a built-in option to prevent this:

```python
options = ChromiumOptions()
options.webrtc_leak_protection = True
# Adds: --force-webrtc-ip-handling-policy=disable_non_proxied_udp
```

This forces Chrome to route all WebRTC traffic through the proxy, preventing IP leakage. It should be enabled whenever using a proxy for stealth automation.

## Behavioral Humanization

Pydoll implements humanized interactions for mouse, keyboard, and scroll through the `humanize=True` parameter. These are not future features or manual workarounds; they are built into the framework.

### Mouse

```python
# Humanized click: Bezier curve path, Fitts's Law timing,
# minimum-jerk velocity, tremor, overshoot + correction
await element.click(humanize=True)
```

When `humanize=True` is passed to a WebElement's `click()`, Pydoll generates a complete mouse movement from the current cursor position to the element using a cubic Bezier curve with randomized control points. The velocity follows a minimum-jerk profile. Physiological tremor, overshoot (70% probability), and micro-pauses are added. The movement duration is computed from Fitts's Law based on the distance and target size. See [Behavioral Fingerprinting](./behavioral-fingerprinting.md#pydolls-mouse-humanization) for detailed parameter descriptions.

### Keyboard

```python
# Humanized typing: variable delays, realistic typos (~2%),
# punctuation pauses, thinking pauses, distraction pauses
await element.type_text("Hello, world!", humanize=True)
```

Humanized typing uses variable inter-key delays (30-120ms uniform distribution), punctuation pauses, thinking pauses (2% probability), distraction pauses (0.5% probability), and realistic typos with five distinct error types and natural correction sequences. See [Behavioral Fingerprinting](./behavioral-fingerprinting.md#pydolls-keyboard-humanization) for the full parameter breakdown.

### Scroll

```python
from pydoll.interactions.scroll import Scroll, ScrollPosition

scroll = Scroll(connection_handler)
# Humanized scroll: Bezier easing, jitter, micro-pauses, overshoot
await scroll.by(ScrollPosition.Y, 800, humanize=True)
```

Humanized scrolling uses Bezier easing curves, per-frame jitter (±3px), micro-pauses (5% probability), and overshoot correction (15% probability). Large distances are broken into multiple "flick" gestures. See [Behavioral Fingerprinting](./behavioral-fingerprinting.md#pydolls-scroll-humanization) for details.

## Request Interception

Pydoll supports request interception via CDP's Fetch domain, allowing you to modify headers, block requests, or fulfill requests with custom responses before they reach the server:

```python
from pydoll.protocol.fetch.events import FetchEvent

async def handle_request(event):
    request_id = event['params']['requestId']
    request = event['params']['request']
    headers = request.get('headers', {})

    # Example: ensure Brotli support is advertised
    if 'Accept-Encoding' in headers and 'br' not in headers['Accept-Encoding']:
        headers['Accept-Encoding'] = 'gzip, deflate, br, zstd'

    header_list = [{'name': k, 'value': v} for k, v in headers.items()]
    await tab.continue_request(request_id=request_id, headers=header_list)

await tab.enable_fetch_events()
await tab.on(FetchEvent.REQUEST_PAUSED, handle_request)
```

In practice, header modification is rarely needed with Pydoll because Chrome generates correct headers natively. Request interception is more useful for blocking tracking scripts, modifying response content, or debugging.

## Browser Preferences for Realism

Chrome stores user preferences that fingerprinting systems can inspect. A brand-new browser profile with no history, no saved preferences, and default-everything looks different from a profile that has been used for weeks. Pydoll's `browser_preferences` option lets you pre-populate these:

```python
import time

options = ChromiumOptions()
options.browser_preferences = {
    'profile': {
        'created_by_version': '120.0.6099.130',
        'creation_time': str(time.time() - 90 * 86400),  # 90 days ago
        'exit_type': 'Normal',
    },
    'profile.default_content_setting_values': {
        'cookies': 1,
        'images': 1,
        'javascript': 1,
        'notifications': 2,  # Block (1 = Allow, 2 = Block, 3 = Ask)
    },
}
```

## Common Mistakes

### Randomizing Everything

Generating a random fingerprint from scratch (random hardwareConcurrency, random deviceMemory, random screen size) creates impossible combinations. Real devices have constrained configurations: a 4-core machine with 8 GB RAM, 1920x1080 screen, and Windows 10 is a plausible profile. A 17-core machine with 0.5 GB RAM, 3840x2160 screen, and `navigator.platform: Linux armv7l` is not. Use profiles captured from real browsers rather than random generation.

### Canvas Noise Injection

Adding random noise to canvas output to prevent fingerprinting is counterproductive. Detection systems request the fingerprint multiple times. If the hash changes between requests, noise injection is detected, which is itself a strong automation signal. With Pydoll, the canvas fingerprint is authentic and consistent. Leave it alone.

### Outdated User-Agents

Using a User-Agent from a browser version that is 6+ months old is detectable because the version lacks features and Client Hints values that the current release would have. Keep User-Agent strings current within the last 2-3 major Chrome versions.

### Ignoring Session-Level Behavior

Even with perfect fingerprints and humanized interactions, session-level behavior matters. Loading 100 pages in 60 seconds, never scrolling, clicking only buttons (never links), and maintaining constant focus for hours without a single tab switch or idle period are all behavioral anomalies. Add reading delays between navigations, vary the pace of multi-page workflows, and include natural idle periods.

## Verification

Before deploying automation at scale, verify your fingerprint using these tools:

| Tool | URL | Tests |
|------|-----|-------|
| BrowserLeaks | https://browserleaks.com/ | Canvas, WebGL, fonts, IP, WebRTC, HTTP/2 |
| CreepJS | https://abrahamjuliot.github.io/creepjs/ | Lie detection, consistency checks |
| Fingerprint.com | https://fingerprint.com/demo/ | Commercial-grade identification |
| PixelScan | https://pixelscan.net/ | Bot detection analysis |
| IPLeak | https://ipleak.net/ | WebRTC, DNS, IP leaks |

A basic verification script with Pydoll:

```python
async def verify_fingerprint(tab):
    """Collect basic fingerprint properties from ``tab`` and sanity-check them.

    Args:
        tab: Object exposing an awaitable ``execute_script(script)`` whose
            result nests the script's return value under
            ``['result']['result']['value']``.

    Returns:
        The dict of fingerprint properties reported by the page.

    Raises:
        AssertionError: If ``navigator.webdriver`` is truthy, the plugin
            count is not 5, or the User-Agent contains ``HeadlessChrome``.
    """
    result = await tab.execute_script('''
        return {
            userAgent: navigator.userAgent,
            platform: navigator.platform,
            webdriver: navigator.webdriver,
            languages: navigator.languages,
            plugins: navigator.plugins.length,
            timezone: Intl.DateTimeFormat().resolvedOptions().timeZone,
            colorDepth: screen.colorDepth,
            deviceMemory: navigator.deviceMemory,
            hardwareConcurrency: navigator.hardwareConcurrency,
        };
    ''')
    fp = result['result']['result']['value']

    # Check for obvious issues
    # A regular, non-automated Chrome reports navigator.webdriver as `false`.
    # An undefined value may arrive as null or be omitted from the serialized
    # object, so accept any falsy or missing value and only fail on `true`.
    assert not fp.get('webdriver'), 'navigator.webdriver should be false or undefined'
    assert fp['plugins'] == 5, f'Expected 5 plugins, got {fp["plugins"]}'
    assert 'HeadlessChrome' not in fp['userAgent'], 'Headless detected in UA'
    return fp
```

## References

- Chrome DevTools Protocol, Emulation Domain: https://chromedevtools.github.io/devtools-protocol/tot/Emulation/
- Chrome DevTools Protocol, Fetch Domain: https://chromedevtools.github.io/devtools-protocol/tot/Fetch/
- Chromium Source, Inspector Emulation Agent: https://source.chromium.org/chromium/chromium/src/+/main:third_party/blink/renderer/core/inspector/inspector_emulation_agent.cc


================================================
FILE: docs/en/deep-dive/fingerprinting/index.md
================================================
# Browser & Network Fingerprinting

This module covers browser and network fingerprinting, a critical aspect of modern web automation and detection systems.

Fingerprinting sits at the intersection of network protocols, cryptography, browser internals, and behavioral analysis. It encompasses the techniques used to identify and track devices, browsers, and users across sessions without relying on traditional identifiers like cookies or IP addresses.

## Why This Matters

Every browser connection to a website exposes multiple characteristics, from the precise order of TCP options in network packets, to GPU-specific canvas rendering, to JavaScript execution timing patterns. Individually, these characteristics may appear innocuous. Combined, they create a fingerprint that can uniquely identify a device or browser instance.

For automation engineers, bot developers, and privacy-conscious users, understanding fingerprinting is essential for building effective detection evasion systems and understanding how tracking mechanisms operate at a technical level.

!!! danger "Multi-Layer Detection Systems"
    Modern anti-bot systems employ comprehensive analysis across multiple layers:
    
    - **Network-level**: TCP/IP stack behavior, TLS handshake patterns, HTTP/2 settings
    - **Browser-level**: Canvas rendering, WebGL vendor strings, JavaScript property enumeration
    - **Behavioral**: Mouse movement entropy, keystroke timing, scroll patterns
    
    A single inconsistency (such as a Chrome User-Agent with Firefox TLS fingerprint) can trigger immediate blocking.

## Module Scope and Methodology

Fingerprinting techniques are documented across multiple sources with varying levels of accessibility and reliability:

- Academic papers (often paywalled and theoretical)
- Browser source code (millions of lines to analyze)
- Security researcher blogs (technical but fragmented)
- Anti-bot vendor whitepapers (marketing-focused, details omitted)
- Underground forums (practical but unreliable)

This module centralizes, validates, and organizes this knowledge into a cohesive technical guide. Every technique described here has been:

- **Verified** against browser source code and RFCs
- **Tested** in real automation scenarios
- **Cited** with authoritative references
- **Explained** from first principles to implementation  

## Module Structure

This module is organized into four progressive sections: three fingerprinting layers (network, browser, and behavioral), followed by practical evasion techniques:

### 1. Network-Level Fingerprinting
**[Network Fingerprinting](./network-fingerprinting.md)**

Covers device identification through network behavior at the transport and session layers, before browser rendering begins.

- **TCP/IP fingerprinting**: TTL, window size, option ordering
- **TLS fingerprinting**: JA3/JA4, cipher suites, ALPN negotiation
- **HTTP/2 fingerprinting**: SETTINGS frames, priority patterns
- **Tools & techniques**: p0f, Nmap, Scapy, tshark analysis

**Technical significance**: Network fingerprints are the most challenging to spoof because they require OS-level modifications. Inconsistencies at this layer are detected before JavaScript execution begins.

### 2. Browser-Level Fingerprinting
**[Browser Fingerprinting](./browser-fingerprinting.md)**

Examines browser identification through JavaScript APIs, rendering engines, and plugin ecosystems at the application layer.

- **Canvas & WebGL fingerprinting**: GPU-specific rendering artifacts
- **Audio fingerprinting**: Subtle differences in audio API output
- **Font enumeration**: Installed fonts reveal OS and locale
- **JavaScript properties**: Navigator object, screen dimensions, timezone
- **Header analysis**: Accept-Language, User-Agent consistency

**Technical significance**: This layer accounts for the majority of detection events. Even with correct network-level fingerprints, exposed automation properties (e.g., `navigator.webdriver`) can trigger blocking.

### 3. Behavioral Fingerprinting
**[Behavioral Fingerprinting](./behavioral-fingerprinting.md)**

Analyzes user interaction patterns to distinguish human behavior from automated systems.

- **Mouse movement analysis**: Trajectory curvature, velocity profiles, Fitts's Law compliance
- **Keystroke dynamics**: Typing rhythm, dwell time, flight time, bigram patterns
- **Scroll patterns**: Momentum, inertia, deceleration curves
- **Event sequences**: Natural interaction ordering (mousemove → click), timing analysis
- **Machine learning**: ML models trained on billions of behavioral signals

**Technical significance**: Behavioral analysis can detect automation even when network and browser fingerprints are correctly spoofed. This layer is particularly challenging because it requires replicating biomechanical human behavior patterns.

### 4. Evasion Techniques
**[Evasion Techniques](./evasion-techniques.md)**

Practical implementation of fingerprinting evasion using Pydoll's CDP integration, JavaScript overrides, and architectural features.

- **CDP-based spoofing**: Timezone, geolocation, device metrics
- **JavaScript property overrides**: Redefining navigator objects, canvas poisoning
- **Request interception**: Forcing header consistency
- **Behavioral mimicry**: Human-like timing, entropy injection
- **Detection testing**: Tools to validate your evasion setup

**Technical significance**: This section demonstrates practical application of fingerprinting concepts to real automation scenarios, integrating techniques from all previous layers.

## Who Should Read This

### **You MUST read this if you're:**
- Building automation that interacts with anti-bot protected sites
- Developing scraping infrastructure at scale
- Implementing privacy-preserving browser automation
- Researching bot detection for offensive or defensive purposes

### **This is advanced material if you're:**
- New to network protocols (start with [Network Fundamentals](../network/network-fundamentals.md))
- Unfamiliar with CDP (read [Chrome DevTools Protocol](../fundamentals/cdp.md) first)
- Just learning Python typing (see [Type System](../fundamentals/typing-system.md))

### **This is NOT:**
- A "silver bullet" anti-detection solution (no such thing exists)
- Legal advice on web scraping (consult [Legal & Ethical](../network/proxy-legal.md))
- A replacement for respecting robots.txt and rate limits

## The Technical Philosophy

Fingerprinting defense is **not about becoming invisible**—it's about becoming **indistinguishable from legitimate traffic**. This means:

1. **Consistency over perfection**: A perfectly configured Firefox fingerprint is better than a "perfect" but inconsistent Chrome fingerprint
2. **Holistic approach**: You must align network, browser, and behavioral layers
3. **Continuous adaptation**: Fingerprinting techniques evolve monthly; this is a living document

!!! tip "The Golden Rule"
    **Every layer must tell the same story.** If your TLS fingerprint says "Chrome 120", your HTTP/2 settings must match Chrome 120, your User-Agent must say Chrome 120, and your canvas rendering must produce Chrome 120 artifacts. One mismatch = detection.

## Ethical Considerations

Fingerprinting knowledge is **dual-use technology**:

- **Defensive**: Protect your privacy from invasive tracking
- **Offensive**: Evade detection systems for automation

We trust you to use this knowledge **responsibly and ethically**:

**Recommended practices:**

- Respect website terms of service
- Implement rate limiting and respectful crawling patterns
- Evaluate whether automation is necessary
- Be transparent when appropriate

**Prohibited uses:**

- Fraud, account abuse, or illegal activities
- Overwhelming servers with aggressive scraping
- Weaponizing this knowledge without understanding consequences  

## Ready to Dive Deep?

Fingerprinting is a complex and technical domain that requires systematic study. Understanding these techniques is essential for effective web automation in environments with detection systems.

Begin with **[Network Fingerprinting](./network-fingerprinting.md)** to establish foundational knowledge, continue with **[Browser Fingerprinting](./browser-fingerprinting.md)** for application-layer understanding, then **[Behavioral Fingerprinting](./behavioral-fingerprinting.md)** for interaction-level analysis, and conclude with **[Evasion Techniques](./evasion-techniques.md)** for practical implementation.

---

!!! info "Documentation Status"
    This module represents **extensive research** combining academic papers, browser source code, real-world testing, and community knowledge. Every claim is cited and validated. If you find inaccuracies or have updates, contributions are welcome.

## Further Reading

Before diving in, consider these complementary topics:

- **[Proxy Architecture](../network/http-proxies.md)**: Network-level anonymity fundamentals
- **[Browser Preferences](../../features/configuration/browser-preferences.md)**: Practical fingerprint configuration
- **[Behavioral Captcha Bypass](../../features/advanced/behavioral-captcha-bypass.md)**: Behavioral analysis and evasion


================================================
FILE: docs/en/deep-dive/fingerprinting/network-fingerprinting.md
================================================
# Network Fingerprinting

Network fingerprinting identifies clients by analyzing characteristics of the TCP/IP stack, TLS handshake, and HTTP/2 connection. These signals are set by the operating system kernel and the TLS library, not by the browser's JavaScript environment, which makes them harder to spoof than browser-level fingerprints. A proxy or VPN changes your IP address but does not alter your TCP window size, your TLS cipher suite list, or your HTTP/2 SETTINGS frame. Detection systems exploit this gap.

!!! info "Module Navigation"
    - [Browser Fingerprinting](./browser-fingerprinting.md): Canvas, WebGL, AudioContext
    - [Evasion Techniques](./evasion-techniques.md): Multi-layer countermeasures

    For protocol fundamentals, see [Network Fundamentals](../network/network-fundamentals.md). For proxy detection context, see [Proxy Detection](../network/proxy-detection.md).

## TCP/IP Fingerprinting

Every operating system implements the TCP/IP stack differently. The SYN packet that initiates a TCP connection carries enough information to identify the OS with high confidence: the initial TTL, the TCP window size, the Maximum Segment Size, and the order and selection of TCP options. None of these values are controlled by the browser. They come from the kernel.

### TTL (Time To Live)

The initial TTL is one of the simplest OS identifiers. Linux and macOS set it to 64, Windows sets it to 128, and network devices (routers, firewalls) typically use 255. Each router hop decrements the TTL by one, so a packet arriving with TTL 118 likely started at 128 (Windows) and crossed 10 hops.

The fingerprinting value of TTL comes from cross-referencing it with the User-Agent. If the browser claims to be Chrome on Windows but the packet arrives with a TTL near 64, the connection is either proxied through a Linux server or the User-Agent is spoofed. Detection systems round the observed TTL up to the nearest known initial value (64, 128, 255) and compare it against the claimed OS.

When traffic flows through a proxy, the TTL resets because the proxy's kernel generates a new TCP connection to the target. The target sees the proxy's TTL, not yours. This is why TTL mismatches are a proxy detection signal: the User-Agent says Windows (TTL 128) but the TCP fingerprint shows Linux (TTL 64).

### TCP Window Size and Scaling

The initial TCP window size in the SYN packet varies by OS and kernel version. Modern Linux kernels (3.x and later) typically send an initial window of 29200 bytes, which is `20 * MSS` where MSS is 1460 for standard Ethernet. Some newer kernels (5.x, 6.x) may use 64240 depending on configuration and `initcwnd` settings. Windows 10 and 11 typically send 65535 with window scaling enabled, though the exact value depends on auto-tuning configuration and patch level. macOS also defaults to 65535.

The window scale factor (a TCP option) multiplies the 16-bit window size field to support larger receive windows. Linux commonly uses a scale factor of 7 (allowing windows up to 8MB), while Windows often uses 8. Combined with the base window size, the scale factor creates a more granular fingerprint than either value alone.

### TCP Options Order

The selection and ordering of TCP options in the SYN packet is highly distinctive. Each OS arranges options in a fixed, version-specific order that the kernel does not expose as a configurable parameter. Linux sends `MSS, SACK_PERM, TIMESTAMP, NOP, WSCALE`. Windows sends `MSS, NOP, WSCALE, NOP, NOP, SACK_PERM` and notably omits the TIMESTAMP option in default configurations. macOS sends `MSS, NOP, WSCALE, NOP, NOP, TIMESTAMP, SACK_PERM`.

The presence or absence of specific options matters as much as the order. Windows historically omitted TCP timestamps, which Linux and macOS include by default. SACK (Selective Acknowledgment) is supported by all modern systems, but older or embedded systems may not advertise it. The combination of which options appear and in what order creates a signature that tools like p0f match against a database of known OS fingerprints.

### p0f

[p0f](https://lcamtuf.coredump.cx/p0f3/) is the standard tool for passive TCP/IP fingerprinting. It observes traffic without generating any packets, analyzing SYN and SYN+ACK packets against a signature database. Its signature format encodes the key fingerprinting fields:

```
version:ittl:olen:mss:wsize,scale:olayout:quirks:pclass
```

The `ittl` is the inferred initial TTL, `mss` is the Maximum Segment Size, `wsize,scale` is the window size (which can be absolute, or relative to MSS like `mss*20`), and `olayout` is the TCP options layout using shorthand names (`mss`, `nop`, `ws`, `sok`, `sack`, `ts`, `eol+N`). The `quirks` field captures unusual behaviors like the Don't Fragment flag (`df`) or non-zero IP ID on DF packets (`id+`).

A typical Linux 4.x+ signature in p0f looks like `4:64:0:*:mss*20,7:mss,sok,ts,nop,ws:df,id+:0`. A Windows 10 signature might look like `4:128:0:*:65535,8:mss,nop,ws,nop,nop,sok:df,id+:0`. Anti-bot services maintain similar databases internally, matching incoming connections against known OS profiles and flagging mismatches with the declared User-Agent.

## TLS Fingerprinting

The TLS ClientHello message is transmitted before encryption is established, so it is visible to any observer on the network path. It contains the TLS version, supported cipher suites, TLS extensions, supported elliptic curves (named groups), and EC point formats. Each browser and TLS library produces a characteristic combination of these fields.

### JA3

JA3, developed at Salesforce by John Althouse, Jeff Atkinson, and Josh Atkins, was the first widely adopted TLS fingerprinting method. It concatenates five fields from the ClientHello (TLS version, cipher suites, extensions, elliptic curves, EC point formats), joins values within each field with hyphens, separates the five fields with commas, and takes the MD5 hash of the resulting string.

```
JA3 string: 771,4865-4866-4867-49195-49199-49196-49200-52393-52392,0-23-65281-10-11-35-16-5-13-18-51-45-43-27-17513,29-23-24,0
JA3 hash:   cd08e31494b9531f560d64c695473da9
```

One subtlety: the "TLS version" field in JA3 uses `ClientHello.legacy_version`, not the `supported_versions` extension. Since TLS 1.3 (RFC 8446) requires clients to set `legacy_version` to `0x0303` (TLS 1.2) for backwards compatibility, the JA3 version field is almost always `771` for modern clients, even when they support TLS 1.3. The actual TLS 1.3 negotiation happens through extension 43 (`supported_versions`), but JA3 uses the header field.

JA3 must filter GREASE values before hashing. GREASE (RFC 8701) is a mechanism where browsers insert randomly selected reserved values into cipher suites, extensions, and other fields to prevent protocol ossification. The valid GREASE values are `0x0a0a`, `0x1a1a`, `0x2a2a`, and so on up to `0xfafa`. Each value has two identical bytes where the low nibble of each byte is `0x0a`. A correct GREASE filter checks both conditions:

```python
def is_grease(value: int) -> bool:
    """Return True if ``value`` is a GREASE value (0x0a0a, 0x1a1a, ..., 0xfafa)."""
    high_byte = value >> 8
    low_byte = value & 0xff
    # Both bytes must be identical, and each byte's low nibble must be 0xa.
    return high_byte == low_byte and (value & 0x0f0f) == 0x0a0a
```

!!! warning "JA3 Limitations with Modern Browsers"
    Since Chrome 110 (January 2023) and Firefox 114, browsers randomize the order of TLS extensions in every connection. This means the same browser produces different JA3 hashes on every connection, making JA3 effectively useless for identifying modern browsers. JA3 remains useful for fingerprinting non-browser clients (Python `requests`, `curl`, custom bots) that do not implement extension randomization.

### JA4

JA4 is the successor to JA3, developed by the same lead author (John Althouse) at FoxIO. It was designed specifically to survive TLS extension randomization by sorting extensions and cipher suites before hashing. The format consists of three sections separated by underscores: `a_b_c`.

Section `a` is a human-readable string of metadata: the protocol (`t` for TCP, `q` for QUIC), the TLS version (`12` or `13`), whether SNI is present (`d` for domain, `i` for IP), the number of cipher suites (two digits), the number of extensions (two digits), and the first and last characters of the first ALPN value (`h2` for HTTP/2, `00` if none). For example, `t13d1516h2` means TCP TLS 1.3 with SNI, 15 cipher suites, 16 extensions, and HTTP/2 ALPN.

Section `b` is a truncated SHA-256 hash of the sorted cipher suites. Section `c` is a truncated SHA-256 hash of the sorted extensions concatenated with the signature algorithms. Because both lists are sorted before hashing, extension randomization does not affect the output.

Cloudflare, AWS, and other major platforms have adopted JA4. The full JA4+ suite also includes JA4S (server fingerprinting), JA4H (HTTP client fingerprinting), JA4X (X.509 certificate fingerprinting), and JA4SSH (SSH fingerprinting). The specification and tools are available at [github.com/FoxIO-LLC/ja4](https://github.com/FoxIO-LLC/ja4).

### JA3S (Server Fingerprinting)

JA3S applies the same concept to the ServerHello message, but the format is simpler because the server selects a single cipher suite rather than offering a list. The JA3S string is `version,cipher,extensions` and its MD5 hash identifies the server's TLS implementation. Pairing JA3 (or JA4) with JA3S creates a bidirectional fingerprint: a specific client talking to a specific server produces a predictable JA3+JA3S pair, which is more distinctive than either fingerprint alone.

### How Proxies Interact with TLS Fingerprints

The type of proxy determines whether the TLS fingerprint is preserved. SOCKS5 proxies and HTTP CONNECT tunnels relay the TCP stream without terminating TLS, so the target server sees the original client's TLS fingerprint unchanged. This is the main advantage of these proxy types for fingerprint consistency.

MITM proxies (which terminate TLS and re-establish a new connection to the target) replace the client's TLS fingerprint with their own. The target sees the proxy software's cipher suites and extensions, not the browser's. If the proxy uses a standard TLS library like OpenSSL or BoringSSL with default settings, the fingerprint will not match any known browser, which is itself a detection signal.

This is why Pydoll's approach of using `--proxy-server` (which creates a CONNECT tunnel, preserving the browser's TLS fingerprint) is preferable to external MITM proxy setups for stealth automation.

## HTTP/2 Fingerprinting

HTTP/2 connections expose a separate set of fingerprinting signals that are distinct from TLS. The first frame sent by the client is a SETTINGS frame containing parameters like `HEADER_TABLE_SIZE`, `ENABLE_PUSH`, `MAX_CONCURRENT_STREAMS`, `INITIAL_WINDOW_SIZE`, `MAX_FRAME_SIZE`, and `MAX_HEADER_LIST_SIZE`. Each browser uses different default values and includes different subsets of these parameters.

Beyond SETTINGS, the WINDOW_UPDATE frame size, the priority/weight of the initial stream, and the order of HTTP/2 pseudo-headers (`:method`, `:authority`, `:scheme`, `:path`) vary between implementations. Chrome, Firefox, and Safari each produce a distinctive combination of these values.

Akamai published the foundational research on HTTP/2 fingerprinting at Black Hat Europe 2017. Their fingerprint format concatenates the SETTINGS values, WINDOW_UPDATE size, PRIORITY frames, and pseudo-header order. The JA4+ suite includes `JA4H` for HTTP-level fingerprinting, covering header order and values.

HTTP/2 fingerprinting is particularly effective against automation tools because many bot frameworks and HTTP libraries implement their own HTTP/2 stacks with default parameters that do not match any real browser. Even when a tool correctly spoofs the TLS fingerprint (using curl-impersonate or similar), its HTTP/2 SETTINGS frame may betray it.

You can check your HTTP/2 fingerprint at [browserleaks.com/http2](https://browserleaks.com/http2). Because Pydoll controls a real Chrome instance via CDP, the HTTP/2 fingerprint is always authentic, which is an inherent advantage over tools that construct HTTP requests programmatically.

## Implications for Browser Automation

The practical takeaway for automation with Pydoll is that network fingerprinting is one area where controlling a real browser provides a significant advantage. Chrome's TCP/IP stack, TLS implementation (BoringSSL), and HTTP/2 stack produce authentic fingerprints by default. The main risk is environmental mismatch: running Chrome on a Linux server while the User-Agent claims Windows creates a TCP/IP fingerprint inconsistency (TTL 64 instead of 128, Linux TCP options order instead of Windows).

For proxy-based setups, the fingerprint flow is: your machine's TCP/IP stack generates the connection to the proxy (which the proxy's operator can see but the target cannot), and the proxy's TCP/IP stack generates the connection to the target. The target sees the proxy server's TTL and TCP options. If the proxy runs Linux (as most do), the TCP fingerprint will indicate Linux regardless of the User-Agent. This is a well-known detection signal that residential proxies partially mitigate (the proxy endpoint is a real user's machine, so its TCP fingerprint is plausible) but datacenter proxies cannot.

The TLS and HTTP/2 fingerprints, on the other hand, pass through SOCKS5 and CONNECT tunnels unmodified. These are the browser's fingerprints, not the proxy's. So with Pydoll through a CONNECT tunnel, the target sees authentic Chrome TLS and HTTP/2 fingerprints paired with the proxy's TCP/IP fingerprint. This combination is consistent with a real user browsing through a VPN or corporate proxy, which is a common and legitimate pattern.

## References

- Salesforce Engineering: TLS Fingerprinting with JA3 and JA3S - https://engineering.salesforce.com/tls-fingerprinting-with-ja3-and-ja3s-247362855967/
- FoxIO JA4+ Network Fingerprinting - https://github.com/FoxIO-LLC/ja4
- Cloudflare: JA4 Signals - https://blog.cloudflare.com/ja4-signals/
- Akamai: Passive Fingerprinting of HTTP/2 Clients (Black Hat EU 2017) - https://blackhat.com/docs/eu-17/materials/eu-17-Shuster-Passive-Fingerprinting-Of-HTTP2-Clients-wp.pdf
- p0f v3: Passive OS Fingerprinting - https://lcamtuf.coredump.cx/p0f3/
- RFC 8446: TLS 1.3 - https://datatracker.ietf.org/doc/html/rfc8446
- RFC 8701: GREASE for TLS - https://datatracker.ietf.org/doc/html/rfc8701
- RFC 6528: Defending against Sequence Number Attacks - https://datatracker.ietf.org/doc/html/rfc6528
- BrowserLeaks HTTP/2 Fingerprint - https://browserleaks.com/http2
- Stamus Networks: JA3 Fingerprints Fade as Browsers Embrace Extension Randomization - https://www.stamus-networks.com/blog/ja3-fingerprints-fade-browsers-embrace-tls-extension-randomization


================================================
FILE: docs/en/deep-dive/fundamentals/cdp.md
================================================
# Chrome DevTools Protocol (CDP)

The Chrome DevTools Protocol (CDP) is the foundation that enables Pydoll to control browsers without traditional webdrivers. Understanding how CDP works provides valuable insight into Pydoll's capabilities and internal architecture.


## What is CDP?

The Chrome DevTools Protocol is a powerful interface developed by the Chromium team that allows programmatic interaction with Chromium-based browsers. It's the same protocol used by Chrome DevTools when you inspect a webpage, but exposed as a programmable API that can be leveraged by automation tools.

At its core, CDP provides a comprehensive set of methods and events for interfacing with browser internals. This allows for fine-grained control over every aspect of the browser, from navigating between pages to manipulating the DOM, intercepting network requests, and monitoring performance metrics.

!!! info "CDP Evolution"
    The Chrome DevTools Protocol has been continuously evolving since its introduction. Google maintains and updates the protocol with each Chrome release, regularly adding new functionality and improving existing features.
    
    While the protocol was initially designed for Chrome's DevTools, its comprehensive capabilities have made it the foundation for next-generation browser automation tools like Puppeteer, Playwright, and of course, Pydoll.

## WebSocket Communication

One of the key architectural decisions in CDP is its use of WebSockets for communication. When a Chromium-based browser is started with the remote debugging flag enabled, it opens a WebSocket server on a specified port:

```
chrome --remote-debugging-port=9222
```

Pydoll connects to this WebSocket endpoint to establish a bidirectional communication channel with the browser. This connection:

1. **Remains persistent** throughout the automation session
2. **Enables real-time events** from the browser to be pushed to the client
3. **Allows commands** to be sent to the browser
4. **Carries binary payloads** such as screenshots and PDFs as base64-encoded strings inside the JSON messages

The WebSocket protocol is particularly well-suited for browser automation because it provides:

- **Low latency communication** - Necessary for responsive automation
- **Bidirectional messaging** - Essential for event-driven architecture
- **Persistent connections** - Eliminating connection setup overhead for each operation

Here's a simplified view of how Pydoll's communication with the browser works:

```mermaid
sequenceDiagram
    participant App as Pydoll Application
    participant WS as WebSocket Connection
    participant Browser as Chrome Browser

    App ->> WS: Command: navigate to URL
    WS ->> Browser: Execute navigation

    Browser -->> WS: Send page load event
    WS -->> App: Receive page load event
```

!!! info "WebSocket vs HTTP"
    Earlier browser automation protocols often relied on HTTP endpoints for communication. CDP's switch to WebSockets represents a significant architectural improvement that enables more responsive automation and real-time event monitoring.
    
    HTTP-based protocols require continuous polling to detect changes, creating overhead and delays. WebSockets allow the browser to push notifications to your automation script exactly when events occur, with minimal latency.

## Key CDP Domains

CDP is organized into logical domains, each responsible for a specific aspect of browser functionality. Some of the most important domains include:


| Domain | Responsibility | Example Use Cases |
|--------|----------------|------------------|
| **Browser** | Control of the browser application itself | Window management, browser context creation |
| **Page** | Interaction with page lifecycle | Navigation, JavaScript execution, frame management |
| **DOM** | Access to page structure | Query selectors, attribute modification, event listeners |
| **Network** | Network traffic monitoring and control | Request interception, response examination, caching |
| **Runtime** | JavaScript execution environment | Evaluate expressions, call functions, handle exceptions |
| **Input** | Simulating user interactions | Mouse movements, keyboard input, touch events |
| **Target** | Managing browser contexts and targets | Creating tabs, accessing iframes, handling popups |
| **Fetch** | Low-level network interception | Modifying requests, simulating responses, authentication |

Pydoll maps these CDP domains to a more intuitive API structure while preserving the full capabilities of the underlying protocol.

## Event-Driven Architecture

One of CDP's most powerful features is its event system. The protocol allows clients to subscribe to various events that the browser emits during normal operation. These events cover virtually every aspect of browser behavior:

- **Lifecycle events**: Page loads, frame navigation, target creation
- **DOM events**: Element changes, attribute modifications
- **Network events**: Request/response cycles, WebSocket messages
- **Execution events**: JavaScript exceptions, console messages
- **Performance events**: Metrics for rendering, scripting, and more


When you enable event monitoring in Pydoll (e.g., with `page.enable_network_events()`), the library sets up the necessary subscriptions with the browser and provides hooks for your code to react to these events.

```python
from pydoll.events.network import NetworkEvents
from functools import partial

async def on_request(page, event):
    url = event['params']['request']['url']
    print(f"Request to: {url}")

# Subscribe to network request events
await page.enable_network_events()
await page.on(NetworkEvents.REQUEST_WILL_BE_SENT, partial(on_request, page))
```

This event-driven approach allows automation scripts to react immediately to browser state changes without relying on inefficient polling or arbitrary delays.

## Performance Advantages of Direct CDP Integration

Using CDP directly, as Pydoll does, offers several performance advantages over traditional webdriver-based automation:

### 1. Elimination of Protocol Translation Layer

Traditional webdriver-based tools like Selenium use a multi-layered approach:

```mermaid
graph LR
    AS[Automation Script] --> WC[WebDriver Client]
    WC --> WS[WebDriver Server]
    WS --> B[Browser]
```

Each layer adds overhead, especially the WebDriver server, which acts as a translation layer between the WebDriver protocol and the browser's native APIs.

Pydoll's approach streamlines this to:

```mermaid
graph LR
    AS[Automation Script] --> P[Pydoll]
    P --> B[Browser via CDP]
```

This direct communication eliminates the computational and network overhead of the intermediate server, resulting in faster operations.

### 2. Efficient Command Batching

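CDP lets a client send multiple commands back-to-back over the same WebSocket without waiting for each response (every command carries its own `id`, so responses can be matched up later). This effectively batches the work and reduces the round-trip latency of complex operations. It is particularly valuable for operations that require several steps, such as finding an element and then interacting with it.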

### 3. Asynchronous Operation

CDP's WebSocket-based, event-driven architecture aligns perfectly with Python's asyncio framework, enabling true asynchronous operation. This allows Pydoll to:

- Execute multiple operations concurrently
- Process events as they occur
- Avoid blocking the main thread during I/O operations

```mermaid
graph TD
    subgraph "Pydoll Async Architecture"
        EL[Event Loop]
        
        subgraph "Concurrent Tasks"
            T1[Task 1: Navigate]
            T2[Task 2: Wait for Element]
            T3[Task 3: Handle Network Events]
        end
        
        EL --> T1
        EL --> T2
        EL --> T3
        
        T1 --> WS[WebSocket Connection]
        T2 --> WS
        T3 --> WS
        
        WS --> B[Browser]
    end
```

!!! info "Async Performance Gains"
    The combination of asyncio and CDP creates a multiplicative effect on performance. In benchmark tests, Pydoll's asynchronous approach can process multiple pages in parallel with near-linear scaling, while traditional synchronous tools see diminishing returns as concurrency increases.
    
    For example, scraping 10 pages that each take 2 seconds to load might take over 20 seconds with a synchronous tool, but just over 2 seconds with Pydoll's async architecture (plus some minimal overhead).

### 4. Fine-Grained Control

CDP provides more granular control over browser behavior than the WebDriver protocol. This allows Pydoll to implement optimized strategies for common operations:

- More precise waiting conditions (vs. arbitrary timeouts)
- Direct access to browser caches and storage
- Targeted JavaScript execution in specific contexts
- Detailed network control for request optimization


## Conclusion

The Chrome DevTools Protocol forms the foundation of Pydoll's zero-webdriver approach to browser automation. By leveraging CDP's WebSocket communication, comprehensive domain coverage, event-driven architecture, and direct browser integration, Pydoll achieves superior performance and reliability compared to traditional automation tools.

In the following sections, we'll dive deeper into how Pydoll implements specific CDP domains and transforms the low-level protocol into an intuitive, developer-friendly API. 

================================================
FILE: docs/en/deep-dive/fundamentals/connection-layer.md
================================================
# Connection Handler

The Connection Handler is the foundational layer of Pydoll's architecture, serving as the bridge between your Python code and the browser's Chrome DevTools Protocol (CDP). This component manages the WebSocket connection to the browser, handles command execution, and processes events in a non-blocking, asynchronous manner.

```mermaid
graph TD
    A[Python Code] --> B[Connection Handler]
    B <--> C[WebSocket]
    C <--> D[Browser CDP Endpoint]

    subgraph "Connection Handler"
        E[Command Manager]
        F[Events Handler]
        G[WebSocket Client]
    end

    B --> E
    B --> F
    B --> G
```

## Asynchronous Programming Model

Pydoll is built on Python's `asyncio` framework, which enables non-blocking I/O operations. This design choice is critical for high-performance browser automation, as it allows multiple operations to occur concurrently without waiting for each to complete.

### Understanding Async/Await


To understand how async/await works in practice, let's examine an example with two concurrent operations:

```python
import asyncio
from pydoll.browser.chrome import Chrome

async def fetch_page_data(url):
    print(f"Starting fetch for {url}")
    browser = Chrome()
    await browser.start()
    page = await browser.get_page()
    
    # Navigation takes time - this is where we yield control
    await page.go_to(url)
    
    # Get page title
    title = await page.execute_script("return document.title")
    
    # Extract some data
    description = await page.execute_script(
        "return document.querySelector('meta[name=\"description\"]')?.content || ''"
    )
    
    await browser.stop()
    print(f"Completed fetch for {url}")
    return {"url": url, "title": title, "description": description}

async def main():
    # Start two page operations concurrently
    task1 = asyncio.create_task(fetch_page_data("https://example.com"))
    task2 = asyncio.create_task(fetch_page_data("https://github.com"))
    
    # Wait for both to complete and get results
    result1 = await task1
    result2 = await task2
    
    return [result1, result2]

# Run the async function
results = asyncio.run(main())
```

This example demonstrates how we can fetch data from two different websites concurrently, potentially cutting the overall execution time nearly in half compared to sequential execution.

#### Async Execution Flow Diagram

Here's what happens in the event loop when executing the code above:

```mermaid
sequenceDiagram
    participant A as Main Code
    participant B as Task 1<br/> (example.com)
    participant C as Task 2<br/> (github.com)
    participant D as Event Loop
    
    A->>B: Create task1
    B->>D: Register in loop
    A->>C: Create task2
    C->>D: Register in loop
    D->>B: Execute until browser.start()
    D->>C: Execute until browser.start()
    D-->>B: Resume after WebSocket connected
    D-->>C: Resume after WebSocket connected
    D->>B: Execute until page.go_to()
    D->>C: Execute until page.go_to()
    D-->>B: Resume after page loaded
    D-->>C: Resume after page loaded
    B-->>A: Return result
    C-->>A: Return result
```

This sequence diagram illustrates how Python's asyncio manages the two concurrent tasks in our example code:

1. The main function creates two tasks for fetching data from different websites
2. Both tasks are registered in the event loop
3. The event loop executes each task until it hits an `await` statement (like `browser.start()`)
4. When async operations complete (like a WebSocket connection being established), tasks resume
5. The loop continues to switch between tasks at each `await` point
6. When each task completes, it returns its result back to the main function

In the `fetch_page_data` example, this allows both browser instances to work concurrently - while one is waiting for a page to load, the other can be making progress. This is significantly more efficient than sequentially processing each website, as I/O wait times don't block the execution of other tasks.

!!! info "Cooperative Multitasking"
    Asyncio uses cooperative multitasking, where tasks voluntarily yield control at `await` points. This differs from preemptive multitasking (threads), where tasks can be interrupted at any time. Cooperative multitasking can provide better performance for I/O-bound operations but requires careful coding to avoid blocking the event loop.

## Connection Handler Implementation

The `ConnectionHandler` class is designed to manage both command execution and event processing, providing a robust interface to the CDP WebSocket connection.

### Class Initialization

```python
def __init__(
    self,
    connection_port: int,
    page_id: str = 'browser',
    ws_address_resolver: Callable[[int], str] = get_browser_ws_address,
    ws_connector: Callable = websockets.connect,
):
    # Initialize components...
```

The ConnectionHandler accepts several parameters:

| Parameter | Type | Description |
|-----------|------|-------------|
| `connection_port` | `int` | Port number where the browser's CDP endpoint is listening |
| `page_id` | `str` | Identifier for the specific page/target (use 'browser' for browser-level connections) |
| `ws_address_resolver` | `Callable` | Function to resolve the WebSocket URL from the port number |
| `ws_connector` | `Callable` | Function to establish the WebSocket connection |

### Internal Components

The ConnectionHandler orchestrates three primary components:

1. **WebSocket Connection**: Manages the actual WebSocket communication with the browser
2. **Command Manager**: Handles sending commands and receiving responses
3. **Events Handler**: Processes events from the browser and triggers appropriate callbacks

```mermaid
classDiagram
    class ConnectionHandler {
        -_connection_port: int
        -_page_id: str
        -_ws_connection
        -_command_manager: CommandManager
        -_events_handler: EventsHandler
        +execute_command(command, timeout) async
        +register_callback(event_name, callback) async
        +remove_callback(callback_id) async
        +ping() async
        +close() async
        -_receive_events() async
    }

    class CommandManager {
        -_pending_commands: dict
        +create_command_future(command)
        +resolve_command(id, response)
        +remove_pending_command(id)
    }

    class EventsHandler {
        -_callbacks: dict
        -_network_logs: list
        -_dialog: dict
        +register_callback(event_name, callback, temporary)
        +remove_callback(callback_id)
        +clear_callbacks()
        +process_event(event) async
    }

    ConnectionHandler *-- CommandManager
    ConnectionHandler *-- EventsHandler
```

## Command Execution Flow

When executing a command through the CDP, the ConnectionHandler follows a specific pattern:

1. Ensure an active WebSocket connection exists
2. Create a Future object to represent the pending response
3. Send the command over the WebSocket
4. Await the Future to be resolved with the response
5. Return the response to the caller

```python
async def execute_command(self, command: dict, timeout: int = 10) -> dict:
    # Validate command
    if not isinstance(command, dict):
        logger.error('Command must be a dictionary.')
        raise exceptions.InvalidCommand('Command must be a dictionary')

    # Ensure connection is active
    await self._ensure_active_connection()
    
    # Create future for this command
    future = self._command_manager.create_command_future(command)
    command_str = json.dumps(command)

    # Send command and await response
    try:
        await self._ws_connection.send(command_str)
        response: str = await asyncio.wait_for(future, timeout)
        return json.loads(response)
    except asyncio.TimeoutError as exc:
        self._command_manager.remove_pending_command(command['id'])
        raise exc
    except websockets.ConnectionClosed as exc:
        await self._handle_connection_loss()
        raise exc
```

!!! warning "Command Timeout"
    Commands that don't receive a response within the specified timeout period will raise a `TimeoutError`. This prevents automation scripts from hanging indefinitely due to missing responses. The default timeout is 10 seconds, but can be adjusted based on expected response times for complex operations.

## Event Processing System

The event system is a key architectural component that enables reactive programming patterns in Pydoll. It allows you to register callbacks for specific browser events and have them executed automatically when those events occur.

### Event Flow

The event processing flow follows these steps:

1. The `_receive_events` method runs as a background task, continuously receiving messages from the WebSocket
2. Each message is parsed and classified as either a command response or an event
3. Events are passed to the EventsHandler for processing
4. The EventsHandler identifies registered callbacks for the event and invokes them

```mermaid
flowchart TD
    A[WebSocket Message] --> B{Is Command Response?}
    B -->|Yes| C[Resolve Command Future]
    B -->|No| D[Process as Event]
    D --> E[Find Matching Callbacks]
    E --> F[Execute Callbacks]
    F --> G{Is Temporary?}
    G -->|Yes| H[Remove Callback]
    G -->|No| I[Keep Callback]
```

### Callback Registration

The ConnectionHandler provides methods to register, remove, and manage event callbacks:

```python
# Register a callback for a specific event
callback_id = await connection.register_callback(
    'Page.loadEventFired', 
    handle_page_load
)

# Remove a specific callback
await connection.remove_callback(callback_id)

# Remove all callbacks
await connection.clear_callbacks()
```

!!! tip "Temporary Callbacks"
    You can register a callback as temporary, which means it will be automatically removed after being triggered once. This is useful for one-time events like dialog handling:
    
    ```python
    await connection.register_callback(
        'Page.javascriptDialogOpening',
        handle_dialog,
        temporary=True
    )
    ```

### Asynchronous Callback Execution

Callbacks can be either synchronous functions or asynchronous coroutines. The EventsHandler (managed by the ConnectionHandler) handles both types properly:

```python
# Synchronous callback
def synchronous_callback(event):
    print(f"Event received: {event['method']}")

# Asynchronous callback
async def asynchronous_callback(event):
    await asyncio.sleep(0.1)  # Perform some async operation
    print(f"Event processed asynchronously: {event['method']}")

# Both can be registered the same way
await connection.register_callback('Network.requestWillBeSent', synchronous_callback)
await connection.register_callback('Network.responseReceived', asynchronous_callback)
```

**Sequential Execution Model:**

Asynchronous callbacks are **awaited sequentially** by the EventsManager (the Events Handler component described above). This ensures that for a single event, callbacks execute in the order they were registered, preventing race conditions when multiple callbacks modify shared state.

```python
# Inside EventsManager.process_event()
for callback_data in callbacks:
    if asyncio.iscoroutinefunction(callback_data['callback']):
        await callback_data['callback'](event_data)  # Sequential await
    else:
        callback_data['callback'](event_data)  # Sync execution
```

**Non-blocking execution** (for UI callbacks that should not block other operations) is achieved at a **higher level**, such as in the `Tab.on()` method, which wraps the user's callback in an `asyncio.create_task()` before registering it here. This architecture provides:

- **Lower layer** (ConnectionHandler/EventsManager): Guarantees sequential execution and predictable order
- **Higher layer** (Tab.on()): Provides non-blocking semantics when needed

!!! info "Event Architecture Details"
    See [Event Architecture Deep Dive](../architecture/event-architecture.md) for complete details on the multi-layer event system and the rationale behind sequential callback execution.

## Connection Management

The ConnectionHandler implements several strategies to ensure robust connections:

### Lazy Connection Establishment

Connections are established only when needed, typically when the first command is executed or when explicitly requested. This lazy initialization approach conserves resources and allows for more flexible connection management.

### Automatic Reconnection

If the WebSocket connection is lost or closed unexpectedly, the ConnectionHandler will attempt to re-establish it automatically when the next command is executed. This provides resilience against transient network issues.

```python
async def _ensure_active_connection(self):
    """
    Guarantees that an active connection exists before proceeding.
    """
    if self._ws_connection is None or self._ws_connection.closed:
        await self._establish_new_connection()
```

### Resource Cleanup

The ConnectionHandler implements both explicit cleanup methods and Python's asynchronous context manager protocol (`__aenter__` and `__aexit__`), ensuring resources are properly released when no longer needed:

```python
async def close(self):
    """
    Closes the WebSocket connection and clears all callbacks.
    """
    await self.clear_callbacks()
    if self._ws_connection is not None:
        try:
            await self._ws_connection.close()
        except websockets.ConnectionClosed as e:
            logger.info(f'WebSocket connection has closed: {e}')
        logger.info('WebSocket connection closed.')
```

!!! info "Context Manager Usage"
    Using the ConnectionHandler as a context manager is the recommended pattern for ensuring proper resource cleanup:
    
    ```python
    async with ConnectionHandler(9222, 'browser') as connection:
        # Work with the connection...
        await connection.execute_command(...)
    # Connection is automatically closed when exiting the context
    ```

## Message Processing Pipeline

The ConnectionHandler implements a sophisticated message processing pipeline that handles the continuous stream of messages from the WebSocket connection:

```mermaid
sequenceDiagram
    participant WS as WebSocket
    participant RCV as _receive_events
    participant MSG as _process_single_message
    participant PARSE as _parse_message
    participant CMD as _handle_command_message
    participant EVT as _handle_event_message
    
    loop While connected
        WS->>RCV: message
        RCV->>MSG: raw_message
        MSG->>PARSE: raw_message
        PARSE-->>MSG: parsed JSON or None
        
        alt Is command response
            MSG->>CMD: message
            CMD->>CMD: resolve command future
        else Is event notification
            MSG->>EVT: message
            EVT->>EVT: process event & trigger callbacks
        end
    end
```

This pipeline ensures efficient processing of both command responses and asynchronous events, allowing Pydoll to maintain responsive operation even under high message volume.

## Advanced Usage

The ConnectionHandler is usually used indirectly through the Browser and Page classes, but it can also be used directly for advanced scenarios:

### Direct Event Monitoring

For specialized use cases, you might want to bypass the higher-level APIs and directly monitor specific CDP events:

```python
import asyncio

from pydoll.connection.connection import ConnectionHandler

async def monitor_network():
    connection = ConnectionHandler(9222)
    
    async def log_request(event):
        url = event['params']['request']['url']
        print(f"Request: {url}")
    
    await connection.register_callback(
        'Network.requestWillBeSent', 
        log_request
    )
    
    # Enable network events via CDP command
    await connection.execute_command({
        "id": 1,
        "method": "Network.enable"
    })
    
    # Keep running until interrupted
    try:
        while True:
            await asyncio.sleep(1)
    finally:
        await connection.close()
```

### Custom Command Execution

You can execute arbitrary CDP commands directly:

```python
import random


async def custom_cdp_command(connection, method, params=None):
    command = {
        "id": random.randint(1, 10000),
        "method": method,
        "params": params or {}
    }
    return await connection.execute_command(command)

# Example: Get document HTML without using Page class
async def get_html(connection):
    result = await custom_cdp_command(
        connection,
        "Runtime.evaluate",
        {"expression": "document.documentElement.outerHTML"}
    )
    return result['result']['result']['value']
```

!!! warning "Advanced Interface"
    Direct use of the ConnectionHandler requires a deep understanding of the Chrome DevTools Protocol. For most use cases, the higher-level Browser and Page APIs provide a more intuitive and safer interface.


## Advanced Concurrency Patterns

The ConnectionHandler's asynchronous design enables sophisticated concurrency patterns:

### Parallel Command Execution

Execute multiple commands concurrently and wait for all results:

```python
async def get_page_metrics(connection):
    commands = [
        {"id": 1, "method": "Performance.getMetrics"},
        {"id": 2, "method": "Network.getResponseBody", "params": {"requestId": "..."}},
        {"id": 3, "method": "DOM.getDocument"}
    ]
    
    results = await asyncio.gather(
        *(connection.execute_command(cmd) for cmd in commands)
    )
    
    return results
```

## Conclusion

The ConnectionHandler serves as the foundation of Pydoll's architecture, providing a robust, efficient interface to the Chrome DevTools Protocol. By leveraging Python's asyncio framework and WebSocket communication, it enables high-performance browser automation with elegant, event-driven programming patterns.

Understanding the ConnectionHandler's design and operation provides valuable insights into Pydoll's internal workings and offers opportunities for advanced customization and optimization in specialized scenarios.

For most use cases, you'll interact with the ConnectionHandler indirectly through the higher-level Browser and Page APIs, which provide a more intuitive interface while leveraging the ConnectionHandler's powerful capabilities. 

================================================
FILE: docs/en/deep-dive/fundamentals/iframes-and-contexts.md
================================================
# Iframes, OOPIFs and Execution Contexts (Deep Dive)

Understanding how browser automation handles iframes is critical for building robust automation tools. This comprehensive guide explores the technical foundations of iframe handling in Pydoll, covering the Document Object Model (DOM), Chrome DevTools Protocol (CDP) mechanics, execution contexts, isolated worlds, and the sophisticated resolution pipeline that makes iframe interaction seamless.

!!! info "Practical usage first"
    If you just need to use iframes in your automation scripts, start with the feature guide: **Features → Automation → IFrames**.  
    This deep dive explains the architectural decisions, protocol nuances, and internal implementation details.

---

## Table of Contents

1. [Foundation: The Document Object Model (DOM)](#foundation-the-document-object-model-dom)
2. [What are Iframes and Why They Matter](#what-are-iframes-and-why-they-matter)
3. [The Challenge: Out-of-Process Iframes (OOPIFs)](#the-challenge-out-of-process-iframes-oopifs)
4. [Chrome DevTools Protocol and Frame Management](#chrome-devtools-protocol-and-frame-management)
5. [Execution Contexts and Isolated Worlds](#execution-contexts-and-isolated-worlds)
6. [CDP Identifiers Reference](#cdp-identifiers-reference)
7. [Pydoll's Resolution Pipeline](#pydolls-resolution-pipeline)
8. [Session Routing and Flattened Mode](#session-routing-and-flattened-mode)
9. [Implementation Deep Dive](#implementation-deep-dive)
10. [Performance Considerations](#performance-considerations)
11. [Failure Modes and Debugging](#failure-modes-and-debugging)

---

## Foundation: The Document Object Model (DOM)

Before diving into iframes, we must understand the DOM—the tree structure that represents an HTML document in memory.

### What is the DOM?

The **Document Object Model** is a programming interface for HTML and XML documents. It represents the page structure as a tree of nodes, where each node corresponds to a part of the document:

- **Element nodes**: HTML tags like `<div>`, `<iframe>`, `<button>`
- **Text nodes**: The actual text content
- **Attribute nodes**: Element attributes like `id`, `class`, `src`
- **Document node**: The root of the tree

```mermaid
graph TD
    Document[Document] --> HTML[html element]
    HTML --> Head[head element]
    HTML --> Body[body element]
    Body --> Div1[div element]
    Body --> Div2[div element]
    Div1 --> Text1[text node: 'Hello']
    Div2 --> Iframe[iframe element]
    Iframe --> IframeDoc[iframe's document]
    IframeDoc --> IframeBody[iframe body]
    IframeBody --> IframeContent[iframe content...]
```

### DOM Tree Properties

1. **Hierarchical structure**: Every node has a parent (except Document) and can have children
2. **Node identification**: Nodes can be identified by:
   - `nodeId`: Internal identifier within a document context (DOM domain)
   - `backendNodeId`: Stable identifier that can reference nodes across different documents
3. **Live representation**: Changes to the DOM are reflected immediately in the tree

### Why This Matters for Iframes

Each `<iframe>` element creates a **new, independent DOM tree**. The iframe element itself exists in the parent's DOM, but the content loaded into the iframe has its own complete Document node and tree structure. This separation is the foundation of all iframe complexity.

---

## What are Iframes and Why They Matter

### Definition

An **iframe** (inline frame) is an HTML element (`<iframe>`) that embeds another HTML document within the current page. The embedded document maintains its own context, including:

- Independent HTML structure and DOM tree
- Separate JavaScript execution environment
- Its own CSS styling (unless explicitly shared)
- Distinct navigation history

```html
<body>
  <h1>Parent Page</h1>
  <iframe src="https://example.com/embedded.html" id="content-frame"></iframe>
  <p>More parent content</p>
</body>
```

### Common Use Cases

| Use Case | Description | Example |
|----------|-------------|---------|
| **Third-party widgets** | Embed external content safely | Payment forms, social media feeds, chat widgets |
| **Content isolation** | Sandbox untrusted content | User-generated HTML, advertisements |
| **Modular architecture** | Reusable components | Dashboard widgets, plugin systems |
| **Cross-origin content** | Load resources from different domains | Maps, video players, analytics dashboards |

### Security Model: Same-Origin Policy

The browser enforces a **Same-Origin Policy** for iframes:

- **Same-origin iframes**: Parent can access iframe's DOM via JavaScript (`iframe.contentDocument`)
- **Cross-origin iframes**: Parent cannot access iframe's DOM directly (security restriction)

This security boundary is why automation tools need special mechanisms (like CDP) to interact with iframe content.

!!! warning "Important for automation"
    Traditional JavaScript-based automation (like Selenium's early approaches) cannot directly access cross-origin iframe content due to browser security. CDP operates at a lower level, bypassing this limitation for debugging purposes.

---

## The Challenge: Out-of-Process Iframes (OOPIFs)

### What are OOPIFs?

Modern Chromium uses **site isolation** for security and stability. This means different origins may be rendered in separate OS processes. An iframe from a different origin becomes an **Out-of-Process Iframe (OOPIF)**.

```mermaid
graph LR
    subgraph "Process 1: example.com"
        MainPage[Main Page DOM]
    end
    
    subgraph "Process 2: widget.com"
        IframeDOM[Iframe DOM]
    end
    
    MainPage -.Process boundary.-> IframeDOM
```

### Why OOPIFs Complicate Automation

| Aspect | In-Process Iframe | Out-of-Process Iframe (OOPIF) |
|--------|-------------------|-------------------------------|
| **DOM access** | Shared document tree in memory | Separate target with own document |
| **Command routing** | Single connection | Requires target attachment and session routing |
| **Frame tree** | All frames in one tree | Root frame + separate targets for OOPIFs |
| **JavaScript context** | Separate execution context per frame, but in the same renderer process | Separate execution context living in a different renderer process |
| **CDP communication** | Direct commands | Commands must include `sessionId` |

### The Traditional Approach (Manual Context Switching)

Without sophisticated handling, automating OOPIFs requires:

```python
# Traditional (manual) approach with other tools (WebDriver-style pseudocode)
iframe_element = driver.find_element_by_id("iframe-id")

# Must manually switch context
driver.switch_to.frame(iframe_element)

# Now commands target the iframe
button = driver.find_element_by_id("button-in-iframe")
button.click()

# Must manually switch back
driver.switch_to.default_content()
```

**Problems with this approach:**

1. **Developer burden**: Every iframe requires explicit context management
2. **Nested iframes**: Each level needs another switch
3. **OOPIF detection**: Hard to know when manual attachment is needed
4. **Error-prone**: Forget to switch back → subsequent commands fail
5. **Not composable**: Helper functions must know their iframe context

### Pydoll's Solution: Transparent Context Resolution

Pydoll eliminates manual context switching by resolving iframe contexts automatically:

```python
# Pydoll approach (no manual switching)
iframe = await tab.find(id="iframe-id")
button = await iframe.find(id="button-in-iframe")
await button.click()

# Nested iframes? Same pattern
outer = await tab.find(id="outer-iframe")
inner = await outer.find(tag_name="iframe")
button = await inner.find(text="Submit")
await button.click()
```

The complexity is handled internally. Let's explore how.

---

## Chrome DevTools Protocol and Frame Management

As discussed in [Deep Dive → Fundamentals → Chrome DevTools Protocol](./cdp.md), CDP provides comprehensive browser control via WebSocket communication. Frame management is spread across multiple CDP domains.

### Relevant CDP Domains

#### 1. **Page Domain**

Manages page lifecycle, frames, and navigation.

**Key methods:**

- `Page.getFrameTree()`: Returns the hierarchical structure of all frames in a page
  ```json
  {
    "frameTree": {
      "frame": {
        "id": "main-frame-id",
        "url": "https://example.com",
        "securityOrigin": "https://example.com",
        "mimeType": "text/html"
      },
      "childFrames": [
        {
          "frame": {
            "id": "child-frame-id",
            "parentId": "main-frame-id",
            "url": "https://widget.com/embed"
          }
        }
      ]
    }
  }
  ```

- `Page.createIsolatedWorld(frameId, worldName)`: Creates a new JavaScript execution context in a specific frame
  ```json
  {
    "executionContextId": 42
  }
  ```

**Pydoll usage:** 

```python
# From pydoll/elements/web_element.py
@staticmethod
async def _get_frame_tree_for(
    handler: ConnectionHandler, session_id: Optional[str]
) -> FrameTree:
    """Get the Page frame tree for the given connection/target."""
    command = PageCommands.get_frame_tree()
    if session_id:
        command['sessionId'] = session_id
    response: GetFrameTreeResponse = await handler.execute_command(command)
    return response['result']['frameTree']
```

#### 2. **DOM Domain**

Provides access to the DOM structure.

**Key methods:**

- `DOM.describeNode(objectId)`: Returns detailed information about a DOM node
  ```json
  {
    "node": {
      "nodeId": 123,
      "backendNodeId": 456,
      "nodeName": "IFRAME",
      "frameId": "parent-frame-id",
      "contentDocument": {
        "frameId": "iframe-frame-id",
        "documentURL": "https://embedded.com/page.html"
      }
    }
  }
  ```

- `DOM.getFrameOwner(frameId)`: Returns the `backendNodeId` of the `<iframe>` element that owns a frame
  ```json
  {
    "backendNodeId": 456
  }
  ```

**Pydoll usage:**

```python
# From pydoll/elements/web_element.py
@staticmethod
async def _owner_backend_for(
    handler: ConnectionHandler, session_id: Optional[str], frame_id: str
) -> Optional[int]:
    """Get the backendNodeId of the DOM element that owns the given frame."""
    command = DomCommands.get_frame_owner(frame_id=frame_id)
    if session_id:
        command['sessionId'] = session_id
    response: GetFrameOwnerResponse = await handler.execute_command(command)
    return response.get('result', {}).get('backendNodeId')
```

#### 3. **Target Domain**

Manages browser targets (pages, iframes, workers, etc.).

**Key methods:**

- `Target.getTargets()`: Lists all available targets
  ```json
  {
    "targetInfos": [
      {
        "targetId": "page-target-id",
        "type": "page",
        "title": "Main Page",
        "url": "https://example.com"
      },
      {
        "targetId": "iframe-target-id",
        "type": "iframe",
        "title": "",
        "url": "https://widget.com/embed",
        "parentFrameId": "main-frame-id"
      }
    ]
  }
  ```

- `Target.attachToTarget(targetId, flatten)`: Attaches to a target for debugging
  - When `flatten=true`: Returns a `sessionId` for routing commands in flattened mode
  - All communication happens over the same WebSocket, differentiated by `sessionId`

**Pydoll usage:**

```python
# From pydoll/interactions/iframe.py (simplified)
async def _resolve_oopif_by_parent(self, content_frame_id: str, ...):
    """Resolve an OOPIF using the content frame id."""
    browser_handler = ConnectionHandler(...)
    targets_response: GetTargetsResponse = await browser_handler.execute_command(
        TargetCommands.get_targets()
    )
    target_infos = targets_response.get('result', {}).get('targetInfos', [])

    # Find targets whose parentFrameId matches
    direct_children = [
        target_info for target_info in target_infos
        if target_info.get('parentFrameId') == content_frame_id
    ]
    
    if direct_children:
        attach_response: AttachToTargetResponse = await browser_handler.execute_command(
            TargetCommands.attach_to_target(
                target_id=direct_children[0]['targetId'], 
                flatten=True
            )
        )
        attached_session_id = attach_response.get('result', {}).get('sessionId')
        # ... use session_id for subsequent commands
```

#### 4. **Runtime Domain**

Executes JavaScript and manages execution contexts.

**Key methods:**

- `Runtime.evaluate(expression, contextId)`: Evaluates JavaScript in a specific execution context
- `Runtime.callFunctionOn(functionDeclaration, objectId)`: Calls a function with a specific object as `this`

**Pydoll usage for iframe document access:**

```python
# From pydoll/elements/web_element.py
async def _set_iframe_document_object_id(self, execution_context_id: int):
    """Evaluate document.documentElement in iframe context and cache its object id."""
    evaluate_command = RuntimeCommands.evaluate(
        expression='document.documentElement',
        context_id=execution_context_id,
    )
    if self._iframe_context and self._iframe_context.session_id:
        evaluate_command['sessionId'] = self._iframe_context.session_id
    
    evaluate_response: EvaluateResponse = await (
        (self._iframe_context.session_handler if self._iframe_context else None)
        or self._connection_handler
    ).execute_command(evaluate_command)
    
    document_object_id = evaluate_response.get('result', {}).get('result', {}).get('objectId')
    if self._iframe_context:
        self._iframe_context.document_object_id = document_object_id
```

---

## Execution Contexts and Isolated Worlds

### What is an Execution Context?

An **execution context** is an environment where JavaScript code is executed. Every frame in a browser has at least one execution context. The context includes:

- **Global object** (`window` in browsers)
- **Scope chain**: How variables are resolved
- **This binding**: What `this` refers to
- **Variable environment**: All declared variables and functions

### Multiple Contexts per Frame

A single frame can have multiple execution contexts:

1. **Main world (default context)**: Where the page's own JavaScript runs
2. **Isolated worlds**: Separate contexts that share the same DOM but have different JavaScript global scopes

```mermaid
graph TB
    Frame[Frame: example.com/page]
    Frame --> MainWorld[Main World<br/>Page's JavaScript]
    Frame --> IsolatedWorld1[Isolated World 1<br/>Extension content script]
    Frame --> IsolatedWorld2[Isolated World 2<br/>Pydoll automation]
    
    DOM[Shared DOM Tree]
    MainWorld -.can access.-> DOM
    IsolatedWorld1 -.can access.-> DOM
    IsolatedWorld2 -.can access.-> DOM
    
    MainWorld -.cannot access.-> IsolatedWorld1
    MainWorld -.cannot access.-> IsolatedWorld2
```

### What is an Isolated World?

An **isolated world** is a separate JavaScript execution context that:

- **Shares the same DOM**: Can read/modify DOM elements
- **Has a separate global object**: Variables/functions don't leak between worlds
- **Prevents interference**: Page scripts cannot read or overwrite the variables and functions of isolated world scripts (DOM changes made from an isolated world are still visible to the page)

**Origin**: Isolated worlds were created for browser extensions. Content scripts run in isolated worlds so they can interact with the page DOM without:

- Page scripts overwriting their variables
- Being detected by anti-tamper code
- Conflicting with page JavaScript

### Why Pydoll Uses Isolated Worlds for Iframes

When Pydoll interacts with iframe content, it creates an isolated world in that iframe's context. This provides:

1. **Clean JavaScript environment**: No conflicts with iframe's own scripts
2. **Consistent behavior**: Automation scripts work regardless of what JavaScript the iframe runs
3. **Anti-detection**: The iframe's JavaScript cannot easily detect Pydoll's presence
4. **Safe evaluation**: Automation code cannot accidentally trigger page logic

**Implementation:**

```python
# From pydoll/elements/web_element.py
@staticmethod
async def _create_isolated_world_for_frame(
    frame_id: str,
    handler: ConnectionHandler,
    session_id: Optional[str],
) -> int:
    """Create an isolated world (Page.createIsolatedWorld) for the given frame."""
    create_command = PageCommands.create_isolated_world(
        frame_id=frame_id,
        world_name=f'pydoll::iframe::{frame_id}',
        grant_universal_access=True,
    )
    if session_id:
        create_command['sessionId'] = session_id
    
    create_response: CreateIsolatedWorldResponse = await handler.execute_command(
        create_command
    )
    execution_context_id = create_response.get('result', {}).get('executionContextId')
    if not execution_context_id:
        raise InvalidIFrame('Unable to create isolated world for iframe')
    return execution_context_id
```

The `grant_universal_access=True` parameter allows the isolated world to:

- Access cross-origin frames (normally blocked by same-origin policy)
- Perform privileged operations needed for automation

!!! tip "Isolated worlds in practice"
    Every time you use `await iframe.find(...)`, Pydoll evaluates the selector query in an isolated world created specifically for that iframe. This ensures your automation logic never conflicts with the iframe's own JavaScript, and the iframe's scripts cannot easily detect or tamper with your automation code.

---

## CDP Identifiers Reference

Understanding CDP identifiers is crucial for iframe handling. Here's a comprehensive reference:

| Identifier | Domain | Scope | Purpose | Example Use in Pydoll |
|------------|--------|-------|---------|----------------------|
| **`nodeId`** | DOM | Document-local | Identifies a DOM node within a specific document context | Internal CDP operations; not stable across navigations |
| **`backendNodeId`** | DOM | Cross-document stable | Stable identifier for a DOM node; can map frames to owner elements | Used to match iframe elements to frame IDs via `DOM.getFrameOwner` |
| **`frameId`** | Page | Frame | Identifies a frame in the page's frame tree | Used to specify which frame for `Page.createIsolatedWorld` and frame tree traversal |
| **`targetId`** | Target | Global | Identifies a debugging target (page, iframe, worker, etc.) | Used for `Target.attachToTarget` to connect to OOPIFs |
| **`sessionId`** | Target | Target-specific | Routes commands to a specific target in flattened mode | Injected into commands to route them to the correct OOPIF |
| **`executionContextId`** | Runtime | Frame + world | Identifies a JavaScript execution context (including isolated worlds) | Returned by `Page.createIsolatedWorld`; used in `Runtime.evaluate` |
| **`objectId`** | Runtime | Execution context | Remote object reference (e.g., DOM element, function, object) | Reference to iframe's `document.documentElement` for relative queries |

### Identifier Relationships

Here's how identifiers relate to each other during iframe resolution:

```
┌─────────────────────────────────────────────────────────────────────────┐
│                         Resolution Flow                                 │
└─────────────────────────────────────────────────────────────────────────┘

1. Start: <iframe> Element
   └─ backendNodeId: 789
   
2. Find Frame ──────────────[DOM.getFrameOwner]──────────────┐
   └─ frameId: abc-123                                       │
                                                             │
3. OOPIF? Check Origin ─────[Different origin detected]──────┤
   └─ targetId: xyz-456                                      │
                                                             │
4. Attach to Target ────────[Target.attachToTarget]──────────┤
   └─ sessionId: session-789                                 │
                                                             │
5. Create Isolated World ───[Page.createIsolatedWorld]───────┤
   └─ executionContextId: 42                                 │
                                                             │
6. Get Document ────────────[Runtime.evaluate]───────────────┘
   └─ objectId: obj-999
```

**Key transformation points:**

| From | Method | To | Purpose |
|------|--------|-----|---------|
| `backendNodeId` | `DOM.getFrameOwner` (called for each candidate `frameId`) | `frameId` | Find the frame owned by the iframe element by matching the returned owner `backendNodeId` |
| `targetId` | `Target.attachToTarget(flatten=true)` | `sessionId` | Connect to OOPIF for command routing |
| `frameId` | `Page.createIsolatedWorld` | `executionContextId` | Create safe JavaScript environment |
| `executionContextId` | `Runtime.evaluate('document.documentElement')` | `objectId` | Get reference to iframe's document |

### Code Representation in Pydoll

```python
# From pydoll/elements/web_element.py
@dataclass
class _IFrameContext:
    """Encapsulates all identifiers and routing information for an iframe."""
    frame_id: str                                   # frameId: identifies the frame
    document_url: Optional[str] = None              # frame's loaded URL
    execution_context_id: Optional[int] = None      # executionContextId: isolated world
    document_object_id: Optional[str] = None        # objectId: document.documentElement
    session_handler: Optional[ConnectionHandler] = None  # for OOPIF targets
    session_id: Optional[str] = None                # sessionId: routes commands to OOPIF
```

This dataclass is cached on each `WebElement` representing an iframe, enabling automatic routing of all subsequent operations.

---

## Pydoll's Resolution Pipeline

When you access an iframe in Pydoll (e.g., `await iframe.find(...)`), an elaborate resolution pipeline executes behind the scenes. This section breaks down every step.

### High-Level Flow

```mermaid
sequenceDiagram
    participant User
    participant WebElement
    participant Pipeline as Resolution Pipeline
    participant CDP
    
    User->>WebElement: iframe.find(id='button')
    WebElement->>WebElement: Check if iframe context cached
    alt Context not cached
        WebElement->>Pipeline: _ensure_iframe_context()
        Pipeline->>CDP: DOM.describeNode(iframe)
        CDP-->>Pipeline: Node info (frameId?, backendNodeId, etc.)
        
        alt frameId not in node info
            Pipeline->>Pipeline: _resolve_frame_by_owner()
            Pipeline->>CDP: Page.getFrameTree()
            CDP-->>Pipeline: Frame tree
            Pipeline->>CDP: DOM.getFrameOwner(each frame)
            CDP-->>Pipeline: backendNodeId
            Pipeline->>Pipeline: Match backendNodeId to find frameId
        end
        
        alt frameId still missing (OOPIF)
            Pipeline->>Pipeline: _resolve_oopif_by_parent()
            Pipeline->>CDP: Target.getTargets()
            CDP-->>Pipeline: List of targets
            Pipeline->>CDP: Target.attachToTarget(targetId, flatten=true)
            CDP-->>Pipeline: sessionId
            Pipeline->>CDP: Page.getFrameTree(sessionId)
            CDP-->>Pipeline: OOPIF frame tree
        end
        
        Pipeline->>CDP: Page.createIsolatedWorld(frameId)
        CDP-->>Pipeline: executionContextId
        
        Pipeline->>CDP: Runtime.evaluate('document.documentElement', contextId)
        CDP-->>Pipeline: objectId (document reference)
        
        Pipeline->>WebElement: Cache _IFrameContext
    end
    
    WebElement->>WebElement: Use cached context for find()
    WebElement-->>User: Button element (with context)
```

### Step-by-Step Deep Dive

#### **Step 1: Describe the Iframe Element**

**Goal**: Extract metadata from the `<iframe>` DOM element.

**Method**: `DOM.describeNode(objectId=iframe_object_id)`

**What we get**:

- `backendNodeId`: Stable identifier for the iframe element
- `frameId` (from `contentDocument`): If the iframe's content is already loaded and in-process
- `documentURL`: The URL loaded in the iframe
- `parentFrameId` (from the `frameId` field on the node; stored as `content_frame_id` in the helper below): The frame containing this iframe element

**Code**:

```python
# From pydoll/interactions/iframe.py
async def resolve(self) -> IFrameContext:
    """Resolve and return iframe context."""
    base_handler, base_session_id = self._get_base_session()
    node_info = await self._describe_element_node(base_handler, base_session_id)
    frame_id, document_url, content_frame_id, backend_node_id = self._extract_frame_metadata(
        node_info
    )
    # ... continue resolution
```

**Helper**:

```python
@staticmethod
def _extract_frame_metadata(
    node_info: Node,
) -> tuple[Optional[str], Optional[str], Optional[str], Optional[int]]:
    """Extract iframe-related metadata from a DOM.describeNode Node."""
    content_document = node_info.get('contentDocument') or {}
    content_frame_id = node_info.get('frameId')
    backend_node_id = node_info.get('backendNodeId')
    frame_id = content_document.get('frameId')
    document_url = (
        content_document.get('documentURL')
        or content_document.get('baseURL')
        or node_info.get('documentURL')
        or node_info.get('baseURL')
    )
    return frame_id, document_url, content_frame_id, backend_node_id
```

**Outcome**:

- **If `frame_id` is present**: Great! The iframe is in-process; proceed to Step 4.
- **If `frame_id` is missing**: The iframe might be an OOPIF or not fully loaded; proceed to Step 2.

---

#### **Step 2: Resolve Frame by Owner (backendNodeId matching)**

**Goal**: Find the `frameId` by matching the iframe element's `backendNodeId` to frame owners in the frame tree.

**Strategy**:

1. Fetch the page's frame tree (`Page.getFrameTree`)
2. For each frame in the tree, call `DOM.getFrameOwner(frameId)` to get the `backendNodeId` of the owning iframe element
3. Compare with our iframe's `backendNodeId`
4. When they match, we've found the correct `frameId`

**Code**:

```python
# From pydoll/elements/web_element.py
async def _resolve_frame_by_owner(
    self,
    base_handler: ConnectionHandler,
    base_session_id: Optional[str],
    backend_node_id: int,
    current_document_url: Optional[str],
) -> tuple[Optional[str], Optional[str]]:
    """Resolve a frame id and URL by matching the owner backend_node_id."""
    owner_frame_id, owner_url = await self._find_frame_by_owner(
        base_handler, base_session_id, backend_node_id
    )
    if not owner_frame_id:
        return None, current_document_url
    return owner_frame_id, owner_url or current_document_url

async def _find_frame_by_owner(
    self, handler: ConnectionHandler, session_id: Optional[str], backend_node_id: int
) -> tuple[Optional[str], Optional[str]]:
    """Find a frame by matching the owner backend_node_id of the <iframe> element."""
    frame_tree = await self._get_frame_tree_for(handler, session_id)
    for frame_node in WebElement._walk_frames(frame_tree):
        candidate_frame_id = frame_node.get('id', '')
        if not candidate_frame_id:
            continue
        owner_backend_id = await self._owner_backend_for(
            handler, session_id, candidate_frame_id
        )
        if owner_backend_id == backend_node_id:
            return candidate_frame_id, frame_node.get('url')
    return None, None
```

**Why this is necessary**:

- `DOM.describeNode` sometimes doesn't include the `contentDocument.frameId` for cross-origin or lazy-loaded iframes
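- The frame tree lists the frames attached to the current target, so the frame can usually be found indirectly by its owner element (frames hosted in a separate OOPIF target are handled in Step 3)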

**Outcome**:

- **If `frameId` found**: Proceed to Step 4.
- **If still not found**: The iframe is likely an OOPIF in a separate target; proceed to Step 3.

---

#### **Step 3: Resolve OOPIF by Parent Frame**

**Goal**: For Out-of-Process Iframes, find the correct target, attach to it, and obtain the `frameId` from the target's frame tree (and the routing `sessionId` when needed).

**When this runs**:

- Same-origin / in-process iframes that already have a `frameId` and **no** `backendNodeId` skip this step (they are handled directly).
- Cross-origin / OOPIF iframes (with `backendNodeId`) or iframes whose `frameId` could not be resolved via Step 2 use this step.

**Strategy**:

**3a. Direct child target lookup (fast path)**:

1. Call `Target.getTargets()` to list all debugging targets.
2. Filter targets where `type` is `"iframe"` or `"page"` and `parentFrameId` matches our parent frame.
3. If there is **exactly one** matching child **and we don't have a `backendNodeId`**, attach directly to that target with `Target.attachToTarget(targetId, flatten=true)`.
4. Fetch `Page.getFrameTree(sessionId)` for that target; the root frame of this tree is our iframe's frame.

When there are **multiple** direct children or we have a `backendNodeId` (typical OOPIF case), Pydoll iterates over each child target:

1. Attach via `Target.attachToTarget(flatten=true)`.
2. Fetch `Page.getFrameTree(sessionId)` and read the root `frame.id`.
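3. Call `DOM.getFrameOwner(frameId=root_id)` on the connection (and session) that resolved the iframe element: the **main** connection, unless the element lives inside a nested OOPIF, in which case the call is routed through that OOPIF's session.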
4. Compare the returned `backendNodeId` with our iframe element's `backendNodeId`.
5. The child whose root owner matches is selected as the correct OOPIF target.

**3b. Fallback: Scan all targets (root owner + child search)**:

If no suitable direct child is found (or when `parentFrameId` information is incomplete), Pydoll falls back to scanning **all** iframe/page targets:

1. Iterate all iframe/page targets.
2. Attach to each and fetch its frame tree.
3. First, check for a **direct match**: the target's root frame id equals our `content_frame_id`.
4. Next, try to match the **root frame owner** via `DOM.getFrameOwner(root_frame_id)` against our iframe's `backendNodeId`.
5. If that does not match, look for a **child frame** whose `parentId` equals our `content_frame_id` (this covers cases where the OOPIF is nested under an intermediate frame).

**Code**:

```python
# From pydoll/interactions/iframe.py
async def _resolve_oopif_by_parent(
    self,
    content_frame_id: str,
    backend_node_id: Optional[int],
    base_handler: Optional[ConnectionHandler] = None,
    base_session_id: Optional[str] = None,
) -> tuple[Optional[ConnectionHandler], Optional[str], Optional[str], Optional[str]]:
    """Resolve an OOPIF using the content frame id."""
    browser_handler = ConnectionHandler(
        connection_port=self._element._connection_handler._connection_port
    )
    targets_response: GetTargetsResponse = await browser_handler.execute_command(
        TargetCommands.get_targets()
    )
    target_infos = targets_response.get('result', {}).get('targetInfos', [])

    # The handler that can resolve DOM.getFrameOwner for the element's context.
    # When the <iframe> lives inside a nested OOPIF, the Tab-level handler has
    # no visibility; we must route through the session that originally found
    # the element.
    owner_handler = base_handler or self._element._connection_handler
    owner_session_id = base_session_id

    # Strategy 3a: Direct children (fast path)
    direct_children = [
        target_info
        for target_info in target_infos
        if target_info.get('type') in {'iframe', 'page'}
        and target_info.get('parentFrameId') == content_frame_id
    ]

    is_single_child = len(direct_children) == 1
    for child_target in direct_children:
        attach_response: AttachToTargetResponse = await browser_handler.execute_command(
            TargetCommands.attach_to_target(
                target_id=child_target['targetId'], flatten=True
            )
        )
        attached_session_id = attach_response.get('result', {}).get('sessionId')
        if not attached_session_id:
            continue

        frame_tree = await self._get_frame_tree_for(browser_handler, attached_session_id)
        root_frame = (frame_tree or {}).get('frame', {})
        root_frame_id = root_frame.get('id', '')

        # Same-origin / simple case: single child and no backend_node_id
        if is_single_child and root_frame_id and backend_node_id is None:
            return (
                browser_handler,
                attached_session_id,
                root_frame_id,
                root_frame.get('url'),
            )

        # OOPIF case: confirm ownership via DOM.getFrameOwner
        if root_frame_id and backend_node_id is not None:
            owner_backend_id = await self._owner_backend_for(
                owner_handler, owner_session_id, root_frame_id
            )
            if owner_backend_id == backend_node_id:
                return (
                    browser_handler,
                    attached_session_id,
                    root_frame_id,
                    root_frame.get('url'),
                )

    # Strategy 3b: Scan all targets (root owner + child search)
    for target_info in target_infos:
        if target_info.get('type') not in {'iframe', 'page'}:
            continue
        attach_response = await browser_handler.execute_command(
            TargetCommands.attach_to_target(
                target_id=target_info.get('targetId', ''), flatten=True
            )
        )
        attached_session_id = attach_response.get('result', {}).get('sessionId')
        if not attached_session_id:
            continue

        frame_tree = await self._get_frame_tree_for(browser_handler, attached_session_id)
        root_frame = (frame_tree or {}).get('frame', {})
        root_frame_id = root_frame.get('id', '')

        # Direct match: content_frame_id equals this target's root frame ID
        if root_frame_id and root_frame_id == content_frame_id:
            return (
                browser_handler,
                attached_session_id,
                root_frame_id,
                root_frame.get('url'),
            )

        # Try matching root owner by backend_node_id
        if root_frame_id and backend_node_id is not None:
            owner_backend_id = await self._owner_backend_for(
                owner_handler, owner_session_id, root_frame_id
            )
            if owner_backend_id == backend_node_id:
                return (
                    browser_handler,
                    attached_session_id,
                    root_frame_id,
                    root_frame.get('url'),
                )

        # Fallback: match a child frame whose parentId equals content_frame_id
        child_frame_id = IFrameContextResolver._find_child_by_parent(
            frame_tree, content_frame_id
        )
        if child_frame_id:
            return browser_handler, attached_session_id, child_frame_id, None

    return None, None, None, None
```

**Outcome**:

- **If OOPIF resolved**: We now have `sessionId`, `session_handler`, and `frameId`; proceed to Step 4.
- **If resolution fails**: Raise `InvalidIFrame` exception (handled in `_ensure_iframe_context`).

---

#### **Step 4: Create Isolated World**

**Goal**: Create a separate JavaScript execution context in the resolved frame.

**Method**: `Page.createIsolatedWorld(frameId, worldName='pydoll::iframe::<frameId>', grantUniversalAccess=true)`

**Parameters**:
- `frameId`: The frame where the isolated world is created
- `worldName`: Identifier for the world (useful for debugging)
- `grantUniversalAccess`: Allows cross-origin access (needed for automation)

**Response**: `{ executionContextId: 42 }`

**Code**:

```python
# From pydoll/elements/web_element.py
@staticmethod
async def _create_isolated_world_for_frame(
    frame_id: str,
    handler: ConnectionHandler,
    session_id: Optional[str],
) -> int:
    """Create an isolated world for the given frame."""
    create_command = PageCommands.create_isolated_world(
        frame_id=frame_id,
        world_name=f'pydoll::iframe::{frame_id}',
        grant_universal_access=True,
    )
    if session_id:
        create_command['sessionId'] = session_id
    create_response: CreateIsolatedWorldResponse = await handler.execute_command(create_command)
    execution_context_id = create_response.get('result', {}).get('executionContextId')
    if not execution_context_id:
        raise InvalidIFrame('Unable to create isolated world for iframe')
    return execution_context_id
```

**Why isolated world**:

- **Isolation**: Our automation JavaScript doesn't interfere with the iframe's JavaScript
- **Anti-detection**: The iframe cannot detect our presence easily
- **Consistency**: Behavior is predictable regardless of iframe's script environment

**Outcome**: We have an `executionContextId` for running JavaScript in the iframe.

---

#### **Step 5: Pin the Iframe Document as a Runtime Object**

**Goal**: Obtain an `objectId` reference to the iframe's `document.documentElement` (the `<html>` element of the iframe).

**Method**: `Runtime.evaluate(expression='document.documentElement', contextId=executionContextId)`

**Why we need this**:

- To execute **relative queries** (like `element.querySelector()`) inside the iframe
- The `objectId` allows using `Runtime.callFunctionOn(objectId, ...)` with `this` bound to the iframe's document

**Code**:

```python
# From pydoll/elements/web_element.py
async def _set_iframe_document_object_id(self, execution_context_id: int) -> None:
    """Evaluate document.documentElement in the iframe context and cache its object id."""
    evaluate_command = RuntimeCommands.evaluate(
        expression='document.documentElement',
        context_id=execution_context_id,
    )
    if self._iframe_context and self._iframe_context.session_id:
        evaluate_command['sessionId'] = self._iframe_context.session_id
    evaluate_response: EvaluateResponse = await (
        (self._iframe_context.session_handler if self._iframe_context else None)
        or self._connection_handler
    ).execute_command(evaluate_command)
    result_object = evaluate_response.get('result', {}).get('result', {})
    document_object_id = result_object.get('objectId')
    if not document_object_id:
        raise InvalidIFrame('Unable to obtain document reference for iframe')
    if self._iframe_context:
        self._iframe_context.document_object_id = document_object_id
```

**Outcome**: The `_IFrameContext` is now fully populated and cached on the `WebElement`.

---

#### **Step 6: Cache and Propagate Context**

**Goal**: Store the resolved context on the iframe element and propagate it to all child elements found within the iframe.

**Caching**:

```python
# From pydoll/elements/web_element.py
def _init_iframe_context(
    self,
    frame_id: str,
    document_url: Optional[str],
    session_handler: Optional[ConnectionHandler],
    session_id: Optional[str],
) -> None:
    """Initialize and cache iframe context on this element."""
    self._iframe_context = _IFrameContext(frame_id=frame_id, document_url=document_url)
    # Clean up routing attributes (these were for nested iframes)
    if hasattr(self, '_routing_session_handler'):
        delattr(self, '_routing_session_handler')
    if hasattr(self, '_routing_session_id'):
        delattr(self, '_routing_session_id')
    # Store OOPIF routing if needed
    if session_handler and session_id:
        self._iframe_context.session_handler = session_handler
        self._iframe_context.session_id = session_id
```

**Propagation** (when finding elements inside the iframe):

```python
# From pydoll/elements/mixins/find_elements_mixin.py
def _apply_iframe_context_to_element(
    self, element: WebElement, iframe_context: _IFrameContext | None
) -> None:
    """Propagate iframe context to the newly created element."""
    if not iframe_context:
        return
    
    # If the child element is also an iframe, set up routing
    if getattr(element, 'is_iframe', False):
        element._routing_session_handler = (
            iframe_context.session_handler or self._connection_handler
        )
        element._routing_session_id = iframe_context.session_id
        element._routing_parent_frame_id = iframe_context.frame_id
        return
    
    # Otherwise, inject the parent iframe's context
    element._iframe_context = iframe_context
```

**Why propagation matters**:

- Elements found inside an iframe inherit the iframe's context
- This ensures subsequent operations (click, type, find nested elements) automatically use the correct routing
- Nested iframes receive routing information so they can resolve their own context relative to the parent iframe

---

## Session Routing and Flattened Mode

### The Flattened Session Model

As discussed in [Deep Dive → Fundamentals → CDP](./cdp.md), traditional CDP uses separate WebSocket connections for each target. **Flattened mode** is an optimization where all targets share a single WebSocket connection, with commands routed using a `sessionId`.

```mermaid
graph TB
    subgraph "Traditional Mode"
        WS1[WebSocket 1] --> MainPage[Main Page Target]
        WS2[WebSocket 2] --> Iframe1[OOPIF Target 1]
        WS3[WebSocket 3] --> Iframe2[OOPIF Target 2]
    end
    
    subgraph "Flattened Mode"
        WS[Single WebSocket] --> Router{CDP Router}
        Router -->|sessionId: null| MainPage2[Main Page Target]
        Router -->|sessionId: session-1| Iframe3[OOPIF Target 1]
        Router -->|sessionId: session-2| Iframe4[OOPIF Target 2]
    end
```

### How Session Routing Works

**When attaching to an OOPIF**:

```python
response = await handler.execute_command(
    TargetCommands.attach_to_target(target_id="iframe-target-id", flatten=True)
)
session_id = response['result']['sessionId']  # e.g., "8E6C...-1234"
```

**When sending a command to that OOPIF**:

```python
command = PageCommands.get_frame_tree()
command['sessionId'] = 'session-1'  # Route to the OOPIF
response = await handler.execute_command(command)
```

The browser's CDP implementation routes the command to the correct target based on the `sessionId`.

### Pydoll's Command Routing

Every command sent by Pydoll elements is automatically routed to the correct target:

```python
# From pydoll/elements/mixins/find_elements_mixin.py
def _resolve_routing(self) -> tuple[ConnectionHandler, Optional[str]]:
    """Resolve handler and sessionId for the current context."""
    # Check if element has an iframe context with OOPIF routing
    iframe_context = getattr(self, '_iframe_context', None)
    if iframe_context and getattr(iframe_context, 'session_handler', None):
        return iframe_context.session_handler, getattr(iframe_context, 'session_id', None)
    
    # Check if element has inherited routing from a parent iframe
    routing_handler = getattr(self, '_routing_session_handler', None)
    if routing_handler is not None:
        return routing_handler, getattr(self, '_routing_session_id', None)
    
    # Default: use the tab's main connection
    return self._connection_handler, None

async def _execute_command(
    self, command: Command[T_CommandParams, T_CommandResponse]
) -> T_CommandResponse:
    """Execute CDP command via resolved handler (60s timeout)."""
    handler, session_id = self._resolve_routing()
    if session_id:
        command['sessionId'] = session_id
    return await handler.execute_command(command, timeout=60)
```

**Routing logic**:

1. **Element inside OOPIF iframe**: Use `iframe_context.session_id` and `iframe_context.session_handler`
2. **Nested iframe (child of OOPIF)**: Use inherited `_routing_session_id` and `_routing_session_handler`
3. **Regular element or in-process iframe**: Use main connection (`_connection_handler`), no `sessionId`

### Extended Command Typing

To make `sessionId` type-safe, Pydoll extended the `Command` TypedDict:

```python
# From pydoll/protocol/base.py
class Command(TypedDict, Generic[T_CommandParams, T_CommandResponse]):
    """Base structure for all commands."""
    id: NotRequired[int]
    method: str
    params: NotRequired[T_CommandParams]
    sessionId: NotRequired[str]  # Added for flattened session routing
```

This allows type-checkers to recognize `command['sessionId'] = '...'` as valid without suppressing type warnings.

---

## Performance Considerations

### Caching Strategy

**First access is expensive**:

- `DOM.describeNode`: 1 round-trip
- Frame tree retrieval: 1+ round-trips (main + OOPIF targets)
- `DOM.getFrameOwner` per frame: N round-trips (in worst case)
- `Target.getTargets` + attachments: 1 + M round-trips (M = number of OOPIF targets)
- `Page.createIsolatedWorld`: 1 round-trip
- `Runtime.evaluate` (document): 1 round-trip

**Total**: Potentially 5-20+ round-trips depending on page structure.

**Subsequent access is O(1)**:

- `iframe_context` is cached on the `WebElement` instance
- Accessing `await iframe.iframe_context` multiple times returns the cached value immediately
- All elements found within the iframe inherit the context (no re-resolution)

### Optimization: Direct Child Target Lookup

In `_resolve_oopif_by_parent`, Pydoll first checks for direct children by `parentFrameId`:

```python
direct_children = [
    target_info
    for target_info in target_infos
    if target_info.get('type') in {'iframe', 'page'}
    and target_info.get('parentFrameId') == content_frame_id
]
if direct_children:
    # Attach immediately, skip scanning all targets
```

**Why this helps**:

- Most OOPIFs have `parentFrameId` correctly set
- Avoids attaching to every target speculatively
- Reduces round-trips from O(targets) to O(1) in the common case

### Asynchronous Parallel Resolution (Future Enhancement)

Currently, frame owner matching is sequential (check each frame one by one). A future optimization could parallelize:

```python
# Current (sequential)
for frame_node in frames:
    owner = await self._owner_backend_for(...)
    if owner == backend_node_id:
        return frame_node['id']

# Potential (parallel)
results = await asyncio.gather(*(
    self._owner_backend_for(..., frame['id'])
    for frame in frames
))
for i, owner in enumerate(results):
    if owner == backend_node_id:
        return frames[i]['id']
```

This would reduce latency from `N * RTT` to `RTT` (where RTT = round-trip time).

---

## Failure Modes and Debugging

### Common Failure Scenarios

#### 1. **InvalidIFrame: Unable to resolve frameId**

**Cause**:

- The iframe is dynamically created and hasn't fully initialized
- The iframe is sandboxed with restrictive policies
- Network issues delayed iframe loading

**Solutions**:

- **Wait for iframe**: Pass a timeout when locating it, e.g. `await tab.find(id='iframe', timeout=10)`
- **Check sandbox attribute**: Restrictive sandboxing (`<iframe sandbox>`) may block some CDP operations
- **Retry strategy**: Implement retry logic with exponential backoff

**Debugging**:

```python
try:
    iframe = await tab.find(id='problem-iframe')
    context = await iframe.iframe_context
except InvalidIFrame as e:
    # Inspect what we have
    node_info = await iframe._describe_node(object_id=iframe._object_id)
    print(f"Node info: {node_info}")
    
    # Check frame tree manually
    frame_tree = await WebElement._get_frame_tree_for(tab._connection_handler, None)
    print(f"Frame tree: {frame_tree}")
```

#### 2. **InvalidIFrame: Unable to create isolated world**

**Cause**:

- Frame has been destroyed/navigated away between resolution steps
- Chrome bug (rare)

**Solutions**:

- **Re-resolve context**: Clear cached context and re-access
- **Check navigation**: Ensure iframe isn't navigating during resolution

**Debugging**:

```python
# Clear cache and retry
iframe._iframe_context = None
context = await iframe.iframe_context
```

#### 3. **InvalidIFrame: Unable to obtain document reference**

**Cause**:

- The isolated world was created but the document isn't ready
- Frame is about to navigate

**Solutions**:

- Wait for frame load: Use Page events to detect `Page.frameNavigated` or `Page.loadEventFired`
- Retry with a small delay

#### 4. **Session routing failures (command times out or returns error)**

**Cause**:

- OOPIF target was detached (page navigated, iframe removed)
- `sessionId` is stale

**Solutions**:

- **Re-attach to target**: Create a new `ConnectionHandler` and re-resolve OOPIF
- **Validate target**: Call `Target.getTargets()` to check if target still exists

**Debugging**:

```python
# Check whether the OOPIF target still exists
targets = await handler.execute_command(TargetCommands.get_targets())
active_targets = [t['targetId'] for t in targets['result']['targetInfos']]
print(f"Active targets: {active_targets}")

if iframe._iframe_context and iframe._iframe_context.session_id:
    print(f"Our session: {iframe._iframe_context.session_id}")
```

### Diagnostic Tools

#### Enable CDP logging

```python
import logging
logging.basicConfig(level=logging.DEBUG)
logger = logging.getLogger('pydoll')
logger.setLevel(logging.DEBUG)
```

This logs all CDP commands and responses, useful for tracing iframe resolution steps.

#### Inspect iframe context

```python
iframe = await tab.find(id='my-iframe')
ctx = await iframe.iframe_context

print(f"Frame ID: {ctx.frame_id}")
print(f"Document URL: {ctx.document_url}")
print(f"Execution Context ID: {ctx.execution_context_id}")
print(f"Document Object ID: {ctx.document_object_id}")
print(f"Session ID (OOPIF): {ctx.session_id}")
print(f"Session Handler: {ctx.session_handler}")
```

---

## Conclusion

Pydoll's iframe handling represents a sophisticated implementation of CDP's frame management capabilities. By understanding:

- **The DOM**: Tree structure and node identification
- **Iframes**: Independent document contexts and security boundaries
- **OOPIFs**: Site isolation and target-based architecture
- **CDP domains**: Page, DOM, Target, Runtime coordination
- **Execution contexts**: Isolated worlds for clean automation
- **Identifiers**: backendNodeId, frameId, targetId, sessionId, executionContextId, objectId relationships
- **Resolution pipeline**: Multi-stage fallback strategy for finding frames
- **Session routing**: Flattened mode and automatic command routing

you can appreciate why manual context switching is eliminated. The complexity is real, but Pydoll abstracts it behind a simple, intuitive API:

```python
iframe = await tab.find(id='login-frame')
username = await iframe.find(name='username')
await username.type_text('user@example.com')
```

Three lines. No context switching. No target attachment. No session management. It just works.

---

## Further Reading

- **CDP Specification**: [Chrome DevTools Protocol - Page Domain](https://chromedevtools.github.io/devtools-protocol/tot/Page/)
- **CDP Specification**: [Chrome DevTools Protocol - DOM Domain](https://chromedevtools.github.io/devtools-protocol/tot/DOM/)
- **CDP Specification**: [Chrome DevTools Protocol - Target Domain](https://chromedevtools.github.io/devtools-protocol/tot/Target/)
- **CDP Specification**: [Chrome DevTools Protocol - Runtime Domain](https://chromedevtools.github.io/devtools-protocol/tot/Runtime/)
- **Chromium Site Isolation**: [Site Isolation - The Chromium Projects](https://www.chromium.org/Home/chromium-security/site-isolation/)
- **Content Scripts & Isolated Worlds**: [Chrome Extensions - Content Scripts](https://developer.chrome.com/docs/extensions/mv3/content_scripts/)
- **Pydoll Documentation**: [Deep Dive → Fundamentals → Chrome DevTools Protocol](./cdp.md)
- **Pydoll Documentation**: [Features → Automation → IFrames](../../features/automation/iframes.md)

---

!!! tip "Design Philosophy"
    The goal of Pydoll's iframe handling is **ergonomic automation**: write code as if iframes don't exist, and let the library handle the complexity. This deep dive showed what happens behind the scenes—but you never have to think about it in your automation scripts.


================================================
FILE: docs/en/deep-dive/fundamentals/index.md
================================================
# Core Fundamentals

**Master the foundation, everything else becomes easier.**

This section covers the **bedrock technologies** that power Pydoll: the Chrome DevTools Protocol (CDP), WebSocket-based async communication, and Python's type system integration. These aren't just implementation details; they're the **fundamental design decisions** that make Pydoll fast, powerful, and type-safe.

## Why Fundamentals Matter

Most automation frameworks abstract away their communication layer, leaving you with a "black box" that works until it doesn't. When something breaks, debugging and optimization become difficult without understanding the underlying mechanisms.

**Pydoll takes a different approach**: we expose and explain the fundamentals, enabling you to work as both a **framework user** and a **protocol engineer**.

!!! quote "The Power of First Principles"
    **"If you know the way broadly, you will see it in all things."** - Miyamoto Musashi
    
    Understanding CDP, async communication, and type systems isn't just about Pydoll; it's about understanding **how modern browser automation works at its core**. This knowledge transfers to any CDP-based tool and any async Python project.

## The Three Pillars

### 1. Chrome DevTools Protocol (CDP)
**[→ Read CDP Deep Dive](./cdp.md)**

**The protocol that powers modern browser automation.**

CDP is Chrome's native debugging protocol, the same one Chrome DevTools (F12) uses. By communicating directly with CDP, Pydoll:

- **Eliminates WebDriver** (no Selenium overhead, no geckodriver/chromedriver intermediaries)
- **Gains deep control** (modify requests, intercept events, execute privileged operations)
- **Achieves native speed** (direct WebSocket communication, no HTTP polling)
- **Becomes undetectable** (no `navigator.webdriver`, no WebDriver fingerprints)

**What you'll learn:**

- How CDP organizes functionality into domains (Page, Network, DOM, Fetch, etc.)
- The command/event architecture that powers reactive automation
- Why CDP-based tools are **fundamentally more powerful** than Selenium
- How to read CDP documentation and extend Pydoll

**Why this matters**: CDP isn't just Pydoll's implementation detail; it's the foundation of modern browser automation. Puppeteer, Playwright, and similar tools all use CDP. Understanding it once provides knowledge applicable across multiple tools.

---

### 2. The Connection Layer
**[→ Read Connection Layer Architecture](./connection-layer.md)**

**Async communication done right.**

While CDP defines **what** you can do, the Connection Layer defines **how** Pydoll communicates with the browser. This is where protocol messages become Python objects, where async/await patterns enable concurrency, and where WebSockets provide real-time bidirectional communication.

**What you'll learn:**

- WebSocket architecture: persistent connections, message framing, keep-alive
- The async/await pattern: why `async def` and `await` enable concurrent automation
- Command/response correlation: how Pydoll matches responses to requests
- Event dispatching: how browser events trigger Python callbacks
- Error handling: timeout management, connection failures, graceful degradation

**Why this matters**: The connection layer is the communication backbone of Pydoll. Understanding it enables:

- **Effective debugging**: Inspect messages flowing between Python and Chrome
- **Performance optimization**: Identify latency sources and parallelize operations
- **Extension capabilities**: Add custom CDP commands or modify existing behavior

---

### 3. Python Type System Integration
**[→ Read Type System Deep Dive](./typing-system.md)**

**Types provide both safety and productivity.**

Python's type system (introduced in 3.5, enhanced in every version since) significantly improves development experience. Pydoll leverages `TypedDict`, `Literal`, `overload`, and generics to provide:

- **IDE autocomplete** for CDP response fields
- **Type checking** to catch bugs before runtime (`mypy`, `pyright`)
- **Self-documenting code** (function signatures reveal structure)
- **Refactoring safety** (rename a field, IDE updates all usages)

**What you'll learn:**

- How `TypedDict` models CDP event/response structures
- Why `overload` provides precise return types for `find()`/`query()`
- How generics (`TypeVar`, `Generic[T]`) enable flexible command construction
- Practical patterns: annotating callbacks, typing async functions, using `Literal`
- Tool integration: configuring mypy, leveraging IDE type inference

**Why this matters**: Type hints have become increasingly important in modern Python. Pydoll's comprehensive type coverage means:

- **Faster development**: Autocomplete reveals available fields and methods
- **Fewer bugs**: Type checker catches errors before they reach production
- **Better refactoring**: Change signatures confidently with IDE support

---

## How These Fundamentals Connect

Understanding how CDP, async communication, and type systems work **together** is key:

```mermaid
graph TB
    Python[Python Code:<br/>await tab.go_to#40;url#41;]
    
    Python --> TypeSystem[Type System:<br/>Function signature reveals<br/>parameters & return type]
    
    TypeSystem --> ConnectionLayer[Connection Layer:<br/>Serialize command to JSON,<br/>send via WebSocket]
    
    ConnectionLayer --> CDP[CDP:<br/>Browser receives<br/>Page.navigate command]
    
    CDP --> Browser[Chrome:<br/>Executes navigation,<br/>emits events]
    
    Browser --> CDPEvents[CDP Events:<br/>Page.loadEventFired,<br/>Network.requestWillBeSent]
    
    CDPEvents --> ConnectionLayer2[Connection Layer:<br/>Deserialize events,<br/>dispatch to callbacks]
    
    ConnectionLayer2 --> TypedDicts[TypedDict:<br/>Event data as<br/>typed dictionary]
    
    TypedDicts --> PythonCallback[Python Callback:<br/>IDE shows available fields<br/>via type inference]
```

**The flow**:

1. You write Python code with **type annotations** (Type System)
2. Code serializes to JSON and sends via **WebSocket** (Connection Layer)
3. Browser receives and executes **CDP commands** (CDP)
4. Browser emits **CDP events** back (CDP)
5. Events deserialize into **TypedDict instances** (Type System)
6. Your callbacks receive **type-safe event objects** (Type System)

Each layer **amplifies** the others:

- Types make CDP responses discoverable
- CDP's event model enables async patterns
- Async communication makes types essential (what fields exist on this response?)

## Learning Path

We recommend this progression:

### Step 1: CDP
**[Start Here: Chrome DevTools Protocol](./cdp.md)**

Understand the protocol that powers everything. Learn domains, commands, events, and how to read CDP documentation.

**Outcome**: You'll know how to find and use any CDP feature, not just what Pydoll exposes.

### Step 2: Connection Layer
**[Continue: Connection Layer Architecture](./connection-layer.md)**

Deep dive into WebSocket communication, async patterns, and event dispatching.

**Outcome**: You'll understand exactly how messages flow between Python and Chrome, enabling debugging and optimization.

### Step 3: Type System
**[Finish: Python Type System](./typing-system.md)**

Learn how Pydoll uses modern Python typing for safety and productivity.

**Outcome**: You'll write type-safe automation with full IDE support, catching bugs before they run.

## Prerequisites

To get the most from this section:

- **Python fundamentals** - Functions, classes, decorators
- **Basic async/await** - Understand `async def` and `await` keywords
- **JSON familiarity** - Know how objects/arrays serialize
- **Browser DevTools** - Have used Chrome Inspector (F12)  

**If you're new to async Python**, read this first: [Real Python: Async IO in Python](https://realpython.com/async-io-python/)

## Beyond the Basics

Once you've mastered these fundamentals, you'll be ready for:

- **[Internal Architecture](../architecture/browser-domain.md)** - How Pydoll's components fit together
- **[Network & Security](../network/index.md)** - Protocol-level understanding for proxies
- **[Fingerprinting](../fingerprinting/index.md)** - Detection techniques requiring CDP knowledge

## Common Questions

### "Do I need to understand this to use Pydoll?"

**No**, but understanding these fundamentals will make you more effective. Basic usage works fine without this knowledge. However, when you need to:

- Debug why something isn't working
- Optimize slow automation
- Extend Pydoll with custom CDP commands
- Understand error messages
- Contribute to the project

These fundamentals become very helpful.

### "Isn't this too low-level?"

This level of detail is intentional. Most frameworks hide these fundamentals, but that abstraction has a cost. Exposing them pays off in three ways:

- Understanding enables better debugging
- Visibility enables optimization
- Knowledge enables extension

By teaching fundamentals, we enable you to go beyond what Pydoll provides out-of-the-box.

### "How much of this do I need to memorize?"

**None of it.** The goal is building mental models, not memorization. After reading these sections, you'll develop intuition for:

- "This needs CDP, let me check the protocol docs"
- "This is slow because of sequential await, let me parallelize"
- "This type error means I'm using the wrong field name"

The specifics fade, but the understanding remains.

## Philosophy

These fundamentals represent long-lasting knowledge:

- **CDP** is Chrome's native protocol and continues to evolve
- **Async/await** is Python's standard for concurrency
- **Type systems** are increasingly important in Python (PEP 484 onwards)

Learning these concepts provides value across your development career.

---

## Ready to Build Your Foundation?

Start with **[Chrome DevTools Protocol](./cdp.md)** to understand the protocol that powers everything. Then progress through the Connection Layer and Type System to complete your fundamental understanding.

**This is where automation becomes engineering.**

---

!!! tip "After Completing Fundamentals"
    Once you've mastered these concepts, you'll see them **everywhere** in Pydoll's architecture:
    
    - Browser/Tab/WebElement all use the **Connection Layer**
    - Network events all follow **CDP's event model**
    - All responses use **TypedDict** for type safety
    
    The fundamentals aren't separate from Pydoll; they **are** Pydoll's foundation.


================================================
FILE: docs/en/deep-dive/fundamentals/typing-system.md
================================================
# Python's Type System & Pydoll

Pydoll leverages Python's type system extensively to provide excellent IDE support, catch errors early, and make the API self-documenting. This guide explains the basics of type hints and how Pydoll uses them to enhance your development experience.

## Type Hints Basics

Type hints are optional annotations that specify what type of value a variable, parameter, or return value should be. They don't affect runtime behavior but enable powerful tooling.

### Simple Type Hints

```python
# Basic types
name: str = "Pydoll"
port: int = 9222
is_headless: bool = False
quality: float = 0.85

# Function annotations
def navigate(url: str, timeout: int = 30) -> bool:
    # ... implementation
    return True
```

### Container Types

```python
from typing import List, Dict, Optional

# Lists and dictionaries
urls: List[str] = ['https://example.com', 'https://google.com']
headers: Dict[str, str] = {'User-Agent': 'MyBot/1.0'}

# Optional values (can be None)
target_id: Optional[str] = None

# Modern syntax (Python 3.9+)
urls: list[str] = ['https://example.com']
headers: dict[str, str] = {'User-Agent': 'MyBot/1.0'}
```

!!! tip "Python 3.9+ Syntax"
    Pydoll's codebase uses the older `List[]`, `Dict[]` syntax for backward compatibility, but you can use lowercase `list[]`, `dict[]` in your code if you're on Python 3.9+.

## TypedDict: Structured Dictionaries

TypedDict allows you to define dictionary structures with specific keys and value types. This is **heavily used** in Pydoll's CDP protocol definitions.

### Basic TypedDict

```python
from typing import TypedDict

class UserInfo(TypedDict):
    name: str
    age: int
    email: str

# IDE knows exactly what keys exist
user: UserInfo = {
    'name': 'Alice',
    'age': 30,
    'email': 'alice@example.com'
}

# Autocomplete works!
print(user['name'])  # IDE suggests: name, age, email
```

### How Pydoll Uses TypedDict

Pydoll defines **every CDP command, response, and event** as a TypedDict. This means your IDE knows exactly what properties are available:

```python
# From pydoll/protocol/page/methods.py
class CaptureScreenshotParams(TypedDict, total=False):
    """Parameters for captureScreenshot."""
    format: ScreenshotFormat
    quality: int
    clip: Viewport
    fromSurface: bool
    captureBeyondViewport: bool
    optimizeForSpeed: bool

class CaptureScreenshotResult(TypedDict):
    """Result for captureScreenshot command."""
    data: str
```

When you call methods that return CDP responses, your IDE autocompletes the response keys:

```python
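async def example():
    # Low-level call: execute_command returns the typed CDP response
    command = PageCommands.capture_screenshot(format=ScreenshotFormat.PNG)
    response = await connection_handler.execute_command(command)
    
    # IDE knows this is CaptureScreenshotResponse
    # and suggests 'result' -> 'data'
    screenshot_data = response['result']['data']  # Full autocomplete!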
```

### Optional vs Required Fields

TypedDict supports optional fields using `NotRequired[]`:

```python
from typing import TypedDict, NotRequired

# From pydoll/protocol/network/methods.py
class GetCookiesParams(TypedDict):
    """Parameters for retrieving browser cookies."""
    urls: NotRequired[list[str]]  # This field is optional
```

The `total=False` flag makes **all** fields optional:

```python
class CaptureScreenshotParams(TypedDict, total=False):
    format: ScreenshotFormat  # All fields optional
    quality: int
    clip: Viewport
```

!!! info "Autocomplete Magic"
    When you type `response['`, your IDE shows you all available keys with their types. This is TypedDict's superpower in action!

## Enums: Type-Safe Constants

Enums provide type-safe constants that your IDE can autocomplete. Pydoll uses them extensively for CDP values.

### Basic Enums

```python
from enum import Enum

class ScreenshotFormat(str, Enum):
    JPEG = 'jpeg'
    PNG = 'png'
    WEBP = 'webp'

# IDE autocompletes available formats
format = ScreenshotFormat.PNG  # Type is ScreenshotFormat
print(format.value)  # 'png'
```

### Pydoll's Enum Usage

```python
from pydoll.constants import Key
from pydoll.protocol.page.types import ScreenshotFormat
from pydoll.protocol.input.types import KeyModifier

# Finding elements - uses kwargs, not enums
element = await tab.find(id='submit-btn')
element = await tab.find(class_name='btn-primary')
element = await tab.find(tag_name='button')

# Keyboard input - IDE suggests all keys
await element.press_keyboard_key(Key.ENTER)
await element.press_keyboard_key(Key.TAB)
await element.press_keyboard_key(Key.ESCAPE)

# Modifiers are integer enums (for special keys)
await element.press_keyboard_key(Key.TAB, modifiers=KeyModifier.SHIFT)

# Screenshot format enum
await tab.take_screenshot('file.webp', format=ScreenshotFormat.WEBP)
```

!!! tip "Enum Autocomplete"
    Type `Key.` or `ScreenshotFormat.` and your IDE shows all available options. No more memorizing strings!

## Function Overloads

Overloads allow a function to return different types based on its parameters. Pydoll uses this to provide precise type information.

### Basic Overload Example

```python
from typing import overload

# Overload signatures (not executed)
@overload
def process(data: str) -> str: ...

@overload
def process(data: int) -> int: ...

# Actual implementation
def process(data):
    return data * 2

# IDE knows return types
result1 = process("hello")  # Type: str
result2 = process(42)       # Type: int
```

### Pydoll's Overload Usage

The `find()` and `query()` methods return different types depending on the `find_all` parameter:

```python
# From pydoll/elements/mixins/find_elements_mixin.py
class FindElementsMixin:
    @overload
    async def find(
        self, find_all: Literal[False] = False, **kwargs
    ) -> WebElement: ...
    
    @overload
    async def find(
        self, find_all: Literal[True], **kwargs
    ) -> list[WebElement]: ...
    
    async def find(
        self, find_all: bool = False, **kwargs
    ) -> Union[WebElement, list[WebElement]]:
        # Implementation...
```

In your code:

```python
# find_all=False (default) - IDE knows return type is WebElement
button = await tab.find(id='submit-btn')
await button.click()  # Single element methods available!

# find_all=True - IDE knows return type is list[WebElement]
buttons = await tab.find(class_name='btn', find_all=True)
for btn in buttons:  # IDE knows this is a list!
    await btn.click()

# Same with query()
element = await tab.query('#submit-btn')  # Type: WebElement
elements = await tab.query('.btn', find_all=True)  # Type: list[WebElement]
```

!!! tip "Smart Type Inference"
    Your IDE automatically knows whether you're getting a single element or a list based on the `find_all` parameter. No casting or type assertions needed!

## Generic Types

Generics are like "type containers" that work with different types while preserving type information. Think of them as templates that adapt to whatever you put inside.

### Understanding Generics: A Simple Analogy

Imagine a `Box` that can hold anything. Without generics:

```python
# Without generics - IDE doesn't know what's inside
class Box:
    def __init__(self, content):
        self.content = content
    
    def get(self):
        return self.content

my_box = Box("hello")
item = my_box.get()  # Type: Unknown - could be anything!
```

With generics:

```python
from typing import Generic, TypeVar

T = TypeVar('T')  # T is a "type placeholder"

class Box(Generic[T]):
    def __init__(self, content: T):
        self.content = content
    
    def get(self) -> T:
        return self.content

# Now IDE knows exactly what's inside each box
string_box: Box[str] = Box("hello")
item1 = string_box.get()  # Type: str

number_box: Box[int] = Box(42)
item2 = number_box.get()  # Type: int

# List is a built-in generic
numbers: list[int] = [1, 2, 3]  # List that contains ints
names: list[str] = ["Alice", "Bob"]  # List that contains strings
```

!!! tip "Generics Simplify Type Hints"
    Instead of writing `Union[List[str], List[int], List[float], ...]` for every possible list type, generics let you write one reusable `list[T]` that adapts to whatever you put inside.

### Real-World Generic Example

```python
from typing import TypeVar, Generic

T = TypeVar('T')

class Response(Generic[T]):
    """A generic API response wrapper."""
    def __init__(self, data: T, status: int):
        self.data = data
        self.status = status
    
    def get_data(self) -> T:
        return self.data

# Each response preserves its data type
user_response: Response[dict] = Response({"name": "Alice"}, 200)
user_data = user_response.get_data()  # Type: dict

count_response: Response[int] = Response(42, 200)
count = count_response.get_data()  # Type: int
```

### How Pydoll Uses Generics

Pydoll's CDP command system uses generics to ensure the response type matches the command:

```python
# From pydoll/protocol/base.py
from typing import Generic, TypeVar

T_CommandParams = TypeVar('T_CommandParams')
T_CommandResponse = TypeVar('T_CommandResponse')

class Command(TypedDict, Generic[T_CommandParams, T_CommandResponse]):
    """Base structure for all commands."""
    id: NotRequired[int]
    method: str
    params: NotRequired[T_CommandParams]

class Response(TypedDict, Generic[T_CommandResponse]):
    """Base structure for all responses."""
    id: int
    result: T_CommandResponse
```

This means when you execute a command, the response type is automatically inferred:

```python
# PageCommands.navigate returns Command[NavigateParams, NavigateResult]
command = PageCommands.navigate('https://example.com')

# ConnectionHandler.execute_command preserves the generic type
response = await connection_handler.execute_command(command)

# IDE knows response['result'] is NavigateResult (not just "any dict")
frame_id = response['result']['frameId']  # Autocomplete works!
loader_id = response['result']['loaderId']  # All fields are known!
```

!!! info "Why Generics Matter in Pydoll"
    Without generics, every CDP response would just be typed as `dict[str, Any]`, and you'd lose all autocomplete. With generics, the IDE knows the exact structure of each response based on which command you sent.

## Union Types

Unions represent values that could be one of several types:

```python
from typing import Union

# Can be string or int
identifier: Union[str, int] = "user-123"
identifier = 456  # Also valid

# Modern syntax (Python 3.10+)
identifier: str | int = "user-123"
```

### Pydoll's Union Usage

```python
# File paths can be strings or Path objects
from pathlib import Path

async def upload_file(files: Union[str, Path, list[Union[str, Path]]]):
    # Handles multiple input types
    pass

# All of these work:
await tab.expect_file_chooser('/path/to/file.txt')
await tab.expect_file_chooser(Path('/path/to/file.txt'))
await tab.expect_file_chooser(['/file1.txt', Path('/file2.txt')])
```

## Practical Benefits in Pydoll

### 1. Intelligent Autocomplete

Your IDE suggests available keys, methods, and values:

```python
from pydoll.protocol.page.events import PageEvent
from pydoll.protocol.network.types import ResourceType
from pydoll.protocol.input.types import KeyModifier
from pydoll.constants import Key

# Autocomplete for event names
await tab.on(PageEvent.LOAD_EVENT_FIRED, callback)
await tab.on(PageEvent.JAVASCRIPT_DIALOG_OPENING, callback)

# Autocomplete for resource types
await tab.enable_fetch_events(resource_type=ResourceType.XHR)
await tab.enable_fetch_events(resource_type=ResourceType.DOCUMENT)

# Autocomplete for keys
await element.press_keyboard_key(Key.ENTER)
await element.press_keyboard_key(Key.TAB, modifiers=KeyModifier.SHIFT)

# Autocomplete for kwargs in find()
element = await tab.find(id='submit-btn')  # IDE suggests: id, class_name, tag_name, etc.
```

### 2. Catch Errors Early

Type checkers like mypy or Pylance catch errors before runtime:

```python
# Type checker catches this
await tab.take_screenshot('file.png', quality='high')  # Error: quality must be int

# Type checker catches this
event = await tab.find(id='button')
await tab.on(event, callback)  # Error: event is WebElement, not str

# Correct
await tab.take_screenshot('file.png', quality=90)
await tab.on(PageEvent.LOAD_EVENT_FIRED, callback)
```

### 3. Self-Documenting Code

Types serve as inline documentation:

```python
# You immediately know what each parameter expects
async def take_screenshot(
    self,
    path: Optional[str] = None,
    quality: int = 100,
    beyond_viewport: bool = False,
    as_base64: bool = False,
) -> Optional[str]:
    pass
```

### 4. CDP Response Navigation

Navigate complex CDP responses with confidence:

```python
# From pydoll/protocol/browser/methods.py
class GetVersionResult(TypedDict):
    protocolVersion: str
    product: str
    revision: str
    userAgent: str
    jsVersion: str

# In your code
version_info = await browser.get_version()

# IDE suggests all available keys
print(version_info['product'])         # Autocomplete!
print(version_info['userAgent'])       # Autocomplete!
print(version_info['protocolVersion']) # Autocomplete!
```

## Type Checking Your Code

### Using Pylance (VS Code)

Pylance provides real-time type checking in VS Code:

1. Install the Pylance extension
2. Set type checking mode in settings:

```json
{
    "python.analysis.typeCheckingMode": "basic"  // or "strict"
}
```

Now you get instant feedback:

```python
from pydoll.browser.chromium import Chrome

async def main():
    async with Chrome() as browser:
        tab = await browser.start()
        
        # Pylance shows parameter types as you type
        await tab.go_to('https://example.com', timeout=30)
        
        # Pylance warns about wrong types
        await tab.take_screenshot(quality='high')  # Warning!
```

### Using mypy

Run mypy to check your entire project:

```bash
pip install mypy
mypy your_script.py
```

Example output:

```
your_script.py:10: error: Argument "quality" to "take_screenshot" has incompatible type "str"; expected "int"
Found 1 error in 1 file (checked 1 source file)
```

## Pydoll's Protocol Type System

Pydoll's `protocol/` directory contains comprehensive type definitions for the entire Chrome DevTools Protocol:

```
pydoll/protocol/
├── base.py              # Generic Command, Response, CDPEvent types
├── browser/
│   ├── events.py        # BrowserEvent enum, event parameter TypedDicts
│   ├── methods.py       # Browser method enums, parameter/result TypedDicts
│   └── types.py         # Browser domain types (Bounds, PermissionType, etc.)
├── dom/
│   ├── events.py        # DOM event definitions
│   ├── methods.py       # DOM command definitions
│   └── types.py         # DOM types (Node, BackendNode, etc.)
├── page/
│   ├── events.py        # Page events (LOAD_EVENT_FIRED, etc.)
│   ├── methods.py       # Page methods (navigate, captureScreenshot, etc.)
│   └── types.py         # Page types (Frame, ScreenshotFormat, etc.)
├── network/
│   └── ...              # Network domain types
└── ...                  # Other CDP domains
```

### Example: Complete Type Flow

Let's trace a complete type flow from command to response:

```python
# 1. Method enum (protocol/page/methods.py)
class PageMethod(str, Enum):
    CAPTURE_SCREENSHOT = 'Page.captureScreenshot'

# 2. Parameter TypedDict (protocol/page/methods.py)
class CaptureScreenshotParams(TypedDict, total=False):
    format: ScreenshotFormat
    quality: int
    clip: Viewport

# 3. Result TypedDict (protocol/page/methods.py)
class CaptureScreenshotResult(TypedDict):
    data: str

# 4. Command creation (commands/page_commands.py)
class PageCommands:
    @staticmethod
    def capture_screenshot(
        format: Optional[ScreenshotFormat] = None,
        quality: Optional[int] = None,
        ...
    ) -> Command[CaptureScreenshotParams, CaptureScreenshotResult]:
        return {
            'method': PageMethod.CAPTURE_SCREENSHOT,
            'params': {...}
        }

# 5. Usage in Tab (browser/tab.py)
class Tab:
    async def take_screenshot(...) -> Optional[str]:
        response: CaptureScreenshotResponse = await self._execute_command(
            PageCommands.capture_screenshot(...)
        )
        screenshot_data = response['result']['data']  # Fully typed!
        return screenshot_data
```

Every step maintains type information, giving you autocomplete and type checking throughout!

## Best Practices

### 1. Let Pydoll's Types Guide You

Don't fight the types; they're there to help:

```python
# Good: Use kwargs (IDE autocompletes parameter names)
element = await tab.find(id='submit-btn')
button = await tab.find(class_name='btn-primary')

# Good: Use enums where applicable
from pydoll.constants import Key
await element.press_keyboard_key(Key.ENTER)

# Avoid: Magic strings
await element.press_keyboard_key('Enter')  # No autocomplete, error-prone
```

### 2. Explore Types in Your IDE

Hover over variables to see their types:

```python
# Hover over 'response' to see: Response[CaptureScreenshotResult]
response = await tab._execute_command(PageCommands.capture_screenshot(...))

# Hover over 'data' to see: str
data = response['result']['data']
```


### 3. Don't Over-Annotate

Type checkers infer the types of simple assignments on their own, so you don't need to annotate everything:

```python
# Too much
name: str = "Alice"
count: int = 5
is_active: bool = True

# Let the type checker infer simple literals
name = "Alice"
count = 5
is_active = True

# Annotate when type isn't obvious
from typing import Optional

result: Optional[WebElement] = await tab.find(id='missing', raise_exc=False)
```

## Learn More

For deeper understanding of Python's type system and CDP protocol:

- **[Python typing documentation](https://docs.python.org/3/library/typing.html)**: Official Python typing reference
- **[PEP 484](https://peps.python.org/pep-0484/)**: The original type hints proposal
- **[Chrome DevTools Protocol](https://chromedevtools.github.io/devtools-protocol/)**: CDP documentation
- **[Deep Dive: CDP](./cdp.md)**: How Pydoll implements CDP
- **[API Reference: Protocol](../api/protocol/base.md)**: Pydoll's protocol type definitions

The type system transforms Pydoll from a simple automation library into a **type-safe, self-documenting, IDE-friendly** framework. It catches bugs before they happen and makes exploring the API a breeze!


================================================
FILE: docs/en/deep-dive/guides/index.md
================================================
# Practical Guides

**Theory meets practice: actionable patterns for real automation challenges.**

While the other Deep Dive sections explore **fundamentals** and **architecture**, this section provides **practical, battle-tested guides** for common automation scenarios. These aren't academic exercises; they're patterns refined through production use.

## The Purpose of Guides

You've learned:

- **[Fundamentals](../fundamentals/cdp.md)** - CDP, async, types
- **[Architecture](../architecture/browser-domain.md)** - Internal design patterns
- **[Network](../network/index.md)** - Protocols and proxies
- **[Fingerprinting](../fingerprinting/index.md)** - Detection and evasion

Now what? **How do you apply this knowledge to real problems?**

That's what guides are for: **bridging theory and practice**.

!!! quote "Practical Wisdom"
    **"In theory, theory and practice are the same. In practice, they are not."** - Yogi Berra
    
    Guides distill complex technical knowledge into **actionable patterns** you can use immediately. They show you **what works** in production, not just what's theoretically possible.

## Current Guides

### CSS Selectors vs XPath
**[→ Read Selectors Guide](./selectors-guide.md)**

**The eternal debate, solved with data and best practices.**

Choosing between CSS selectors and XPath isn't about preference. It's about understanding **tradeoffs**, **performance characteristics**, and **maintainability**.

**What you'll learn**:

- **Syntax comparison** - Side-by-side examples for common patterns
- **Performance benchmarks** - Real measurements, not myths
- **Power vs simplicity** - When CSS isn't enough (text matching, axes)
- **Browser support** - Compatibility and edge cases
- **Best practices** - When to use each, anti-patterns to avoid
- **Complex examples** - Real-world selector challenges solved

**Why this matters**: Element location is the **foundation** of automation. Choose the wrong tool, and you'll fight your selectors forever. Choose wisely, and automation becomes straightforward.

---

## Coming Soon

### Asyncio & Concurrent Automation
**Coming in future releases**

**Deep dive into Python's asyncio: event loop internals, practical concurrency patterns, and real-world examples.**

Understanding asyncio is fundamental to Pydoll. This guide provides a comprehensive analysis of Python's event loop, concurrency primitives, and how to apply them to browser automation without footguns.

**Will cover**:

- **Event Loop Internals**: How `asyncio.run()` works, task scheduling, and execution flow
- **Async/Await Deep Dive**: Coroutines, futures, and the async state machine
- **Concurrency Primitives**: `gather()`, `create_task()`, `TaskGroup`, and when to use each
- **Rate Limiting**: Semaphores, queues, and throttling strategies
- **Real-World Examples**: Multi-tab scraping, parallel form filling, coordinated browser instances
- **Common Pitfalls**: Blocking the event loop, task cancellation, exception propagation
- **Performance Analysis**: Profiling async code, identifying bottlenecks, optimizing I/O

**Why this matters**: Asyncio powers Pydoll's architecture. Master it, and you unlock true concurrent automation without race conditions or state corruption.

---

### Architectural Patterns & Robust Selectors
**Coming in future releases**

**PageObject pattern, maintainable selectors, and architectural approaches for scalable automation.**

Move beyond ad-hoc scripts to structured, maintainable automation architectures. Learn patterns that scale from simple scripts to production systems.

**Will cover**:

- **PageObject Pattern**: Encapsulating page structure, reducing duplication, improving maintainability
- **Robust Selector Strategies**: Building selectors that survive page changes, avoiding brittle locators
- **Component Abstraction**: Reusable components for common UI patterns (modals, dropdowns, tables)
- **Waiting Strategies**: Smart waiting patterns beyond simple timeouts
- **State Management**: Managing automation state across pages and flows
- **Testing Patterns**: How to structure automation code for testability
- **Real-World Architecture**: Production-ready project structure and organization

**Why this matters**: The difference between throwaway scripts and maintainable automation systems is architecture. Learn patterns that make your code resilient to change.

---

## Guide Philosophy

Guides follow consistent principles:

### 1. Production-Ready Code
All examples are **complete and tested**, not pseudocode or simplified demonstrations. You can copy-paste and adapt to your needs.

### 2. Real-World Scenarios
Guides address **actual problems** encountered in production automation, not contrived examples.

### 3. Tradeoff Analysis
When multiple approaches exist, guides **compare** them objectively with pros/cons, not just "here's one way."

### 4. Progressive Complexity
Start simple, add complexity incrementally. Basic pattern first, then edge cases and advanced variations.

### 5. Anti-Patterns Highlighted
Show **what NOT to do** explicitly: common mistakes caught through code review or production debugging.

## How to Use Guides

Guides are **reference material**, not sequential tutorials:

- **Skim** for patterns relevant to your current problem  
- **Bookmark** guides you'll need repeatedly  
- **Adapt** examples to your specific context  
- **Combine** patterns from multiple guides  

Don't read sequentially cover-to-cover.  
Don't blindly copy without understanding tradeoffs.  
Don't use outdated patterns (check publication date).  

## Contributing Guides

Have a pattern worth sharing? Guides are **community-driven**:

**What makes a good guide**:

- Solves a **real problem** encountered in production
- Provides **working code**, not just concepts
- Compares **multiple approaches** with tradeoffs
- Highlights **common mistakes** explicitly
- Explains **why**, not just **how**

See [Contributing](../../CONTRIBUTING.md) for submission guidelines.

## Guides vs Features Documentation

**Confused about the difference?**

| | Features Documentation | Deep Dive Guides |
|---|---|---|
| **Purpose** | Teach what Pydoll can do | Show how to solve problems |
| **Scope** | Single method/feature | Multiple features combined |
| **Depth** | API reference + examples | Patterns + tradeoffs + best practices |
| **Order** | Structured by component | Structured by problem |
| **Examples** | Simple, isolated | Complex, production-ready |

**Use Features for**: Learning Pydoll's API  
**Use Guides for**: Solving real automation challenges

## Beyond Guides

After mastering practical patterns:

- **[Architecture](../architecture/browser-domain.md)** - Understand why patterns work
- **[Network](../network/index.md)** - Network-level optimization
- **[Fingerprinting](../fingerprinting/evasion-techniques.md)** - Anti-detection techniques

Guides provide **immediate value**. Architecture provides **deep understanding**. Both make you effective.

---

## Ready for Practical Patterns?

Start with **[CSS Selectors vs XPath](./selectors-guide.md)** to master element location, the foundation of all automation.

**More guides coming soon. Star the repo to stay updated!**

---

!!! tip "Request a Guide"
    Have an automation pattern you'd like documented? Open an issue titled "Guide Request: [Topic]" describing:
    
    - The problem you're trying to solve
    - What you've tried so far
    - Why existing documentation doesn't cover it
    
    We prioritize guides based on community need.

## Quick Reference

**Available Now:**

- [CSS Selectors vs XPath](./selectors-guide.md)

**Coming Soon:**

- Asyncio & Concurrent Automation
- Architectural Patterns & Robust Selectors

**Timeline**: New guides added based on community feedback and production learnings.


================================================
FILE: docs/en/deep-dive/guides/selectors-guide.md
================================================
# CSS Selectors vs XPath: A Complete Guide

When using the `query()` method, you have two powerful selector languages at your disposal: CSS Selectors and XPath. Understanding when and how to use each is crucial for effective element location.

## Fundamental Differences

| Aspect | CSS Selector | XPath |
|--------|--------------|-------|
| **Syntax** | Simple, CSS-like | XML path language |
| **Performance** | Faster (native browser support) | Slightly slower |
| **Direction** | Only traverses down and sideways | Can traverse in any direction |
| **Text Matching** | Limited (pseudo-selectors) | Powerful text functions |
| **Complexity** | Best for simple to moderate cases | Excels at complex relationships |
| **Readability** | More intuitive for web developers | Steeper learning curve |

## When to Use CSS Selectors

CSS selectors are ideal for:

- Simple element selection by ID, class, or tag
- Direct parent-child relationships
- Attribute matching with simple patterns
- Performance-critical scenarios
- When traversing downward in the DOM

```python
# Clean and performant CSS examples
await tab.query("#login-form")
await tab.query(".submit-button")
await tab.query("div.container > p.intro")
await tab.query("input[type='email'][required]")
await tab.query("ul.menu li:first-child")
```

## When to Use XPath

XPath is ideal for:

- Complex text matching and partial text searches
- Traversing upward to parent elements
- Finding elements relative to siblings
- Conditional logic in selectors
- Complex DOM relationships

```python
# Powerful XPath examples
await tab.query("//button[contains(text(), 'Submit')]")
await tab.query("//input[@name='email']/parent::div")
await tab.query("//td[text()='John']/following-sibling::td[2]")
await tab.query("//div[contains(@class, 'product') and @data-price > 100]")
```

## CSS Selector Syntax Reference

### Basic Selectors

```python
# Element selector
await tab.query("div")              # First <div> element
await tab.query("div", find_all=True)  # All <div> elements
await tab.query("button")           # First <button> element

# ID selector
await tab.query("#username")        # Element with id="username"

# Class selector
await tab.query(".submit-btn")      # First element with class="submit-btn"
await tab.query(".submit-btn", find_all=True)  # All elements with class
await tab.query(".btn.primary")     # First element with both classes

# Universal selector
await tab.query("*", find_all=True) # All elements
```

### Combinators

```python
# Descendant combinator (space)
await tab.query("div p")            # First <p> inside <div>
await tab.query("div p", find_all=True)  # All <p> inside <div> (any depth)

# Child combinator (>)
await tab.query("div > p")          # First <p> that is direct child of <div>
await tab.query("div > p", find_all=True)  # All <p> that are direct children

# Adjacent sibling combinator (+)
await tab.query("h1 + p")           # <p> immediately after <h1>

# General sibling combinator (~)
await tab.query("h1 ~ p")           # First <p> sibling after <h1>
await tab.query("h1 ~ p", find_all=True)  # All <p> siblings after <h1>
```

### Attribute Selectors

```python
# Attribute exists
await tab.query("input[required]")                # First input with 'required'
await tab.query("input[required]", find_all=True) # All inputs with 'required'

# Attribute equals
await tab.query("input[type='email']")            # First email input
await tab.query("input[type='email']", find_all=True)  # All email inputs

# Attribute contains word
await tab.query("div[class~='active']")           # First div with 'active' class

# Attribute starts with
await tab.query("a[href^='https://']")            # First HTTPS link
await tab.query("a[href^='https://']", find_all=True)  # All HTTPS links

# Attribute ends with
await tab.query("img[src$='.png']")               # First PNG image
await tab.query("img[src$='.png']", find_all=True)     # All PNG images

# Attribute contains substring
await tab.query("a[href*='example']")             # First link with 'example'
await tab.query("a[href*='example']", find_all=True)   # All links with 'example'

# Case-insensitive matching
await tab.query("input[type='text' i]")           # Case-insensitive match
```

### Pseudo-Classes

```python
# Structural pseudo-classes
await tab.query("li:first-child")                 # First <li> that is first child
await tab.query("li:last-child")                  # First <li> that is last child
await tab.query("li:nth-child(2)")                # First <li> that is 2nd child
await tab.query("li:nth-child(odd)", find_all=True)  # All odd-numbered <li>
await tab.query("li:nth-child(even)", find_all=True)  # All even-numbered <li>
await tab.query("li:nth-child(3n)", find_all=True)    # Every 3rd <li>

# Type-based pseudo-classes
await tab.query("p:first-of-type")                # First <p> among siblings
await tab.query("p:last-of-type")                 # Last <p> among siblings
await tab.query("p:nth-of-type(2)")               # Second <p> among siblings

# State pseudo-classes
await tab.query("input:enabled")                  # First enabled input
await tab.query("input:enabled", find_all=True)   # All enabled inputs
await tab.query("input:disabled")                 # First disabled input
await tab.query("input:checked")                  # First checked checkbox/radio
await tab.query("input:focus")                    # Currently focused input

# Other useful pseudo-classes
await tab.query("div:empty")                      # First empty element
await tab.query("div:empty", find_all=True)       # All empty elements
await tab.query("div:not(.exclude)")              # First div without class
await tab.query("div:not(.exclude)", find_all=True)  # All divs without class
```

## XPath Syntax Reference

### Basic Path Expressions

```python
# Absolute path (from root)
await tab.query("/html/body/div")                 # First div at exact path

# Relative path (from anywhere)
await tab.query("//div")                          # First <div> element
await tab.query("//div", find_all=True)           # All <div> elements
await tab.query("//div/p")                        # First <p> inside any <div>
await tab.query("//div/p", find_all=True)         # All <p> inside any <div>

# Current node
await tab.query("./div")                          # First <div> relative to current

# Parent node
await tab.query("..")                             # Parent of current node
```

### Attribute Selection

```python
# Basic attribute matching
await tab.query("//input[@type='email']")         # First email input
await tab.query("//input[@type='email']", find_all=True)  # All email inputs
await tab.query("//div[@id='content']")           # Div with id='content'

# Multiple attributes
await tab.query("//input[@type='text' and @required]")  # First match
await tab.query("//input[@type='text' and @required]", find_all=True)  # All matches
await tab.query("//div[@class='card' or @class='panel']")  # First card or panel

# Attribute exists
await tab.query("//button[@disabled]")            # First disabled button
await tab.query("//button[@disabled]", find_all=True)  # All disabled buttons
```

## XPath Axes (Directional Navigation)

The real power of XPath comes from its ability to navigate in any direction through the DOM tree.

### Axes Reference Table

| Axis | Direction | Description | Example |
|------|-----------|-------------|---------|
| `child::` | Down | Direct children only | `//div/child::p` |
| `descendant::` | Down | All descendants (any depth) | `//div/descendant::a` |
| `parent::` | Up | Immediate parent | `//input/parent::div` |
| `ancestor::` | Up | All ancestors (any depth) | `//span/ancestor::div` |
| `following-sibling::` | Sideways | Siblings after current | `//h1/following-sibling::p` |
| `preceding-sibling::` | Sideways | Siblings before current | `//p/preceding-sibling::h1` |
| `following::` | Forward | All nodes after current | `//h1/following::*` |
| `preceding::` | Backward | All nodes before current | `//h1/preceding::*` |
| `ancestor-or-self::` | Up | Ancestors + current | `//div/ancestor-or-self::*` |
| `descendant-or-self::` | Down | Descendants + current | `//div/descendant-or-self::*` |
| `self::` | Current | Current node only | `//div/self::div` |
| `attribute::` | Attribute | Attributes of current | `//div/attribute::class` |

!!! info "Shorthand Syntax"
    - `//div` is short for `/descendant-or-self::node()/child::div`
    - `//div/p` is short for `//div/child::p`
    - `@id` is short for `attribute::id`
    - `..` is short for `parent::node()`

### Practical Axis Examples

```python
# Navigate to parent
await tab.query("//input[@name='email']/parent::div")
await tab.query("//span[@class='error']/..")       # Shorthand

# Find ancestor
await tab.query("//input/ancestor::form")          # First ancestor <form>
await tab.query("//button/ancestor::div[@class='modal']")

# Sibling navigation
await tab.query("//label[text()='Email:']/following-sibling::input")
await tab.query("//h2/following-sibling::p[1]")    # First <p> after <h2>
await tab.query("//h2/following-sibling::p", find_all=True)  # All <p> after <h2>
await tab.query("//button/preceding-sibling::input[last()]")

# Complex relationships
await tab.query("//tr/td[1]/following-sibling::td[2]")  # 3rd cell in first row
await tab.query("//tr/td[1]/following-sibling::td[2]", find_all=True)  # 3rd cell in all rows
```

## XPath Functions

### Text Functions

```python
# Exact text match
await tab.query("//button[text()='Submit']")

# Contains text
await tab.query("//p[contains(text(), 'welcome')]")

# Starts with
await tab.query("//a[starts-with(@href, 'https://')]")

# Text normalization (removes extra whitespace)
await tab.query("//button[normalize-space(text())='Submit']")

# String length
await tab.query("//input[string-length(@value) > 5]")

# Concatenation
await tab.query("//div[concat(@data-first, @data-last)='JohnDoe']")
```

### Numeric Functions

```python
# Position matching
await tab.query("//li[position()=1]")              # First <li>
await tab.query("//li[position() > 3]", find_all=True)  # All <li> after 3rd
await tab.query("//li[last()]")                    # Last <li>
await tab.query("//li[last()-1]")                  # Second to last

# Counting
await tab.query("//ul[count(li) > 5]")             # First <ul> with more than 5 items
await tab.query("//ul[count(li) > 5]", find_all=True)  # All <ul> with > 5 items

# Numeric operations
await tab.query("//div[@data-price > 100]")        # First div with price > 100
await tab.query("//div[@data-price > 100]", find_all=True)  # All divs
await tab.query("//div[number(@data-stock) = 0]")  # First with stock = 0
```

### Boolean Functions

```python
# Boolean logic
await tab.query("//div[@visible='true' and @enabled='true']")  # First match
await tab.query("//input[@type='text' or @type='email']")  # First text or email
await tab.query("//input[@type='text' or @type='email']", find_all=True)  # All
await tab.query("//button[not(@disabled)]")        # First enabled button
await tab.query("//button[not(@disabled)]", find_all=True)  # All enabled buttons

# Existence checks
await tab.query("//div[child::p]")                 # First div with <p> children
await tab.query("//div[child::p]", find_all=True)  # All divs with <p> children
await tab.query("//div[not(child::*)]")            # First empty div
await tab.query("//div[not(child::*)]", find_all=True)  # All empty divs
```

## XPath Predicates

Predicates filter node sets using conditions in square brackets `[]`.

```python
# Position predicates
await tab.query("(//div)[1]")                      # First <div> in document
await tab.query("(//div)[last()]")                 # Last <div> in document
await tab.query("//ul/li[3]")                      # First 3rd <li> in a <ul>
await tab.query("//ul/li[3]", find_all=True)       # All 3rd <li> in each <ul>

# Multiple predicates (AND logic)
await tab.query("//input[@type='text'][@required]")  # First match
await tab.query("//div[@class='product'][position() < 4]", find_all=True)  # First 3 per parent

# Attribute predicates
await tab.query("//div[@data-id='123']")
await tab.query("//a[contains(@class, 'button')]")  # First matching link
await tab.query("//input[starts-with(@name, 'user')]")  # First matching input
```

## Real-World Examples: Complex Element Finding

Let's work with a realistic HTML structure to demonstrate advanced selectors.

### Sample HTML Structure

```html
<div class="dashboard">
    <header>
        <h1>User Dashboard</h1>
        <nav class="menu">
            <a href="/home" class="active">Home</a>
            <a href="/profile">Profile</a>
            <a href="/settings">Settings</a>
        </nav>
    </header>
    
    <main>
        <section class="products">
            <h2>Available Products</h2>
            <table id="products-table">
                <thead>
                    <tr>
                        <th>Product Name</th>
                        <th>Price</th>
                        <th>Stock</th>
                        <th>Actions</th>
                    </tr>
                </thead>
                <tbody>
                    <tr data-product-id="101">
                        <td>Laptop</td>
                        <td class="price">$999</td>
                        <td class="stock">15</td>
                        <td>
                            <button class="btn-edit">Edit</button>
                            <button class="btn-delete">Delete</button>
                        </td>
                    </tr>
                    <tr data-product-id="102">
                        <td>Mouse</td>
                        <td class="price">$25</td>
                        <td class="stock">0</td>
                        <td>
                            <button class="btn-edit">Edit</button>
                            <button class="btn-delete" disabled>Delete</button>
                        </td>
                    </tr>
                    <tr data-product-id="103">
                        <td>Keyboard</td>
                        <td class="price">$75</td>
                        <td class="stock">8</td>
                        <td>
                            <button class="btn-edit">Edit</button>
                            <button class="btn-delete">Delete</button>
                        </td>
                    </tr>
                </tbody>
            </table>
        </section>
        
        <section class="user-form">
            <h2>User Information</h2>
            <form id="user-form">
                <div class="form-group">
                    <label for="username">Username:</label>
                    <input type="text" id="username" name="username" required>
                    <span class="error-message" style="display:none;">Invalid username</span>
                </div>
                <div class="form-group">
                    <label for="email">Email:</label>
                    <input type="email" id="email" name="email" required>
                    <span class="error-message" style="display:none;">Invalid email</span>
                </div>
                <div class="form-group">
                    <input type="checkbox" id="newsletter" name="newsletter">
                    <label for="newsletter">Subscribe to newsletter</label>
                </div>
                <button type="submit" class="btn-primary">Save Changes</button>
                <button type="button" class="btn-secondary">Cancel</button>
            </form>
        </section>
    </main>
</div>
```

### Challenge 1: Find Active Navigation Link

**Goal**: Find the currently active navigation link.

```python
# CSS Selector
active_link = await tab.query("nav.menu a.active")

# XPath
active_link = await tab.query("//nav[@class='menu']//a[@class='active']")

# Get its text
text = await active_link.text
print(text)  # "Home"
```

### Challenge 2: Find Edit Button for Specific Product

**Goal**: Find the Edit button for the product "Mouse" (without knowing its row position).

```python
# XPath (recommended for this case)
edit_button = await tab.query(
    "//tr[td[text()='Mouse']]//button[contains(@class, 'btn-edit')]"
)

# Alternative: Using following-sibling
edit_button = await tab.query(
    "//td[text()='Mouse']/following-sibling::td//button[@class='btn-edit']"
)
```

!!! tip "Why XPath Here?"
    CSS selectors can't traverse upward to find the row and then back down to the button. XPath's ability to move freely through the DOM makes this trivial.

### Challenge 3: Find All Products with Price Over $50

**Goal**: Get all table rows where the price is greater than $50.

```python
# XPath with numeric comparison
expensive_products = await tab.query(
    "//tr[number(translate(td[@class='price'], '$,', '')) > 50]",
    find_all=True
)

# More readable version: using contains for simpler cases
# This finds products with price containing specific amounts
products = await tab.query("//tr[contains(td[@class='price'], '$75')]", find_all=True)
```

!!! note "Text to Number Conversion"
    The `translate()` function removes `$` and `,` characters, then `number()` converts to numeric for comparison.

### Challenge 4: Find All Out-of-Stock Products

**Goal**: Find all products where stock is 0.

```python
# XPath
out_of_stock = await tab.query(
    "//tr[td[@class='stock' and text()='0']]",
    find_all=True
)

# Alternative: Find all rows and check stock
rows = await tab.query("//tbody/tr[td[@class='stock']/text()='0']", find_all=True)
```

### Challenge 5: Find Input Field by Its Label

**Goal**: Find the email input by locating its label first.

```python
# XPath: start at the label and step to the input that follows it as a sibling
email_input = await tab.query("//label[text()='Email:']/following-sibling::input")

# Alternative: resolve the label's 'for' attribute to the input's id
email_input = await tab.query("//input[@id=(//label[text()='Email:']/@for)]")

# More generic: match the label by partial text, then take its sibling input
username_input = await tab.query(
    "//label[contains(text(), 'Username')]/following-sibling::input"
)
```

### Challenge 6: Find Error Message Next to Email Field

**Goal**: Get the error message span that appears next to the email input.

```python
# XPath - find error sibling of email input
error_span = await tab.query(
    "//input[@id='email']/following-sibling::span[@class='error-message']"
)

# Alternative: Navigate from parent div
error_span = await tab.query(
    "//input[@id='email']/parent::div//span[@class='error-message']"
)

# Check visibility
is_visible = await error_span.is_visible()
```

### Challenge 7: Find Submit Button (Not Cancel)

**Goal**: Find the submit button, excluding the cancel button.

```python
# CSS Selector (simple)
submit_button = await tab.query("button[type='submit']")
submit_button = await tab.query("button.btn-primary")

# XPath with text
submit_button = await tab.query("//button[text()='Save Changes']")

# XPath excluding others
submit_button = await tab.query(
    "//button[@type='submit' and not(@class='btn-secondary')]"
)
```

### Challenge 8: Find All Required Form Fields

**Goal**: Get all required input fields in the form.

```python
# CSS Selector (clean)
required_fields = await tab.query(
    "#user-form input[required]",
    find_all=True
)

# XPath
required_fields = await tab.query(
    "//form[@id='user-form']//input[@required]",
    find_all=True
)

# Verify
for field in required_fields:
    field_name = await field.get_attribute("name")
    print(f"Required: {field_name}")
```

### Challenge 9: Find First Non-Disabled Delete Button

**Goal**: Find the first delete button that is not disabled.

```python
# CSS Selector
first_enabled_delete = await tab.query("button.btn-delete:not([disabled])")

# XPath
first_enabled_delete = await tab.query(
    "//button[contains(@class, 'btn-delete') and not(@disabled)]"
)

# Get all enabled delete buttons
all_enabled = await tab.query(
    "//button[@class='btn-delete' and not(@disabled)]",
    find_all=True
)
```

### Challenge 10: Find Table Row by Multiple Conditions

**Goal**: Find products with stock > 0 AND price < $100.

```python
# XPath with complex logic
available_affordable = await tab.query(
    """
    //tr[
        number(td[@class='stock']) > 0 
        and 
        number(translate(td[@class='price'], '$', '')) < 100
    ]
    """,
    find_all=True
)

# For each matching product
for row in available_affordable:
    cells = await row.query("td", find_all=True)
    product_name = await cells[0].text
    print(f"Available: {product_name}")
```

### Challenge 11: Navigate Complex Relationships

**Goal**: From a delete button, get the product name in the same row.

```python
# Start with a delete button
delete_button = await tab.query("//tr[@data-product-id='101']//button[@class='btn-delete']")

# Navigate to parent row, then to first cell
product_name_cell = await delete_button.query("./ancestor::tr/td[1]")
product_name = await product_name_cell.text
print(product_name)  # "Laptop"

# Alternative: Get the entire row first
row = await delete_button.query("./ancestor::tr")
product_id = await row.get_attribute("data-product-id")
print(product_id)  # "101"
```

### Challenge 12: Find Checkbox and Its Label Together

**Goal**: Find the newsletter checkbox and verify its label.

```python
# Find checkbox
checkbox = await tab.query("#newsletter")

# Get associated label using 'for' attribute
label = await tab.query("//label[@for='newsletter']")
label_text = await label.text
print(label_text)  # "Subscribe to newsletter"

# Alternative: Navigate from checkbox to label
label = await checkbox.query("//following::label[@for='newsletter']")

# Check if checked
is_checked = await checkbox.is_checked()
```

## Advanced Pattern: Dynamic Selector Building

When dealing with dynamic content, you might need to build selectors programmatically:

```python
async def find_product_by_name(tab, product_name: str):
    """Find a product row by its name dynamically.

    Args:
        tab: Object exposing an awaitable ``query(xpath)`` method.
        product_name: Exact text of the cell to match. May contain single
            and/or double quotes.

    Returns:
        Whatever ``tab.query`` returns for the generated XPath.
    """
    # XPath 1.0 string literals have no escape character, so a backslash
    # cannot neutralize a quote. Instead, delimit the value with whichever
    # quote it does not contain; if it contains both, stitch the pieces
    # together with concat() and a double-quoted apostrophe between them.
    if "'" not in product_name:
        literal = f"'{product_name}'"
    elif '"' not in product_name:
        literal = f'"{product_name}"'
    else:
        apostrophe_arg = ", \"'\", "
        pieces = (f"'{piece}'" for piece in product_name.split("'"))
        literal = f"concat({apostrophe_arg.join(pieces)})"

    xpath = f"//tr[td[text()={literal}]]"
    return await tab.query(xpath)

async def find_table_cell(tab, row_text: str, column_index: int):
    """Find a specific cell by row content and column position.

    Args:
        tab: Object exposing an awaitable ``query(xpath)`` method.
        row_text: Text that some cell of the wanted row must contain. May
            contain single and/or double quotes.
        column_index: Position of the cell within the row. XPath positions
            are 1-based, so ``1`` is the first column.

    Returns:
        Whatever ``tab.query`` returns for the generated XPath.
    """
    # XPath 1.0 string literals have no escape character: delimit the value
    # with a quote it does not contain, or fall back to concat() when it
    # contains both kinds.
    if "'" not in row_text:
        literal = f"'{row_text}'"
    elif '"' not in row_text:
        literal = f'"{row_text}"'
    else:
        apostrophe_arg = ", \"'\", "
        pieces = (f"'{piece}'" for piece in row_text.split("'"))
        literal = f"concat({apostrophe_arg.join(pieces)})"

    xpath = f"//tr[td[contains(text(), {literal})]]/td[{column_index}]"
    return await tab.query(xpath)

# Usage
product_row = await find_product_by_name(tab, "Laptop")
price_cell = await find_table_cell(tab, "Laptop", 2)
price = await price_cell.text
print(price)  # "$999"
```

## Performance Comparison

```python
import asyncio
import time

async def benchmark_selectors(tab, iterations: int = 100):
    """Compare CSS vs XPath performance.

    Runs the same "all product rows" lookup ``iterations`` times with a CSS
    selector and then with an equivalent XPath, and prints both timings.

    Args:
        tab: Object exposing an awaitable ``query(selector, find_all=...)``.
        iterations: Number of queries issued per selector type.
    """
    # Warm up
    await tab.query("#products-table")

    # perf_counter() is monotonic and high-resolution; time.time() can jump
    # with system clock adjustments and is too coarse for short intervals.

    # Benchmark CSS
    start = time.perf_counter()
    for _ in range(iterations):
        await tab.query("#products-table tbody tr", find_all=True)
    css_time = time.perf_counter() - start

    # Benchmark XPath
    start = time.perf_counter()
    for _ in range(iterations):
        await tab.query("//table[@id='products-table']//tbody//tr", find_all=True)
    xpath_time = time.perf_counter() - start

    print(f"CSS: {css_time:.3f}s")
    print(f"XPath: {xpath_time:.3f}s")
    if css_time > 0:
        print(f"CSS is {xpath_time/css_time:.2f}x faster")
    else:
        # Nothing measurable elapsed; a ratio would divide by zero.
        print("CSS time too small to compute a ratio")

# Typical results: CSS is 1.2-1.5x faster for simple selectors
```

!!! warning "Performance vs Readability"
    While CSS selectors are generally faster, the difference is usually negligible (milliseconds) for individual queries. Choose the selector that makes your code more readable and maintainable, especially for complex relationships where XPath excels.

## Selector Best Practices

### 1. Prefer Stable Selectors

```python
# Good: Using semantic attributes
await tab.query("#user-email")
await tab.query("[data-testid='submit-button']")
await tab.query("input[name='username']")

# Avoid: Brittle selectors based on structure
await tab.query("div > div > div:nth-child(3) > input")
await tab.query("body > div:nth-child(2) > form > div:first-child")
```

### 2. Use the Simplest Selector That Works

```python
# Good: Simple and efficient
await tab.query("#login-form")
await tab.query(".submit-button")

# Avoid: Over-complicated when unnecessary
await tab.query("//div[@id='content']/descendant::form[@id='login-form']")
```

### 3. Combine find() and query() Appropriately

```python
# Use find() for simple attribute matching
username = await tab.find(id="username")
submit = await tab.find(tag_name="button", type="submit")

# Use query() for complex patterns
active_link = await tab.query("nav.menu a.active")
error_msg = await tab.query("//input[@name='email']/following-sibling::span[@class='error']")
```

### 4. Add Comments for Complex Selectors

```python
# Find the "Edit" button in the row containing product "Laptop"
# XPath: Navigate to row with "Laptop" text, then find edit button
edit_button = await tab.query(
    "//tr[td[text()='Laptop']]//button[@class='btn-edit']"
)
```

## Conclusion

By understanding both CSS selectors and XPath, along with their respective strengths and use cases, you can create robust and maintainable browser automation that handles the complexities of modern web applications. Remember:

- **Use CSS selectors** for simple, performance-critical selections
- **Use XPath** for complex relationships, text matching, and upward navigation
- **Choose stability** over brevity when writing selectors
- **Comment complex queries** to maintain code readability

For more information about how these selectors are used internally by Pydoll, see the [FindElements Mixin](../architecture/find-elements-mixin.md) documentation.


================================================
FILE: docs/en/deep-dive/index.md
================================================
# Deep Dive: Technical Foundation

**Welcome to the technical heart of Pydoll, where we explore the systems and protocols that power browser automation.**

This section provides comprehensive technical education on web scraping, browser automation, network protocols, and anti-detection techniques. Rather than focusing solely on usage patterns, we explore the underlying mechanisms, from the first TCP packet to the final rendered pixel.

## What Makes This Different

Most automation documentation teaches you **how to use a tool**. This section teaches you **how the internet actually works**, and how to manipulate it at every layer:

- **Network protocols** (TCP/IP, TLS, HTTP/2) - The invisible foundation of every request
- **Browser internals** (CDP, rendering engines, JavaScript contexts) - What happens inside Chrome
- **Detection systems** (fingerprinting, behavioral analysis, proxy detection) - How websites identify bots
- **Evasion techniques** (CDP overrides, consistency enforcement, human mimicry) - How to become undetectable

!!! quote "Philosophy"
    **"Any sufficiently advanced technology is indistinguishable from magic."**
    
    This section aims to demystify browser automation by explaining the underlying systems. Understanding these fundamentals provides better control and predictability in your automation work.

## The Architecture of Knowledge

This section is organized into **five progressive layers**, each building on the previous:

### Core Fundamentals
**[→ Explore Fundamentals](./fundamentals/cdp.md)**

Start at the foundation: understand the protocols and systems that power Pydoll.

- **[Chrome DevTools Protocol](./fundamentals/cdp.md)** - How Pydoll talks to browsers, bypassing WebDriver
- **[Connection Layer](./fundamentals/connection-layer.md)** - WebSocket architecture, async patterns, real-time CDP
- **[Python Type System](./fundamentals/typing-system.md)** - Type safety, TypedDict for CDP, IDE integration

**Why start here**: Understanding CDP and async communication provides the foundation for comprehending all other aspects of browser automation.

---

### Internal Architecture
**[→ Explore Architecture](./architecture/browser-domain.md)**

Climb to the next level: understand how Pydoll's internal components work together.

- **[Browser Domain](./architecture/browser-domain.md)** - Process management, contexts, multi-profile automation
- **[Tab Domain](./architecture/tab-domain.md)** - Tab lifecycle, concurrent operations, iframe handling
- **[WebElement Domain](./architecture/webelement-domain.md)** - Element interactions, shadow DOM, attribute handling
- **[FindElements Mixin](./architecture/find-elements-mixin.md)** - Selector strategies, DOM traversal, optimization
- **[Event Architecture](./architecture/event-architecture.md)** - Reactive event system, callbacks, async dispatch
- **[Browser Requests Architecture](./architecture/browser-requests-architecture.md)** - HTTP in browser context

**Why this matters**: Understanding internal architecture reveals optimization opportunities and design patterns that aren't apparent from surface-level usage.

---

### Network & Security
**[→ Explore Network & Security](./network/index.md)**

Drop down to the protocol layer: understand how data flows across the internet.

- **[Network Fundamentals](./network/network-fundamentals.md)** - OSI model, TCP/UDP, WebRTC leakage
- **[HTTP/HTTPS Proxies](./network/http-proxies.md)** - Application-layer proxying, CONNECT tunneling
- **[SOCKS Proxies](./network/socks-proxies.md)** - Session-layer proxying, UDP support, security
- **[Proxy Detection](./network/proxy-detection.md)** - Anonymity levels, detection techniques, evasion
- **[Building Proxy Servers](./network/build-proxy.md)** - Full HTTP & SOCKS5 implementations
- **[Legal & Ethical](./network/proxy-legal.md)** - GDPR, CFAA, compliance, responsible usage

**Critical insight**: Network characteristics are determined at the OS level. Mismatches between claimed browser identity and network-level fingerprints can be detected by sophisticated anti-bot systems.

---

### Fingerprinting
**[→ Explore Fingerprinting](./fingerprinting/index.md)**

Understanding detection systems and evasion techniques for browser automation.

- **[Network Fingerprinting](./fingerprinting/network-fingerprinting.md)** - TCP/IP, TLS/JA3, p0f, Nmap, Scapy
- **[Browser Fingerprinting](./fingerprinting/browser-fingerprinting.md)** - HTTP/2, Canvas, WebGL, JavaScript APIs
- **[Evasion Techniques](./fingerprinting/evasion-techniques.md)** - CDP overrides, consistency, practical code

**Key insight**: Every connection reveals numerous characteristics (canvas rendering, TCP window size, TLS cipher order). Effective stealth requires consistency across all detection layers.

---

### Practical Guides
**[→ Explore Guides](./guides/selectors-guide.md)**

Apply your knowledge: practical guides for common automation challenges.

- **[CSS Selectors vs XPath](./guides/selectors-guide.md)** - Selector syntax, performance, best practices

**Coming soon**: More practical guides synthesizing the technical knowledge into actionable patterns.

---

## Learning Paths

Different goals require different knowledge. Choose your path:

### Path 1: Stealth Automation
**Goal: Build undetectable scrapers**

1. **[Fingerprinting Overview](./fingerprinting/index.md)** - Understand the detection landscape
2. **[Network Fingerprinting](./fingerprinting/network-fingerprinting.md)** - TCP/IP, TLS signatures
3. **[Browser Fingerprinting](./fingerprinting/browser-fingerprinting.md)** - Canvas, WebGL, HTTP/2
4. **[Evasion Techniques](./fingerprinting/evasion-techniques.md)** - CDP-based countermeasures
5. **[Network & Security](./network/index.md)** - Proxy selection and configuration
6. **[Browser Domain](./architecture/browser-domain.md)** - Context isolation, process management

**Time investment**: 12-16 hours of deep technical learning  
**Payoff**: Ability to bypass sophisticated anti-bot systems

---

### Path 2: Architecture Mastery
**Goal: Contribute to Pydoll or build similar tools**

1. **[CDP Deep Dive](./fundamentals/cdp.md)** - Protocol fundamentals
2. **[Connection Layer](./fundamentals/connection-layer.md)** - WebSocket async patterns
3. **[Event Architecture](./architecture/event-architecture.md)** - Event-driven design
4. **[Browser Domain](./architecture/browser-domain.md)** - Browser management
5. **[Tab Domain](./architecture/tab-domain.md)** - Tab lifecycle
6. **[WebElement Domain](./architecture/webelement-domain.md)** - Element interaction
7. **[Python Type System](./fundamentals/typing-system.md)** - Type safety integration

**Time investment**: 16-20 hours of architectural study  
**Payoff**: Deep understanding of browser automation internals

---

### Path 3: Network Engineering
**Goal: Master proxies, fingerprinting, and network-level stealth**

1. **[Network Fundamentals](./network/network-fundamentals.md)** - OSI model, TCP/UDP, WebRTC
2. **[Network Fingerprinting](./fingerprinting/network-fingerprinting.md)** - TCP/IP signatures, TLS/JA3
3. **[HTTP/HTTPS Proxies](./network/http-proxies.md)** - Application-layer proxying
4. **[SOCKS Proxies](./network/socks-proxies.md)** - Session-layer proxying
5. **[Proxy Detection](./network/proxy-detection.md)** - Anonymity and evasion
6. **[Building Proxy Servers](./network/build-proxy.md)** - Implementation from scratch

**Time investment**: 14-18 hours of network protocol study  
**Payoff**: Complete understanding of network-level anonymity and detection

---

## Prerequisites

This is advanced, technical material. Recommended prerequisites include:

- **Python fundamentals** - Classes, async/await, context managers, decorators
- **Basic networking** - IP addresses, ports, HTTP protocol
- **Pydoll basics** - See [Features](../features/core-concepts.md) and [Getting Started](../index.md)
- **Browser DevTools** - Chrome Inspector, Network tab, Console  

**If you're new to these**, we recommend:

1. Complete the [Features](../features/index.md) section first
2. Practice basic automation with Pydoll
3. Return here when you need deeper understanding

## The Philosophy of Mastery

Web automation involves multiple areas of expertise:

- **Protocol engineering** - Understanding TCP/IP, TLS, HTTP/2
- **Systems programming** - Managing processes, async I/O, WebSockets
- **Security research** - Fingerprinting, detection, evasion
- **Browser internals** - Rendering, JavaScript contexts, CDP
- **Operational security** - Legal compliance, ethical guidelines

Most developers learn these independently, over time. This section consolidates that knowledge by:

1. **Centralizing knowledge** - No more scattered blog posts and academic papers
2. **Providing context** - Every technique explained from first principles
3. **Offering working code** - All examples are production-ready
4. **Citing sources** - Every claim backed by RFCs, documentation, or research
5. **Progressive complexity** - Each section builds on previous knowledge

## Documentation Standards

This documentation represents extensive research, testing, and validation:

- Every protocol detail verified against RFCs
- Every fingerprinting technique tested in production
- Every code example runs without modification
- Every claim cited with authoritative sources
- Every diagram generated from real system behavior

Technical accuracy and practical applicability are prioritized throughout.

## Ethical Use

With this knowledge comes responsibility:

!!! danger "Use Responsibly"
    The techniques described here can serve legitimate automation or malicious purposes. Responsible use includes:
    
    - Respecting website terms of service and robots.txt
    - Implementing rate limiting and respectful crawling
    - Considering whether automation is truly necessary
    - Consulting legal counsel when uncertain
    - Being transparent about your automation when appropriate
    
    Avoid using this knowledge for:

    - Fraud, account abuse, or illegal activities
    - Overwhelming servers with aggressive scraping
    - Harmful activities without understanding consequences  

For detailed guidance, see **[Legal & Ethical Considerations](./network/proxy-legal.md)**.

## Contributing

Found an error? Have a suggestion? See something outdated?

This documentation is a **living project**. Fingerprinting techniques evolve, protocols update, and new evasion methods emerge. We welcome contributions that:

- Correct technical inaccuracies
- Add new fingerprinting techniques
- Update protocol information
- Improve code examples
- Expand coverage of detection systems

See [Contributing](../CONTRIBUTING.md) for guidelines.

---

## Getting Started

Choose a path based on your goals:

**New to deep technical content?**  
→ Start with **[Chrome DevTools Protocol](./fundamentals/cdp.md)** to understand Pydoll's foundation

**Need stealth automation?**  
→ Jump to **[Fingerprinting](./fingerprinting/index.md)** for detection and evasion techniques

**Want network-level control?**  
→ Explore **[Network & Security](./network/index.md)** for proxy architecture and protocols

**Building automation infrastructure?**  
→ Study **[Internal Architecture](./architecture/browser-domain.md)** for design patterns

**Just want to browse?**  
→ Pick any topic from the sidebar; each article is self-contained

---

!!! success "Technical Deep Dive"
    This section provides comprehensive technical knowledge for browser automation, from fundamental protocols to advanced evasion techniques.
    
    Explore at your own pace.


================================================
FILE: docs/en/deep-dive/network/build-proxy.md
================================================
# Building Proxy Servers

This document implements HTTP and SOCKS5 proxy servers from scratch in Python using asyncio. The goal is not production readiness but protocol comprehension: seeing how each byte is parsed, where security boundaries lie, and why certain design decisions exist in real proxy software.

!!! info "Module Navigation"
    - [Network Fundamentals](./network-fundamentals.md): TCP/IP, UDP, WebRTC
    - [HTTP/HTTPS Proxies](./http-proxies.md): Application-layer proxying
    - [SOCKS Proxies](./socks-proxies.md): Session-layer proxying
    - [Proxy Detection](./proxy-detection.md): Detection techniques and evasion

    For practical proxy usage in Pydoll, see [Proxy Configuration](../../features/configuration/proxy.md).

!!! warning "Educational Code"
    These implementations prioritize clarity over robustness. They lack connection limits, access control lists, and many error recovery paths that a production proxy requires. Do not expose them to untrusted networks.

## HTTP Proxy

An HTTP proxy operates in two modes. For plaintext HTTP, it receives the full request (with an absolute-form URL like `GET http://example.com/path HTTP/1.1`), rewrites the request-target to origin-form (`GET /path HTTP/1.1`), connects to the target server, forwards the request, and pipes the response back. For HTTPS, the client sends a `CONNECT host:port` request, the proxy opens a TCP connection to the target, responds with `200 Connection Established`, and then blindly relays bytes in both directions without inspecting the encrypted content.

The implementation below handles both modes. A few things to note as you read through it. The `_pipe` method calls `write_eof()` when one side closes, which sends a TCP FIN to the other side. Without this, the tunnel hangs indefinitely because the other `read()` never returns empty bytes. The HTTP forwarding path uses the same piping approach rather than a single `read()` call, because HTTP responses can be arbitrarily large and a fixed-size read would silently truncate them. The request-target rewrite preserves query strings, which `urlparse().path` alone would drop.

```python
import asyncio
import base64
import contextlib
import logging
from urllib.parse import urlparse

logger = logging.getLogger(__name__)


class HTTPProxy:
    """Async HTTP/HTTPS proxy with optional Basic authentication.

    Plaintext requests are rewritten from absolute-form to origin-form and
    forwarded to the target; CONNECT requests are turned into a blind TCP
    tunnel. Authentication is enforced only when ``username`` is set.
    """

    # Headers scoped to a single hop (or addressed to this proxy) that must
    # not be forwarded to the origin server.
    HOP_BY_HOP = frozenset({
        'proxy-authorization', 'proxy-connection',
        'connection', 'keep-alive', 'te', 'trailer', 'upgrade',
    })

    def __init__(self, host='0.0.0.0', port=8080, username=None, password=None):
        self.host = host
        self.port = port
        self.username = username
        self.password = password

    async def start(self):
        """Bind the listening socket and serve clients until cancelled."""
        server = await asyncio.start_server(
            self._handle_client, self.host, self.port
        )
        logger.info(f'HTTP proxy listening on {self.host}:{self.port}')
        async with server:
            await server.serve_forever()

    async def _handle_client(self, reader, writer):
        """Serve one client connection: parse, authenticate, dispatch."""
        try:
            request_line = await asyncio.wait_for(
                reader.readline(), timeout=30
            )
            if not request_line:
                return

            # A request line is exactly "METHOD target HTTP-version".
            parts = request_line.decode('latin-1').split()
            if len(parts) != 3:
                writer.write(b'HTTP/1.1 400 Bad Request\r\n\r\n')
                await writer.drain()
                return

            method, url, _ = parts
            headers = await self._read_headers(reader)

            if not self._check_auth(headers):
                writer.write(
                    b'HTTP/1.1 407 Proxy Authentication Required\r\n'
                    b'Proxy-Authenticate: Basic realm="Proxy"\r\n'
                    b'Content-Length: 0\r\n\r\n'
                )
                await writer.drain()
                return

            if method == 'CONNECT':
                await self._handle_connect(url, reader, writer)
            else:
                await self._handle_http(method, url, headers, reader, writer)
        except Exception as e:
            # Top-level boundary for this connection: log and drop it.
            logger.error(f'Client handler error: {e}')
        finally:
            await self._close(writer)

    @staticmethod
    async def _close(writer):
        """Close a stream writer, tolerating a peer that is already gone."""
        writer.close()
        # wait_closed() re-raises the connection error that killed the
        # transport; during cleanup that is not worth propagating.
        with contextlib.suppress(OSError):
            await writer.wait_closed()

    async def _read_headers(self, reader):
        """Read header lines up to the blank line.

        Returns a dict keyed by lower-cased header name. A repeated header
        keeps only its last value.
        """
        headers = {}
        while True:
            line = await reader.readline()
            if line in (b'\r\n', b'\n', b''):
                break
            if b':' in line:
                key, value = line.decode('latin-1').split(':', 1)
                headers[key.strip().lower()] = value.strip()
        return headers

    def _check_auth(self, headers):
        """Return True when the request may proceed.

        Always True if no username is configured; otherwise the
        ``proxy-authorization`` header must carry matching Basic credentials.
        """
        if not self.username:
            return True
        auth = headers.get('proxy-authorization', '')
        if not auth.startswith('Basic '):
            return False
        try:
            decoded = base64.b64decode(auth[6:]).decode('utf-8')
            if ':' not in decoded:
                return False
            user, pwd = decoded.split(':', 1)
            return user == self.username and pwd == self.password
        except Exception:
            # Malformed Base64 / non-UTF-8 payload counts as a failed login.
            return False

    @staticmethod
    def _parse_connect_target(target):
        """Split a CONNECT authority into ``(host, port)``.

        Accepts ``host:port`` and bracketed IPv6 literals like ``[::1]:443``.
        Returns ``None`` when the host or port is missing, the port is not
        a plain decimal number, or it is outside 1-65535.
        """
        if target.startswith('['):
            host, sep, port_str = target[1:].partition(']:')
        else:
            host, sep, port_str = target.rpartition(':')
        if not (sep and host and port_str.isascii() and port_str.isdigit()):
            return None
        port = int(port_str)
        if not 0 < port < 65536:
            return None
        return host, port

    async def _handle_connect(self, target, client_reader, client_writer):
        """Establish a blind TCP tunnel for HTTPS."""
        endpoint = self._parse_connect_target(target)
        if endpoint is None:
            client_writer.write(b'HTTP/1.1 400 Bad Request\r\n\r\n')
            await client_writer.drain()
            return
        host, port = endpoint

        try:
            server_reader, server_writer = await asyncio.open_connection(
                host, port
            )
        except OSError as e:
            logger.error(f'CONNECT failed to {host}:{port}: {e}')
            client_writer.write(b'HTTP/1.1 502 Bad Gateway\r\n\r\n')
            await client_writer.drain()
            return

        try:
            client_writer.write(b'HTTP/1.1 200 Connection Established\r\n\r\n')
            await client_writer.drain()

            # One relay per direction; each half-closes its destination
            # when its source reaches EOF.
            await asyncio.gather(
                self._pipe(client_reader, server_writer),
                self._pipe(server_reader, client_writer),
            )
        finally:
            # The client side is closed by _handle_client; the upstream
            # socket is owned here and must not be leaked.
            await self._close(server_writer)

    @classmethod
    def _build_forward_request(cls, method, path, host, port, headers):
        """Serialize the origin-form request line and headers as bytes.

        Emits exactly one Host header (rebuilt from ``host``/``port``), drops
        hop-by-hop headers, and forces ``Connection: close``.
        """
        # An IPv6 literal must be bracketed inside an authority.
        authority = f'[{host}]' if ':' in host else host
        # Host header must include the port if it is non-standard
        if port != 80:
            authority += f':{port}'

        lines = [f'{method} {path} HTTP/1.1', f'Host: {authority}']
        lines += [
            f'{key}: {value}'
            for key, value in headers.items()
            # The client's own Host header is replaced by the one above;
            # forwarding it too would send a duplicate Host field.
            if key != 'host' and key not in cls.HOP_BY_HOP
        ]
        # Force Connection: close so the server does not keep-alive,
        # which would prevent the response stream from ending
        lines.append('Connection: close')
        return ('\r\n'.join(lines) + '\r\n\r\n').encode('latin-1')

    async def _handle_http(self, method, url, headers, client_reader, client_writer):
        """Forward a plaintext HTTP request."""
        try:
            parsed = urlparse(url)
            host = parsed.hostname
            port = parsed.port or 80
            content_length = int(headers.get('content-length', 0))
        except ValueError:
            # Bad IPv6 literal, bad port, or non-numeric Content-Length.
            host = None
        if not host:
            # Also covers origin-form targets ("GET /path"), which carry no
            # host; a None host must never be handed to open_connection.
            client_writer.write(b'HTTP/1.1 400 Bad Request\r\n\r\n')
            await client_writer.drain()
            return

        # Preserve query string in the request-target
        path = parsed.path or '/'
        if parsed.query:
            path += f'?{parsed.query}'

        try:
            server_reader, server_writer = await asyncio.open_connection(
                host, port
            )
        except OSError as e:
            logger.error(f'HTTP forward failed to {host}:{port}: {e}')
            client_writer.write(b'HTTP/1.1 502 Bad Gateway\r\n\r\n')
            await client_writer.drain()
            return

        try:
            server_writer.write(
                self._build_forward_request(method, path, host, port, headers)
            )

            # Forward request body if present
            if content_length > 0:
                body = await client_reader.readexactly(content_length)
                server_writer.write(body)

            await server_writer.drain()

            # Pipe the entire response back (not a single fixed-size read)
            while True:
                chunk = await server_reader.read(65536)
                if not chunk:
                    break
                client_writer.write(chunk)
                await client_writer.drain()
        finally:
            # Release the upstream socket even if relaying failed midway.
            await self._close(server_writer)

    async def _pipe(self, reader, writer):
        """Relay bytes one way, from reader to writer, then half-close."""
        try:
            while True:
                data = await reader.read(8192)
                if not data:
                    break
                writer.write(data)
                await writer.drain()
        except OSError:
            # Covers ConnectionResetError and BrokenPipeError: the peer
            # went away, so this direction is simply finished.
            pass
        finally:
            # Signal EOF to the destination so its read() can return b''.
            with contextlib.suppress(Exception):
                if writer.can_write_eof():
                    writer.write_eof()

A few protocol details worth understanding. HTTP headers are encoded as ISO-8859-1 (Latin-1), not UTF-8. Latin-1 maps every byte value 0-255 to a character, so `decode('latin-1')` never raises a `UnicodeDecodeError`, while `decode('utf-8')` would crash on certain header values. The `Proxy-Authorization` header uses Base64 encoding, but Base64 is not encryption: the credentials travel in cleartext (or rather, trivially reversible encoding) unless the connection between client and proxy is itself protected by TLS. The hop-by-hop headers (`Connection`, `Keep-Alive`, `TE`, `Trailer`, `Upgrade`, `Proxy-Connection`) are meant for the immediate connection between two nodes, not for end-to-end forwarding. RFC 9110 Section 7.6.1 requires proxies to strip them before forwarding.

!!! warning "SSRF Risk"
    This implementation does not validate destination addresses. A client could request `CONNECT 127.0.0.1:6379` to reach a local Redis instance, or `CONNECT 169.254.169.254:80` to access cloud instance metadata (AWS, GCP, Azure). Any proxy exposed to untrusted clients must validate destinations against a deny list of private and link-local ranges (`127.0.0.0/8`, `10.0.0.0/8`, `172.16.0.0/12`, `192.168.0.0/16`, `169.254.0.0/16`, `::1`, `fc00::/7`).

## SOCKS5 Proxy

A SOCKS5 proxy operates at a lower level than HTTP. It uses a binary protocol defined in RFC 1928, consisting of three phases: method negotiation, optional authentication, and the connection request. The proxy does not parse HTTP at all. Once the tunnel is established, it relays raw bytes without understanding what protocol flows through it.

The binary nature of SOCKS5 means every read must receive exactly the expected number of bytes. TCP is a stream protocol and does not guarantee that `read(4)` returns 4 bytes: it may return 1, 2, or 3 bytes depending on network conditions. The implementation below uses `readexactly()` from asyncio, which buffers internally until the requested number of bytes arrives or the connection closes (raising `IncompleteReadError`).

```python
import asyncio
import contextlib
import struct
import logging

logger = logging.getLogger(__name__)


class SOCKS5Proxy:
    """Async SOCKS5 proxy supporting CONNECT with optional auth (RFC 1928).

    Each client connection goes through three phases: method negotiation,
    optional username/password authentication (RFC 1929), and the CONNECT
    request. After a successful CONNECT the proxy relays raw bytes in both
    directions until either side closes.

    Args:
        host: Interface to listen on.
        port: TCP port to listen on.
        username: When set, clients must authenticate with method 0x02.
        password: Password expected alongside ``username``.
    """

    VERSION = 0x05

    def __init__(self, host='0.0.0.0', port=1080, username=None, password=None):
        self.host = host
        self.port = port
        self.username = username
        self.password = password

    async def start(self):
        """Bind the listening socket and serve clients until cancelled."""
        server = await asyncio.start_server(
            self._handle_client, self.host, self.port
        )
        logger.info(f'SOCKS5 proxy listening on {self.host}:{self.port}')
        async with server:
            await server.serve_forever()

    async def _handle_client(self, reader, writer):
        """Run the three SOCKS5 phases for one client, then close its socket."""
        try:
            if not await self._negotiate_method(reader, writer):
                return
            if self.username and not await self._authenticate(reader, writer):
                return
            await self._handle_request(reader, writer)
        except (asyncio.IncompleteReadError, ConnectionResetError):
            # The client went away mid-handshake; nothing useful to report.
            pass
        except Exception as e:
            logger.error(f'SOCKS5 error: {e}')
        finally:
            writer.close()
            # wait_closed() re-raises transport errors (e.g. a reset peer);
            # they must not escape the connection callback.
            with contextlib.suppress(Exception):
                await writer.wait_closed()

    async def _negotiate_method(self, reader, writer):
        """Phase 1: client offers authentication methods, server picks one.

        Returns:
            True when a mutually supported method was selected, False when
            the client speaks another protocol version or did not offer the
            method this server requires (in which case 0xFF is sent).
        """
        version = (await reader.readexactly(1))[0]
        if version != self.VERSION:
            return False

        nmethods = (await reader.readexactly(1))[0]
        methods = await reader.readexactly(nmethods)

        # 0x02 = username/password, 0x00 = no authentication.
        required = 0x02 if self.username else 0x00
        if required not in methods:
            # RFC 1928: 0xFF means "no acceptable methods". The server must
            # not select a method the client did not offer.
            writer.write(bytes([self.VERSION, 0xFF]))
            await writer.drain()
            return False

        writer.write(bytes([self.VERSION, required]))
        await writer.drain()
        return True

    async def _authenticate(self, reader, writer):
        """Phase 2: username/password sub-negotiation (RFC 1929).

        Returns:
            True when the supplied credentials match, False otherwise.
        """
        auth_ver = (await reader.readexactly(1))[0]
        if auth_ver != 0x01:
            return False

        ulen = (await reader.readexactly(1))[0]
        username = await reader.readexactly(ulen)
        plen = (await reader.readexactly(1))[0]
        password = await reader.readexactly(plen)

        # Compare raw bytes in constant time: avoids leaking how many
        # leading characters matched, and avoids a decode error on
        # non-UTF-8 input from an untrusted client.
        user_ok = hmac.compare_digest(
            username, (self.username or '').encode('utf-8')
        )
        pass_ok = hmac.compare_digest(
            password, (self.password or '').encode('utf-8')
        )
        # A proxy configured without a password never authenticates anyone.
        ok = user_ok and pass_ok and self.password is not None

        writer.write(bytes([0x01, 0x00 if ok else 0x01]))
        await writer.drain()
        return ok

    async def _handle_request(self, reader, writer):
        """Phase 3: parse the CONNECT request and establish the tunnel."""
        version, command, _, atyp = await reader.readexactly(4)
        if version != self.VERSION:
            await self._reply(writer, 0x01)  # General failure
            return

        # Parse destination address based on address type
        if atyp == 0x01:  # IPv4
            address = str(ipaddress.IPv4Address(await reader.readexactly(4)))
        elif atyp == 0x03:  # Domain name
            length = (await reader.readexactly(1))[0]
            raw_name = await reader.readexactly(length)
            try:
                address = raw_name.decode('ascii')
            except UnicodeDecodeError:
                await self._reply(writer, 0x01)  # General failure
                return
        elif atyp == 0x04:  # IPv6
            address = str(ipaddress.IPv6Address(await reader.readexactly(16)))
        else:
            await self._reply(writer, 0x08)  # Address type not supported
            return

        port = struct.unpack('!H', await reader.readexactly(2))[0]

        if command != 0x01:  # Only CONNECT is implemented
            await self._reply(writer, 0x07)  # Command not supported
            return

        logger.info(f'SOCKS5 CONNECT {address}:{port}')

        try:
            server_reader, server_writer = await asyncio.open_connection(
                address, port
            )
        except ConnectionRefusedError:
            await self._reply(writer, 0x05)  # Connection refused
            return
        except OSError:
            await self._reply(writer, 0x04)  # Host unreachable
            return

        try:
            # BND.ADDR and BND.PORT should reflect the local socket address.
            # Most clients ignore these for CONNECT, but filling them
            # correctly satisfies RFC 1928.
            local = server_writer.get_extra_info('sockname') or ('0.0.0.0', 0)
            await self._reply(writer, 0x00, local[0], local[1])

            await asyncio.gather(
                self._pipe(reader, server_writer),
                self._pipe(server_reader, writer),
            )
        finally:
            # The client socket is closed by _handle_client; the upstream
            # socket is owned here and must be released explicitly.
            server_writer.close()
            with contextlib.suppress(Exception):
                await server_writer.wait_closed()

    async def _reply(self, writer, status, bind_addr='0.0.0.0', bind_port=0):
        """Send a SOCKS5 reply with the given status and bound address.

        Args:
            writer: Stream to the SOCKS5 client.
            status: REP field (0x00 success, otherwise an RFC 1928 error).
            bind_addr: Textual IPv4 or IPv6 address for BND.ADDR. Anything
                that is not a valid IP literal is sent as ``0.0.0.0``.
            bind_port: Port for BND.PORT.
        """
        try:
            bound = ipaddress.ip_address(bind_addr)
        except ValueError:
            bound = ipaddress.IPv4Address('0.0.0.0')
        # ATYP must match the length of BND.ADDR: 4 bytes (0x01) or 16 (0x04).
        atyp = 0x04 if bound.version == 6 else 0x01

        writer.write(
            bytes([self.VERSION, status, 0x00, atyp])
            + bound.packed
            + struct.pack('!H', bind_port & 0xFFFF)
        )
        await writer.drain()

    async def _pipe(self, reader, writer):
        """Copy bytes from reader to writer until EOF, then half-close."""
        try:
            while True:
                data = await reader.read(8192)
                if not data:
                    break
                writer.write(data)
                await writer.drain()
        except OSError:
            # Covers ConnectionResetError and BrokenPipeError as well.
            pass
        finally:
            # Signal EOF so the opposite direction can finish draining.
            with contextlib.suppress(Exception):
                if writer.can_write_eof():
                    writer.write_eof()

When the address type is `0x03` (domain name), the proxy resolves DNS itself via `asyncio.open_connection()`. This is the defining privacy property of SOCKS5 proxying: the client sends the domain name rather than resolving it locally, which prevents DNS queries from leaking to the client's local network. This is the same behavior Chrome relies on when configured with `--proxy-server=socks5://...`, as discussed in [SOCKS Proxies](./socks-proxies.md).

The `_reply` method fills `BND.ADDR` and `BND.PORT` with the actual local socket address after a successful connection, as RFC 1928 requires. Many SOCKS5 implementations return `0.0.0.0:0` here because most clients ignore these fields for CONNECT commands, but filling them correctly costs nothing and avoids a protocol violation.

## Running Both Proxies

```python
async def main():
    """Run the HTTP proxy (8080) and SOCKS5 proxy (1080) concurrently."""
    credentials = {'username': 'user', 'password': 'pass'}
    proxies = (
        HTTPProxy(port=8080, **credentials),
        SOCKS5Proxy(port=1080, **credentials),
    )
    # Both servers block in serve_forever(), so they must run side by side.
    await asyncio.gather(*[proxy.start() for proxy in proxies])

# asyncio.run(main())
```

You can test them with curl:

```bash
# HTTP proxy
curl -x http://user:pass@localhost:8080 http://httpbin.org/ip

# HTTPS through HTTP proxy (CONNECT tunnel)
curl -x http://user:pass@localhost:8080 https://httpbin.org/ip

# SOCKS5 proxy
curl --socks5 localhost:1080 --proxy-user user:pass https://httpbin.org/ip
```

## What the Code Does Not Handle

These implementations omit several things that production proxies handle. Understanding what is missing is as instructive as understanding what is present.

There are no connection limits. `asyncio.start_server` accepts connections without bound, so a single client opening thousands of connections would exhaust file descriptors. Production proxies use semaphores or connection pools to cap concurrency.

There is no destination validation. Both proxies connect to whatever address the client requests, including `127.0.0.1`, `169.254.169.254` (cloud metadata), and internal network ranges. This is a Server-Side Request Forgery (SSRF) vector. Production proxies maintain deny lists of private and link-local address ranges.

There is no traffic logging or metrics. Production proxies track request counts, bytes transferred, error rates, and latency percentiles, typically exporting to Prometheus or similar systems.

The HTTP proxy does not add a `Via` header. RFC 9110 Section 7.6.3 requires intermediaries to append a `Via` field to forwarded messages. This was omitted for simplicity, but a standards-compliant proxy must include it.

Neither proxy implements graceful shutdown. When the server stops, active tunnels are terminated abruptly rather than being drained. Production proxies track active connections and wait for them to complete (with a deadline) before shutting down.

## Proxy Chaining

Chaining proxies means routing traffic through multiple proxies in sequence: client to proxy A, proxy A to proxy B, proxy B to the target server. Each proxy in the chain only knows its immediate neighbors, not the full path.

The main use case is distributing trust. If you do not fully trust any single proxy provider, chaining two providers means neither one sees both your real IP and your destination. The tradeoff is latency: each hop adds its own connection setup time and forwarding delay. A single proxy typically adds 50 to 100ms of overhead. Two proxies roughly double that, and three proxies can push total overhead past 300ms.

Beyond two hops, the marginal privacy gain diminishes while latency and failure probability increase. Most practical setups use one or two proxies. Tor uses three relays (guard, middle, exit) because its threat model assumes some relays are compromised, but Tor accepts the latency penalty as an explicit design tradeoff.

```
Client --> Proxy A (SOCKS5) --> Proxy B (SOCKS5) --> Target
           sees: client IP          sees: Proxy A IP
           sees: Proxy B addr       sees: target addr
```

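Chaining a SOCKS5 proxy through another SOCKS5 proxy works by having proxy A treat proxy B as the target. The client connects to proxy A and sends a CONNECT request for proxy B's address. Once that tunnel is established, the client sends a second SOCKS5 handshake through the tunnel, this time requesting the real target. Proxy A sees traffic flowing to proxy B but cannot read the application data if the inner connection is encrypted (for example, TLS to the target). Note that SOCKS5 itself provides no encryption, so the inner handshake, including the real target address, is visible to proxy A unless the hop to proxy B is wrapped in an encrypted transport such as TLS or an SSH tunnel.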

## References

- RFC 1928: SOCKS Protocol Version 5 - https://datatracker.ietf.org/doc/html/rfc1928
- RFC 1929: Username/Password Authentication for SOCKS V5 - https://datatracker.ietf.org/doc/html/rfc1929
- RFC 9110: HTTP Semantics - https://www.rfc-editor.org/rfc/rfc9110.html
- RFC 9112: HTTP/1.1 - https://www.rfc-editor.org/rfc/rfc9112.html
- OWASP SSRF Prevention Cheat Sheet - https://cheatsheetseries.owasp.org/cheatsheets/Server_Side_Request_Forgery_Prevention_Cheat_Sheet.html
- mitmproxy (Python HTTPS intercepting proxy) - https://mitmproxy.org/


================================================
FILE: docs/en/deep-dive/network/http-proxies.md
================================================
# HTTP/HTTPS Proxy Architecture

HTTP proxies are the most common proxy protocol on the internet. Nearly every corporate network uses them, and most commercial proxy services offer them as the default option. They operate at Layer 7 (Application) of the OSI model, which means they understand HTTP and can parse, modify, cache, and filter traffic. This same deep integration with the protocol is also their biggest limitation: they can only handle HTTP traffic, they reveal proxy usage through identifiable headers, and they cannot proxy UDP, which leaves WebRTC and DNS vulnerable to leaks.

This document covers how HTTP proxies work at the protocol level, the CONNECT method for HTTPS tunneling, authentication mechanisms, and the implications of modern protocols like HTTP/2 and HTTP/3.

!!! info "Module Navigation"
    - [Network Fundamentals](./network-fundamentals.md): TCP/IP, UDP, OSI model
    - [Network & Security Overview](./index.md): Module introduction
    - [SOCKS Proxies](./socks-proxies.md): Protocol-agnostic alternative
    - [Proxy Detection](./proxy-detection.md): How to avoid detection

    For practical configuration, see [Proxy Configuration](../../features/configuration/proxy.md).

## How HTTP Proxies Work

An HTTP proxy sits between the client and the target server, maintaining two separate TCP connections: one from the client to the proxy, and another from the proxy to the target server. Because the proxy understands HTTP, it can make intelligent decisions about the traffic passing through it.

### Request Flow

When a client is configured to use an HTTP proxy, it sends the full HTTP request to the proxy rather than directly to the target server. The key difference from a direct request is that the request line includes the absolute URI, not just the path. For example, instead of `GET /page HTTP/1.1`, the client sends `GET http://example.com/page HTTP/1.1`. This tells the proxy where to forward the request.

```mermaid
sequenceDiagram
    participant Client as Client Browser
    participant Proxy as HTTP Proxy
    participant Server as Target Server

    Client->>Proxy: GET http://example.com/page HTTP/1.1<br/>Host: example.com<br/>User-Agent: Mozilla/5.0
    Note over Client,Proxy: TCP connection #1

    Note over Proxy: Parse request, check auth,<br/>check cache, apply rules

    Proxy->>Server: GET /page HTTP/1.1<br/>Host: example.com<br/>Via: 1.1 proxy.example.com<br/>X-Forwarded-For: 192.168.1.100
    Note over Proxy,Server: TCP connection #2

    Server->>Proxy: HTTP/1.1 200 OK<br/>[response body]

    Note over Proxy: Cache response if allowed,<br/>filter content, log transaction

    Proxy->>Client: HTTP/1.1 200 OK<br/>Via: 1.1 proxy.example.com<br/>[possibly modified body]
```

The proxy receives the full HTTP request, parses the method, URL, and headers, then decides what to do. It may check authentication credentials, verify the URL against an access control list, look for a cached copy of the resource, and modify headers before forwarding. It then opens a separate TCP connection to the target server and sends the request, potentially with altered headers.

When the response arrives, the proxy can cache it according to HTTP semantics (`Cache-Control`, `ETag`), filter the content for malware or blocked keywords, compress it if the client supports it, and log the transaction before forwarding the response back to the client.

### Proxy Headers and Privacy

HTTP proxies commonly add headers that reveal their presence and the client's real IP address. The `Via` header (RFC 9110) identifies the proxy in the request chain. The `X-Forwarded-For` header contains the original client IP, often forming a chain if multiple proxies are involved. The `X-Forwarded-Proto` header indicates whether the original request was HTTP or HTTPS. Some proxies also add `X-Real-IP` as a simpler alternative to `X-Forwarded-For`.

There is also a standardized `Forwarded` header (RFC 7239) that combines all of this information into a single field, for example `Forwarded: for=192.168.1.100;proto=http;by=proxy.example.com`. In practice, most proxies still use the `X-Forwarded-*` variants since they have broader support.

Legacy clients and some older browsers may also send a `Proxy-Connection: keep-alive` header instead of `Connection: keep-alive` when routing through a proxy. This header is a well-known indicator of proxy usage and a classic detection signal.

!!! danger "Header Detection"
    Detection systems look for the presence of `Via`, `X-Forwarded-For`, or `Forwarded` headers to confirm proxy usage. If `X-Real-IP` does not match the connecting IP, the proxy is confirmed. Sophisticated proxies can strip these headers, but many commercial proxy services leave them in by default. Always verify your proxy's behavior using a tool like [browserleaks.com/ip](https://browserleaks.com/ip).

### Capabilities and Limitations

Because HTTP proxies parse and understand the HTTP protocol, they can read and modify every part of an unencrypted HTTP request and response: URLs, headers, cookies, and bodies. This lets them cache responses intelligently, filter content by URL or keyword, inject or strip headers, authenticate users, and log all traffic in detail.

The trade-off is that this deep coupling with HTTP means the proxy is limited to HTTP traffic. It cannot natively proxy FTP, SSH, SMTP, or custom protocols (though the CONNECT method, described below, provides a tunneling workaround for any TCP-based protocol). It has no support for UDP, which means WebRTC, DNS queries, and QUIC/HTTP/3 traffic bypass it entirely. And inspecting HTTPS content requires TLS termination, which breaks end-to-end encryption.

## The CONNECT Method: HTTPS Tunneling

The CONNECT method (RFC 9110, Section 9.3.6) solves a fundamental problem: how can an HTTP proxy forward encrypted traffic it cannot read? The answer is to become a blind TCP tunnel.

When a client wants to access an HTTPS site through a proxy, it sends a `CONNECT` request asking the proxy to establish a raw TCP connection to the destination. Once the proxy confirms the tunnel is established, it stops being an HTTP proxy entirely and becomes a transparent TCP relay at Layer 4, forwarding bytes in both directions without interpreting them.

```mermaid
sequenceDiagram
    participant Client
    participant Proxy
    participant Server

    Client->>Proxy: CONNECT example.com:443 HTTP/1.1<br/>Host: example.com:443<br/>Proxy-Authorization: Basic dXNlcjpwYXNz
    Note over Client,Proxy: Unencrypted HTTP request

    Proxy->>Server: TCP three-way handshake
    Note over Proxy,Server: TCP connection established

    Proxy->>Client: HTTP/1.1 200 Connection Established

    Note right of Proxy: Proxy is now a transparent<br/>TCP relay (Layer 4)

    Client->>Server: TLS ClientHello
    Note over Client,Server: TLS handshake (proxy sees<br/>this in plaintext)
    Server->>Client: TLS ServerHello, Certificate

    Client->>Server: Encrypted HTTP/2 request
    Server->>Client: Encrypted HTTP/2 response

    Note over Proxy: Proxy blindly forwards<br/>all encrypted data
```

### The CONNECT Request

The CONNECT request is minimal. The method is `CONNECT`, the request URI is the destination `host:port` (not a path), and it includes authentication if the proxy requires it. There is no request body. The proxy validates the credentials, checks its access control rules, and opens a TCP connection to the specified host and port. If everything succeeds, it sends back `HTTP/1.1 200 Connection Established` followed by a blank line. After that blank line, the HTTP conversation ends and the proxy becomes a transparent relay.

### Visibility After CONNECT

Once the tunnel is established, the proxy's visibility is limited. It knows the destination hostname and port from the CONNECT request. It can observe connection timing (when it was established and for how long), the volume of data transferred in each direction, and when either side terminates the connection. It can also observe the TLS handshake that follows, which is particularly relevant.

The TLS ClientHello message, sent immediately after the tunnel is established, is transmitted in plaintext. The proxy (and any network observer) can directly read the TLS version, the full list of supported cipher suites, the extensions and their parameters, the elliptic curves offered, and the SNI (Server Name Indication) extension that contains the target hostname. This is exactly the information used for TLS fingerprinting (JA3/JA4). See [Network Fingerprinting](../fingerprinting/network-fingerprinting.md) for details.

What the proxy cannot see is the encrypted application data: HTTP methods, URLs, request and response headers, cookies, session tokens, and response content are all encrypted inside the TLS tunnel.

!!! note "SNI and Encrypted Client Hello (ECH)"
    The SNI extension in the ClientHello reveals the target hostname in plaintext, which is redundant with the CONNECT request in the proxy scenario but relevant for other network observers. Encrypted Client Hello (ECH), currently being deployed, aims to encrypt the SNI to address this leak. However, ECH adoption is still limited and requires both client and server support.

### CONNECT for Non-HTTPS Protocols

While CONNECT is primarily used for HTTPS, it can tunnel any TCP-based protocol. An IMAPS connection to port 993, an SSH connection to port 22, or FTP-over-TLS to port 990 all work through a CONNECT tunnel. The proxy does not need to understand these protocols because after the tunnel is established, it is simply relaying bytes.

In practice, many corporate proxies restrict CONNECT to port 443 (HTTPS) to prevent abuse. Attempting `CONNECT example.com:22` for SSH will often return `403 Forbidden`.

### The HTTPS Dilemma

HTTP proxies face a fundamental choice with encrypted traffic. With the CONNECT tunnel approach, end-to-end encryption is preserved, the client verifies the server's certificate directly, and certificate pinning works normally. But the proxy cannot inspect, cache, or filter the encrypted content.

The alternative is TLS termination (MITM), where the proxy decrypts HTTPS traffic, inspects the content, and re-encrypts it before forwarding. This requires installing the proxy's CA certificate on the client, breaks end-to-end encryption, and is detectable through certificate pinning and Certificate Transparency logs. Most corporate proxies use this approach for content filtering and security scanning, while privacy-focused proxies use blind CONNECT tunnels.

For web scraping and automation, this distinction matters for TLS fingerprinting. If the proxy performs TLS termination, the TLS fingerprint that the target server sees belongs to the proxy, not your browser. If you are using a CONNECT tunnel, the fingerprint is preserved end-to-end. Depending on your evasion strategy, one approach may be preferable to the other.

| Aspect | HTTP (no CONNECT) | HTTPS (CONNECT tunnel) |
|--------|-------------------|------------------------|
| Proxy visibility | Full HTTP request/response | Only destination host:port + TLS ClientHello |
| Encryption | None (unless TLS termination) | End-to-end TLS |
| Caching | Yes, based on HTTP semantics | No (encrypted content) |
| Content filtering | Yes | No (only hostname-based blocking) |
| Header modification | Yes | No (encrypted headers) |
| URL visibility | Full URL | Only hostname (via CONNECT and SNI) |
| Protocol support | HTTP only | Any protocol over TCP |

## HTTPS Proxies (TLS to Proxy)

A distinction worth clarifying is the difference between proxying HTTPS traffic and connecting to the proxy itself over HTTPS. When you configure `--proxy-server=https://proxy:port` instead of `http://proxy:port`, the connection between your browser and the proxy is encrypted with TLS. This protects your proxy authentication credentials from being sniffed on the local network and hides even the CONNECT hostname from local observers, since it is encapsulated inside the TLS connection to the proxy.

Chrome supports this via the `https://` scheme in `--proxy-server`. It is particularly important when using a proxy over untrusted networks (public Wi-Fi, shared hosting), where the connection between you and the proxy is the weakest link.

## Authentication

HTTP proxy authentication uses standard HTTP status codes and headers, following RFC 9110. When a proxy requires authentication, it responds with `407 Proxy Authentication Required` and a `Proxy-Authenticate` header indicating which authentication schemes it supports. The client then retransmits the request with a `Proxy-Authorization` header containing the credentials.

### Authentication Schemes

There are several authentication schemes, each with different security characteristics.

**Basic** (RFC 7617) is the simplest. The client sends `Proxy-Authorization: Basic <base64(username:password)>`. Base64 is an encoding, not encryption, so credentials are trivially reversible. Anyone who intercepts the header can decode it instantly and reuse it indefinitely since there is no replay protection. Basic auth should only be used over TLS-encrypted connections.

**Digest** (RFC 7616) uses a challenge-response mechanism. The proxy sends a random nonce, and the client computes a hash of the username, password, nonce, and request URI. The password is never transmitted, and the nonce provides replay protection. The original version uses MD5, which is fast enough to brute-force efficiently, though RFC 7616 added SHA-256 support. Digest auth is rarely implemented by modern proxy services.

**NTLM** is Microsoft's proprietary challenge-response protocol, common in Windows enterprise environments. It uses a three-step negotiation (Type 1 negotiation, Type 2 challenge, Type 3 authentication) and integrates with Active Directory for single sign-on. NTLMv1 uses DES (broken), and NTLMv2 uses HMAC-MD5 (considered weak by modern standards). Microsoft recommends Kerberos over NTLM for new deployments. NTLM is connection-bound, which means it breaks with HTTP/2 multiplexing.

**Negotiate** (RFC 4559) uses SPNEGO to select between Kerberos and NTLM, preferring Kerberos. Kerberos offers the strongest security (AES encryption, mutual authentication, time-limited tickets) but requires Active Directory infrastructure, domain-joined machines, and accurate clock synchronization. In browser automation, Kerberos is difficult to configure programmatically.

| Scheme | Security | Mechanism | Practical Notes |
|--------|----------|-----------|-----------------|
| Basic | Low | Base64-encoded credentials | Universal support. Only use over TLS. |
| Digest | Medium | Challenge-response with MD5/SHA-256 | Replay protection via nonce. Rarely implemented. |
| NTLM | Medium | Challenge-response (NT hash) | Windows SSO. Proprietary, known vulnerabilities. |
| Negotiate | High | Kerberos/SPNEGO | Strongest. Requires Active Directory. |

### Authentication in Pydoll

Chrome does not support inline proxy credentials in the `--proxy-server` flag. Writing `--proxy-server=http://user:pass@proxy:port` will not work: Chrome silently ignores the `user:pass` portion and connects without authentication.

Pydoll solves this transparently through its `ProxyManager`. When you provide a proxy URL with embedded credentials, Pydoll extracts the username and password, strips them from the URL before passing it to Chrome, and uses the CDP Fetch domain to intercept `407 Proxy Authentication Required` responses and automatically supply the credentials via `Fetch.continueWithAuth`. This approach works for all authentication schemes that Chrome supports (Basic, Digest, NTLM, Negotiate) without Pydoll needing to implement the protocol-specific logic.

```python
from pydoll.browser import Chrome
from pydoll.browser.options import ChromiumOptions

options = ChromiumOptions()
# Pydoll extracts credentials, cleans the URL, and handles 407 via CDP
options.add_argument('--proxy-server=http://user:pass@proxy.example.com:8080')

async with Chrome(options=options) as browser:
    tab = await browser.start()
    await tab.go_to('https://example.com')
```

!!! tip "Authentication Best Practices"
    Always use TLS-encrypted proxy connections (HTTPS proxy or SSH tunnel) to protect credentials in transit. Prefer Bearer tokens for API proxies since they are revocable and time-limited. Never use Basic auth over an unencrypted HTTP connection to the proxy. Do not hardcode credentials in source code; use environment variables instead.

## Modern Protocols and Proxying

### HTTP/2

HTTP/2 introduced multiplexing, binary framing, and HPACK header compression, which fundamentally change how proxies handle connections. In HTTP/1.1, each request occupies a connection sequentially (pipelining exists but is disabled in practice, so browsers work around this by opening six parallel connections per host). In HTTP/2, a single TCP connection carries multiple concurrent streams, each with its own request and response.

For proxies, this means managing stream IDs, priorities, and flow control windows on both sides of the connection. The proxy must translate between stream IDs on the client side and the server side, maintain priority trees, and handle flow control per-stream. This is significantly more complex than the simple request-response forwarding of HTTP/1.1.

From a fingerprinting perspective, HTTP/2 stream metadata (window sizes, priority settings, header ordering within HPACK) can fingerprint individual clients even when multiple users share the same proxy.

| Feature | HTTP/1.1 | HTTP/2 |
|---------|----------|--------|
| Connections | Sequential per connection (browsers open 6 in parallel) | Multiple concurrent streams over one connection |
| Multiplexing | No (head-of-line blocking) | Yes (concurrent streams; head-of-line blocking remains at the TCP level) |
| Header Compression | None | HPACK |
| Proxy Complexity | Simple request/response forwarding | Stream ID mapping, priority management |

In HTTP/2, the CONNECT method was extended by RFC 8441 to support a `:protocol` pseudo-header, enabling WebSocket tunneling and other protocol upgrades directly within HTTP/2 streams without requiring separate connections.

### HTTP/3 and QUIC

HTTP/3 runs over QUIC (RFC 9000), which is a UDP-based transport protocol. This introduces fundamental challenges for HTTP proxies. Traditional HTTP proxies operate over TCP and cannot handle QUIC's UDP traffic. QUIC connections can survive IP changes (connection migration), complicating proxy session management. And QUIC encrypts nearly everything, including transport-level metadata that was previously visible.

Proxying QUIC requires CONNECT-UDP (RFC 9298), an extension of HTTP's CONNECT mechanism for establishing UDP tunnels through HTTP proxies. Most traditional proxies, including many commercial services, do not support this yet. When the proxy does not support QUIC, browsers fall back to HTTP/2 over TCP, which means more metadata may leak than expected if you were relying on HTTP/3's encrypted transport.

In automation scenarios, consider disabling QUIC with the `--disable-quic` Chrome flag to force HTTP/2 over TCP. This ensures all traffic passes through your proxy and eliminates the risk of UDP-based leaks from QUIC.

| Aspect | TCP + TLS (HTTP/1.1, HTTP/2) | QUIC/UDP (HTTP/3) |
|--------|------------------------------|-------------------|
| Transport | TCP (connection-oriented) | UDP (connectionless) |
| Handshake | Separate TCP + TLS (2 RTT) | Combined (0-1 RTT) |
| Head-of-line blocking | Yes (TCP level) | No (stream-level only) |
| Connection migration | Not supported | Supported (survives IP changes) |
| Proxy compatibility | Excellent | Limited (requires UDP relay support) |

!!! warning "Protocol Downgrade"
    When a proxy does not support HTTP/3, the browser silently falls back to HTTP/2 or HTTP/1.1 over TCP. This downgrade can expose transport-level metadata (TCP sequence and acknowledgment behavior, timing patterns) that QUIC would have encrypted. Monitor your traffic to understand your actual protocol version, and be aware that HTTP/3 adoption varies by region and CDN.

## Summary

HTTP proxies provide rich functionality at the cost of limited scope and privacy concerns. They can inspect, cache, and filter HTTP traffic, but they cannot handle non-HTTP protocols, UDP traffic, or HTTPS content without breaking encryption. Their presence is revealed through identifiable headers unless explicitly stripped.

For automation, the CONNECT tunnel is the most relevant feature: it preserves end-to-end TLS encryption while giving the proxy only hostname-level visibility. Pydoll handles proxy authentication transparently through the CDP Fetch domain, supporting all schemes Chrome implements.

### HTTP Proxy vs SOCKS5

| Need | HTTP Proxy | SOCKS5 |
|------|------------|--------|
| Content filtering | Yes | No |
| URL-based blocking | Yes | No (only IP:port) |
| Caching | Yes | No |
| UDP support | No | Yes |
| Protocol flexibility | HTTP only (CONNECT for TCP tunneling) | Any TCP/UDP |
| Privacy | Low (parses HTTP, adds revealing headers) | Medium (does not parse or modify traffic, but unencrypted content is still visible to operator) |
| DNS resolution | Proxy resolves (remote) | Depends (SOCKS5: typically client resolves, SOCKS5h: proxy resolves. Chrome always resolves remotely for SOCKS5.) |

For corporate environments that need content control and caching, HTTP proxies are the right choice. For privacy-focused automation, SOCKS5 offers better stealth and protocol flexibility. For maximum security, use SOCKS5 over an SSH tunnel or VPN.

**Next steps:**

- [SOCKS Proxies](./socks-proxies.md): Protocol-agnostic, session-layer proxying
- [Network Fundamentals](./network-fundamentals.md): TCP/IP, UDP, WebRTC
- [Proxy Detection](./proxy-detection.md): How proxies are detected and how to avoid it
- [Proxy Configuration](../../features/configuration/proxy.md): Practical Pydoll proxy setup
- [Network Fingerprinting](../fingerprinting/network-fingerprinting.md): TCP/IP and TLS fingerprinting

## References

- RFC 9110: HTTP Semantics (2022, replaces the RFC 7230-7235 series together with RFC 9111 and RFC 9112) - https://www.rfc-editor.org/rfc/rfc9110.html
- RFC 9112: HTTP/1.1 (2022) - https://www.rfc-editor.org/rfc/rfc9112.html
- RFC 9113: HTTP/2 (2022, replaces RFC 7540) - https://www.rfc-editor.org/rfc/rfc9113.html
- RFC 9114: HTTP/3 (2022) - https://www.rfc-editor.org/rfc/rfc9114.html
- RFC 9000: QUIC Transport Protocol (2021) - https://www.rfc-editor.org/rfc/rfc9000.html
- RFC 9298: Proxying UDP in HTTP (CONNECT-UDP, 2022) - https://www.rfc-editor.org/rfc/rfc9298.html
- RFC 8441: Bootstrapping WebSockets with HTTP/2 (2018) - https://www.rfc-editor.org/rfc/rfc8441.html
- RFC 7617: Basic Authentication (2015) - https://www.rfc-editor.org/rfc/rfc7617.html
- RFC 7616: Digest Authentication (2015) - https://www.rfc-editor.org/rfc/rfc7616.html
- RFC 7239: Forwarded HTTP Extension (2014) - https://www.rfc-editor.org/rfc/rfc7239.html
- RFC 4559: Negotiate Authentication (2006) - https://www.rfc-editor.org/rfc/rfc4559.html
- MDN Web Docs: Proxy servers and tunneling - https://developer.mozilla.org/en-US/docs/Web/HTTP/Proxy_servers_and_tunneling
- Chrome DevTools Protocol: Fetch domain - https://chromedevtools.github.io/devtools-protocol/tot/Fetch/


================================================
FILE: docs/en/deep-dive/network/index.md
================================================
# Network & Security Deep Dive

**Welcome to the foundation of modern internet communication, the battleground of anonymity, detection, and evasion.**

Network protocols are the invisible infrastructure that powers every web request, browser connection, and automation script. Understanding them deeply transforms you from a **tool user** into a **protocol engineer** capable of navigating the most sophisticated anti-bot systems.

## Why Network Architecture Matters

When you run `tab.go_to('https://example.com')`, a complex symphony of protocols springs into action:

1. **DNS resolution** translates the domain to an IP address (potentially leaking your intent)
2. **TCP handshake** establishes connection (revealing your OS through packet characteristics)
3. **TLS negotiation** secures the channel (fingerprinting your browser via cipher suites)
4. **HTTP/2 request** fetches the page (exposing browser version through SETTINGS frames)
5. **WebRTC discovery** may probe your real IP (bypassing your VPN entirely)

**Every single step is an opportunity for detection or evasion.**

!!! danger "The Network Layer Cannot Lie"
    Unlike browser-level characteristics (which JavaScript can modify), network-level fingerprints are **burned into the OS kernel and TCP/IP stack**. A mismatch here, such as a Chrome browser sending Linux TCP options while claiming to be Windows, is instantly fatal to stealth automation.

## The Architecture of Internet Privacy

This module explores the **technical foundations** that make privacy possible (and breakable) on the modern internet:

### The OSI Model Reality

```mermaid
graph TB
    subgraph "Application Layer 7"
        HTTP[HTTP/HTTPS Headers]
        DNS[DNS Queries]
    end
    
    subgraph "Presentation Layer 6"
        TLS[TLS/SSL Fingerprinting]
        Ciphers[Cipher Suites, Extensions]
    end
    
    subgraph "Session/Transport Layers 5-4"
        SOCKS[SOCKS Proxy Protocol]
        TCP[TCP Window, Options, ISN]
    end
    
    subgraph "Network Layer 3"
        IP[IP TTL, Fragmentation]
        Routing[Packet Routing, Hops]
    end
    
    HTTP --> TLS
    DNS --> TLS
    TLS --> SOCKS
    Ciphers --> TCP
    SOCKS --> IP
    TCP --> Routing
```

**Each layer is both a shield and a vulnerability:**

- **Layer 7 (Application)**: Proxies can read and modify your HTTP traffic
- **Layer 6 (Presentation)**: TLS encryption protects content but leaks metadata
- **Layer 4 (Transport)**: TCP characteristics betray your operating system
- **Layer 3 (Network)**: IP addresses reveal your physical location

## What You'll Master

This module is structured as a **technical progression** from fundamentals to advanced exploitation:

### 1. Network Fundamentals
**[Network Fundamentals](./network-fundamentals.md)**

Build the foundation: understand the protocols that power the internet and how they reveal, or hide, your identity.

- **OSI Model layers** and their fingerprinting implications
- **TCP vs UDP**: Why your proxy might leak UDP traffic
- **WebRTC IP leakage**: The hidden threat in modern browsers
- **Network stack characteristics**: TTL, window size, option ordering

**Why start here**: Without this foundation, proxy configuration is **cargo cult programming**, copying commands without understanding why they work (or don't).

### 2. HTTP/HTTPS Proxies
**[HTTP/HTTPS Proxies](./http-proxies.md)**

Master the most common proxy protocol and understand its fundamental limitations.

- **HTTP proxy operation**: Request forwarding, caching, header injection
- **CONNECT tunneling**: How HTTPS "tunnels" through HTTP proxies
- **HTTP/2 complexities**: Multiplexing, stream priorities, SETTINGS fingerprinting
- **HTTP/3 and QUIC**: UDP-based proxying challenges
- **Authentication schemes**: Basic, Digest, NTLM, Bearer tokens

**Critical insight**: HTTP proxies operate at Layer 7, so they can **read, modify, and log** your unencrypted traffic. For true privacy, you need encryption **before** the proxy sees your data.

### 3. SOCKS Proxies
**[SOCKS Proxies](./socks-proxies.md)**

Understand why SOCKS5 is the **gold standard** for privacy-conscious automation.

- **SOCKS4 vs SOCKS5**: Protocol evolution and capabilities
- **SOCKS5 handshake**: Binary protocol deep dive with packet structures
- **UDP support**: Gaming, VoIP, and WebRTC over SOCKS5
- **DNS resolution**: Why proxy-side DNS prevents leaks
- **Why SOCKS5 > HTTP proxies**: Protocol-level comparison

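**Key advantage**: SOCKS operates at Layer 5 (Session), **below** the application layer. It does not parse or modify your HTTP traffic and only needs the destination address and port, vastly reducing the trust surface area. Note that unencrypted payloads are still visible to the proxy operator, so keep using TLS end-to-end.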

### 4. Proxy Detection
**[Proxy Detection & Anonymity](./proxy-detection.md)**

Learn how websites **detect proxy usage** and how to evade detection.

- **Anonymity levels**: Transparent, anonymous, elite proxies
- **IP reputation databases**: How your datacenter IP betrays you
- **Header analysis**: X-Forwarded-For, Via, Forwarded headers
- **Consistency checks**: DNS reverse lookup, geolocation mismatches
- **Network fingerprinting integration**: Combining proxy detection with TCP/TLS analysis

**Harsh reality**: Most "anonymous" proxies are trivially detectable. True stealth requires **elite residential proxies** + **consistent browser fingerprinting** + **human-like behavior**.

### 5. Building Proxy Servers
**[Building Your Own Proxy](./build-proxy.md)**

Implement HTTP and SOCKS5 proxies from scratch in Python, the ultimate learning experience.

- **HTTP proxy server**: Complete async implementation with authentication
- **SOCKS5 proxy server**: Binary protocol handling, TCP tunneling
- **Proxy chaining**: Layered anonymity (and latency tradeoffs)
- **Rotating proxy pools**: Health checking, failover, load balancing
- **Advanced topics**: Transparent proxies, MITM SSL interception

**Why build your own**: Understanding implementation details reveals **attack vectors** and **optimization opportunities** invisible from the outside.

### 6. Legal & Ethical Considerations
**[Legal & Ethical Guidelines](./proxy-legal.md)**

Navigate the legal minefield of proxy usage and web automation.

- **Regulatory compliance**: GDPR, CFAA, international laws
- **Terms of Service**: What constitutes violation
- **Ethical guidelines**: robots.txt, rate limiting, transparency
- **Case studies**: Legal precedents (hiQ vs LinkedIn, QVC vs Resultly)
- **When to avoid proxies**: High-risk scenarios

**Disclaimer**: This is **educational information**, not legal advice. The law varies wildly by jurisdiction and use case. Consult qualified counsel.

## The Proxy Paradox

Here's the uncomfortable truth about proxies:

!!! warning "Proxies Don't Make You Anonymous. They Make You **Different**"
    A proxy changes your IP address, but it also:
    
    - Adds **latency** (detectable via timing analysis)
    - Resets **TTL** values (revealing proxy hops)
    - Introduces **TCP fingerprint** mismatches (proxy OS ≠ your OS)
    - May inject **headers** (X-Forwarded-For, Via)
    - Creates **geolocation** inconsistencies (browser timezone ≠ IP location)
    
    Proxies are a **tool**, not a solution. True stealth requires **holistic consistency**.

## Prerequisites

This is **advanced material**. You should be comfortable with:

Basic networking concepts (IP addresses, ports, protocols)  
TCP/IP fundamentals (three-way handshake, packets, routing)  
Asynchronous Python programming (asyncio, async/await)  
Pydoll basics (see [Core Concepts](../../features/core-concepts.md))  

**If you're new to networking**, we highly recommend:

1. Read a TCP/IP fundamentals guide first
2. Experiment with Wireshark to visualize network traffic
3. Try the code examples with packet captures running
4. Build the proxy servers and test them locally

## Integration with Other Modules

Network architecture doesn't exist in isolation. It integrates deeply with:

- **[Fingerprinting](../fingerprinting/network-fingerprinting.md)**: How TCP/IP and TLS characteristics identify you
- **[Browser Configuration](../../features/configuration/browser-preferences.md)**: Aligning browser behavior with proxy characteristics
- **[Connection Layer](../fundamentals/connection-layer.md)**: How Pydoll manages WebSocket connections over proxies

## The Learning Path

We recommend this progression:

**Phase 1: Foundation**

1. Read [Network Fundamentals](./network-fundamentals.md)
2. Understand OSI model and protocol layering
3. Learn about WebRTC leaks and UDP tunneling

**Phase 2: Protocol Deep Dive**

4. Study [HTTP/HTTPS Proxies](./http-proxies.md)
5. Master [SOCKS Proxies](./socks-proxies.md)
6. Compare protocols and understand tradeoffs

**Phase 3: Adversarial Thinking**

7. Explore [Proxy Detection](./proxy-detection.md)
8. Learn detection techniques from the defender's perspective
9. Apply evasion strategies

**Phase 4: Hands-On Implementation**

10. Build proxy servers from [Building Proxies](./build-proxy.md)
11. Capture and analyze traffic with Wireshark
12. Test proxy chains and rotation strategies

**Phase 5: Operational Security**

13. Review [Legal & Ethical](./proxy-legal.md) guidelines
14. Understand compliance requirements
15. Develop responsible automation policies


## The Philosophy

Network and security knowledge is **foundational power**. Unlike framework-specific skills (which become obsolete), protocol knowledge is **timeless**:

- TCP hasn't fundamentally changed since RFC 793 (1981)
- TLS builds on concepts from SSL (1995)
- HTTP/2 (2015) and HTTP/3 (2022) are evolutions, not revolutions

Master these fundamentals once, and you'll understand **every network-based system** you encounter for the rest of your career.

## Ethical Commitment

Before proceeding, acknowledge:

I understand proxies can be used for both legitimate and malicious purposes  
I will respect website terms of service and robots.txt  
I will implement rate limiting and respectful crawling  
I will not use this knowledge for fraud, abuse, or illegal activities  
I will consult legal counsel when uncertain about compliance  

**With great power comes great responsibility.** Use this knowledge wisely.

---

## Ready to Begin?

Start your journey with **[Network Fundamentals](./network-fundamentals.md)** to build the foundation, then progress through the modules in order. Each document builds on the previous, creating a comprehensive understanding of network architecture for automation.

---

!!! info "Documentation Status"
    This module synthesizes knowledge from RFCs, protocol specifications, security research, and real-world testing. Every code example is production-ready. If you find inaccuracies or have improvements, contributions are welcome.

## Quick Navigation

**Core Protocols:**

- [Network Fundamentals](./network-fundamentals.md) - TCP/IP, UDP, WebRTC
- [HTTP/HTTPS Proxies](./http-proxies.md) - Application-layer proxying
- [SOCKS Proxies](./socks-proxies.md) - Session-layer proxying

**Advanced Topics:**

- [Proxy Detection](./proxy-detection.md) - Anonymity and evasion
- [Building Proxies](./build-proxy.md) - Implementation from scratch
- [Legal & Ethical](./proxy-legal.md) - Compliance and responsibility

**Related Modules:**

- [Fingerprinting](../fingerprinting/index.md) - Detection techniques
- [Browser Configuration](../../features/configuration/browser-options.md) - Practical setup


================================================
FILE: docs/en/deep-dive/network/network-fundamentals.md
================================================
# Network Fundamentals

This document covers the foundational network protocols that power the internet and how they can expose or protect your identity in automation scenarios. A working understanding of TCP, UDP, the OSI model, and WebRTC will make proxy configuration far less mysterious and far more effective.

!!! info "Module Navigation"
    - [Network & Security Overview](./index.md): Module introduction and learning path
    - [HTTP/HTTPS Proxies](./http-proxies.md): Application-layer proxying
    - [SOCKS Proxies](./socks-proxies.md): Session-layer proxying

    For practical Pydoll usage, see [Proxy Configuration](../../features/configuration/proxy.md) and [Browser Options](../../features/configuration/browser-options.md).

## The Network Stack

Every HTTP request your browser makes travels through a layered network stack. Each layer has specific responsibilities, protocols, and security implications. Proxies operate at different layers, and the layer determines what the proxy can see, modify, and hide. Network characteristics at lower layers can fingerprint your real system even through proxies, so understanding the stack helps you see where identity leaks happen and how to prevent them.

### The OSI Model

The OSI (Open Systems Interconnection) model, developed by ISO in 1984, provides a conceptual framework for understanding how network protocols interact. Real-world networks use the TCP/IP model (which predates OSI and has only 4 layers), but OSI terminology remains the standard way to describe where proxies operate and what they can access.

```mermaid
graph TD
    L7[Layer 7: Application - HTTP, FTP, SMTP, DNS]
    L6[Layer 6: Presentation - Encryption, Compression]
    L5[Layer 5: Session - SOCKS]
    L4[Layer 4: Transport - TCP, UDP]
    L3[Layer 3: Network - IP, ICMP]
    L2[Layer 2: Data Link - Ethernet, WiFi]
    L1[Layer 1: Physical - Cables, Radio Waves]

    L7 --> L6 --> L5 --> L4 --> L3 --> L2 --> L1
```

Layer 7 (Application) is where user-facing protocols live: HTTP, HTTPS, FTP, SMTP, and DNS all operate here. This layer contains the actual data your application cares about, such as HTML documents, JSON responses, and file transfers. HTTP proxies operate at this layer, which gives them full visibility into request and response content.

Layer 6 (Presentation) handles data format translation, encryption, and compression. SSL/TLS is commonly associated with this layer for its encryption role, though in practice TLS straddles Layers 4 through 6 and does not map cleanly to any single OSI layer. What matters for automation is that HTTPS encryption happens here, encrypting Layer 7 data before it moves down the stack.

Layer 5 (Session) manages connections between applications. SOCKS proxies operate here, below the application layer but above transport. This position makes SOCKS protocol-agnostic: it can proxy any Layer 7 protocol (HTTP, FTP, SMTP, SSH) without needing to understand their specifics.

Layer 4 (Transport) provides end-to-end data delivery. TCP (connection-oriented, reliable) and UDP (connectionless, fast) are the dominant protocols here. This layer handles port numbers, flow control, and error correction. All proxies ultimately rely on Layer 4 for actual data transmission.

Layer 3 (Network) handles routing and addressing between networks. IP (Internet Protocol) operates here, managing IP addresses and routing decisions. This is where your real IP address lives, and where proxies aim to substitute it.

Layer 2 (Data Link) manages communication on the same physical network segment. Ethernet, Wi-Fi, and PPP operate here, handling MAC addresses and frame transmission. MAC addresses are only visible on the local network segment and are not directly accessible by remote servers, though they can be exposed through protocols like IPv6 SLAAC with EUI-64 interface identifiers (which embed the MAC in the address; modern operating systems default to randomized privacy addresses instead).

Layer 1 (Physical) is the actual hardware: cables, radio waves, and voltage levels. Rarely relevant to software automation.

!!! tip "OSI vs TCP/IP"
    The TCP/IP model (4 layers: Link, Internet, Transport, Application) is what networks actually use. OSI (7 layers) is a teaching tool and reference model. When people say "Layer 7 proxy," they are using OSI terminology, but the actual implementation runs on TCP/IP.

### How Layer Positioning Affects Proxies

The layer where a proxy operates determines what it can and cannot do.

HTTP/HTTPS proxies operate at Layer 7 (Application). Because they understand HTTP, they can read and modify URLs, headers, cookies, and request bodies. They can cache responses intelligently based on HTTP semantics, filter content by URL or keyword, and inject authentication headers. The trade-off is that they only understand HTTP. They cannot proxy FTP, SMTP, SSH, or other protocols, and inspecting HTTPS content requires TLS termination, which means decrypting and re-encrypting the traffic.

SOCKS proxies operate at Layer 5 (Session). Because they sit below the application layer, they are protocol-agnostic and can proxy any Layer 7 protocol without modification. HTTPS traffic passes through encrypted end-to-end, since the SOCKS proxy never needs to decrypt it. SOCKS5 also supports UDP, enabling it to proxy DNS queries, VoIP, and other UDP-based protocols. The trade-off is that SOCKS proxies have no visibility into application-layer data: they cannot cache, filter by URL, or inspect content. They can only filter by IP and port.

!!! note "The Fundamental Tradeoff"
    Higher layers (Layer 7) give you more control but less flexibility. Lower layers (Layer 5) give you less control but more flexibility. Choose HTTP proxies when you need content control, and SOCKS proxies when you need protocol flexibility or end-to-end encryption.

### The Layer Leak Problem

Even with a perfect Layer 7 proxy, lower-layer characteristics can expose your real identity. Your operating system's TCP stack at Layer 4 has a unique fingerprint defined by window size, options order, and TTL values. IP header fields at Layer 3 such as TTL and fragmentation behavior reveal your OS and network topology.

For example, if you configure a proxy to present a "Windows 10" User-Agent but your actual Linux system's TCP fingerprint contradicts this at Layer 4, sophisticated detection systems can flag this inconsistency as a strong bot indicator. This is why network-level fingerprinting (covered in [Network Fingerprinting](../fingerprinting/network-fingerprinting.md)) is so dangerous: it operates below the proxy layer, exposing your real system even when application-layer proxying is flawless.

## TCP vs UDP

At Layer 4 (Transport), two fundamentally different protocols dominate internet communication. They represent opposite design philosophies: reliability versus speed.

TCP is connection-oriented. Think of it like a phone call: you establish a connection, verify the other party is listening, exchange data reliably, then hang up. Every byte is acknowledged, ordered, and guaranteed to arrive. UDP is connectionless. You send your data and hope it arrives. No handshake, no acknowledgments, no guarantees. Just raw speed with minimal overhead.

| Feature | TCP | UDP |
|---------|-----|-----|
| Connection | Connection-oriented (handshake required) | Connectionless (no handshake) |
| Reliability | Guaranteed delivery, ordered packets | Best-effort delivery, packets may be lost |
| Speed | Slower (overhead from reliability mechanisms) | Faster (minimal overhead) |
| Use Cases | Web browsing, file transfer, email | Video streaming, DNS queries, gaming |
| Header Size | 20 bytes minimum (up to 60 with options) | 8 bytes fixed |
| Flow Control | Yes (sliding window, receiver-driven) | No (sender transmits at will) |
| Congestion Control | Yes (slows down when network is congested) | No (application's responsibility) |
| Error Checking | Extensive (checksum + acknowledgments) | Basic (checksum only; optional in IPv4, mandatory in IPv6) |
| Ordering | Packets reordered if received out-of-sequence | No ordering, packets delivered as received |
| Retransmission | Automatic (lost packets retransmitted) | None (application must handle) |

### TCP and Proxies

All proxy protocols (HTTP, HTTPS, SOCKS4, SOCKS5) use TCP for their control channel. This is because proxy authentication and command exchange require guaranteed delivery, proxy protocols have strict command sequences (handshake, then auth, then data), and proxies need persistent connections to track client state.

However, SOCKS5 can also proxy UDP traffic, unlike SOCKS4 or HTTP proxies. This makes SOCKS5 essential for proxying DNS queries, WebRTC audio/video, VoIP, and gaming protocols.

!!! danger "UDP and IP Leakage"
    Most browser connections use TCP (HTTP, WebSocket, etc.), but WebRTC uses UDP directly, bypassing the browser's proxy configuration. This is the most common cause of IP leakage in proxied browser automation: your TCP traffic goes through the proxy while your UDP traffic leaks your real IP.

### The TCP Three-Way Handshake

Before any data can be transmitted, TCP requires a three-way handshake to establish a connection. This negotiation synchronizes sequence numbers, agrees on window sizes, and establishes connection state on both ends.

```mermaid
sequenceDiagram
    participant Client
    participant Server

    Client->>Server: SYN (Synchronize, seq=x)
    Note over Client,Server: Client requests connection

    Server->>Client: SYN-ACK (seq=y, ack=x+1)
    Note over Client,Server: Server acknowledges and sends its own SYN

    Client->>Server: ACK (ack=y+1)
    Note over Client,Server: Connection established, data transfer begins
```

The process starts when the client sends a SYN (Synchronize) packet containing a random Initial Sequence Number (ISN), for example `seq=1000`. Along with the ISN, the SYN advertises the client's receive window and carries TCP options: Maximum Segment Size (MSS), window scaling, timestamps, and SACK support.

The server responds with a SYN-ACK: it picks its own random ISN (e.g., `seq=5000`) and acknowledges the client's ISN by setting `ack=1001` (client's ISN + 1). This single packet both establishes the server-to-client direction (SYN) and confirms the client-to-server direction (ACK). The server also returns its own TCP options.

The client then sends a final ACK, acknowledging the server's ISN (`ack=5001`). At this point the connection is fully established in both directions and data transmission can begin.

The ISN is randomized rather than starting from zero to prevent TCP hijacking attacks. If ISNs were predictable, an attacker could inject packets into an existing connection by guessing the sequence numbers. Modern systems use cryptographic randomness for ISN selection (RFC 6528).

### TCP Fingerprinting

The TCP handshake reveals characteristics that fingerprint your operating system. Different OSes use different default values for the initial window size, TCP options order, TTL (Time To Live), window scale factor, and timestamp behavior. These values are set by the kernel, not the browser, so a proxy cannot change them.

Here are illustrative examples for modern operating systems. Note that actual values vary across OS versions, kernel configurations, and network tuning:

```
Windows 10/11 (modern builds):
    Window Size: 65535
    MSS: 1460
    Options: MSS, NOP, WS, NOP, NOP, SACK_PERM
    TTL: 128

Linux (kernel 5.x+, Ubuntu 20.04+):
    Window Size: 29200
    MSS: 1460
    Options: MSS, SACK_PERM, TS, NOP, WS
    TTL: 64

macOS (Monterey+):
    Window Size: 65535
    TTL: 64
```

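These differences are burned into the kernel. A proxy cannot change them because they are set by the operating system, not the browser. Because a proxy terminates your TCP connection and opens its own connection to the destination, the target server sees the proxy host's TCP fingerprint rather than yours; sophisticated detection systems flag traffic when that fingerprint contradicts the operating system your browser claims to be.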

!!! warning "Proxy Limitation"
    HTTP and SOCKS proxies operate above the TCP layer. They cannot modify TCP handshake characteristics. Your OS's TCP fingerprint is always exposed to the proxy server and any network observers between you and the proxy. Only VPN-level solutions or OS-level TCP stack configuration can address this.

!!! note "Beyond TCP Fingerprinting"
    The TCP handshake is just the first fingerprinting opportunity. Immediately after, the TLS handshake reveals another unique fingerprint known as JA3/JA4. See [Network Fingerprinting](../fingerprinting/network-fingerprinting.md) for details on TLS and HTTP/2 fingerprinting.

### UDP

Unlike TCP's reliable, connection-oriented approach, UDP is a fire-and-forget protocol. It trades reliability for minimal latency and overhead, making it ideal for real-time applications where speed matters more than perfect delivery.

A UDP datagram has only an 8-byte header (compared to TCP's 20-60 bytes), containing source port, destination port, length, and a checksum. There is no connection establishment, no reliability guarantee, no flow control, and no congestion control. If a packet is lost, the application must decide whether and how to handle it.

UDP is the right choice for real-time communication (voice/video calls via WebRTC and VoIP), gaming (low-latency state updates), streaming (where occasional frame loss is acceptable), and DNS queries (small request/response pairs where the application handles retries). It is a poor choice for file transfers, web browsing, email, or databases, all of which need reliable, ordered delivery.

DNS is a particularly important example in the context of automation. DNS uses UDP because queries are typically small and benefit from UDP's zero-handshake overhead. While EDNS0 (RFC 6891) increased the maximum UDP DNS payload beyond the original 512-byte limit, most queries remain compact. The DNS client handles retries at the application level if a response does not arrive within a timeout.

For browser automation, the key concern with UDP is that WebRTC uses it for real-time audio and video, DNS queries use it for domain resolution, and most proxies (HTTP, HTTPS, SOCKS4) only handle TCP. Unless you explicitly configure UDP proxying, this traffic bypasses your proxy and leaks your real IP.

| Proxy Type | UDP Support | Notes |
|------------|-------------|-------|
| HTTP Proxy | No | Only proxies TCP-based HTTP/HTTPS |
| HTTPS Proxy (CONNECT) | No | CONNECT method only establishes TCP tunnels |
| SOCKS4 | No | TCP-only protocol |
| SOCKS5 | Yes | Supports UDP relay via `UDP ASSOCIATE` command |
| VPN | Yes | Tunnels all IP traffic (TCP and UDP) |

For true anonymity in browser automation, you need one of the following: a SOCKS5 proxy with UDP support and WebRTC configured to use it, WebRTC disabled entirely (which breaks video conferencing), a VPN that tunnels all traffic, or the browser flag `--force-webrtc-ip-handling-policy=disable_non_proxied_udp`.

### QUIC and HTTP/3

Modern browsers increasingly use QUIC (RFC 9000), a UDP-based transport protocol that powers HTTP/3. Since QUIC runs over UDP, it shares the same proxy bypass issues as WebRTC and DNS: most HTTP proxies cannot handle QUIC traffic, and it may leak outside your proxy configuration.

In automation scenarios, consider disabling QUIC with the `--disable-quic` Chrome flag to force HTTP/2 over TCP, ensuring all web traffic passes through your proxy. QUIC also has its own fingerprinting characteristics, similar to JA3 for TLS, which adds another vector for detection.

## WebRTC and IP Leakage

WebRTC (Web Real-Time Communication) is a browser API standardized by the W3C that enables peer-to-peer audio, video, and data communication directly between browsers without plugins or intermediary servers. While powerful for real-time applications, WebRTC is the single biggest source of IP leakage in proxied browser automation.

### How WebRTC Leaks Your IP

WebRTC was designed for direct peer-to-peer connections, optimizing for low latency over privacy. To establish P2P connections, WebRTC must discover your real public IP address and share it with the remote peer, even if your browser is configured to use a proxy.

The problem unfolds like this: your browser uses a proxy for HTTP/HTTPS traffic (which is TCP), but WebRTC uses STUN servers to discover your real public IP over UDP. STUN queries bypass the proxy because most proxies only handle TCP. Your real IP is discovered and shared with remote peers as part of the connection negotiation. JavaScript on the page can read these "ICE candidates" and send your real IP to the website's server.

!!! danger "Severity of WebRTC Leaks"
    Even with an HTTP proxy configured correctly, HTTPS proxy working, DNS queries proxied, User-Agent spoofed, and canvas fingerprinting mitigated, WebRTC can still leak your real IP in milliseconds. This is because WebRTC operates below the browser's proxy layer, directly interfacing with the OS network stack.

### The ICE Process

WebRTC uses ICE (Interactive Connectivity Establishment, RFC 8445) to discover possible connection paths and select the best one. This process inherently reveals your network topology by gathering three types of candidates.

```mermaid
sequenceDiagram
    participant Browser
    participant STUN as STUN Server
    participant TURN as TURN Relay
    participant Peer as Remote Peer

    Note over Browser: WebRTC connection initiated

    Browser->>Browser: Gather local IP addresses<br/>(LAN interfaces)
    Note over Browser: Local candidate:<br/>192.168.1.100:54321

    Browser->>STUN: STUN Binding Request (over UDP)
    Note over STUN: STUN server discovers public IP<br/>(bypasses proxy!)
    STUN->>Browser: STUN Response with real public IP
    Note over Browser: Server reflexive candidate:<br/>203.0.113.45:54321

    Browser->>TURN: Allocate relay (if needed)
    TURN->>Browser: Relay address assigned
    Note over Browser: Relay candidate:<br/>198.51.100.10:61234

    Browser->>Peer: Send all ICE candidates<br/>(local + public + relay)
    Note over Peer: Now knows your:<br/>- LAN IP<br/>- Real public IP<br/>- Relay address

    Peer->>Browser: Send ICE candidates

    Note over Browser,Peer: ICE negotiation: try direct P2P first

    alt Direct P2P succeeds
        Browser<<->>Peer: Direct connection (bypasses proxy entirely!)
    else Direct P2P fails (firewall/NAT)
        Browser->>TURN: Use TURN relay
        TURN<<->>Peer: Relayed connection
        Note over Browser,Peer: Higher latency, but works
    end
```

### ICE Candidate Types

ICE discovers three types of candidates (possible connection endpoints), each revealing different information about your network.

**Host candidates** are your local LAN IP addresses. The browser enumerates all local network interfaces and creates candidates for each. This reveals your local IP addresses on private networks, your network topology (presence of VPN interfaces, VM bridges), and the number of network interfaces.

```javascript
// Example host candidates
candidate:1 1 UDP 2130706431 192.168.1.100 54321 typ host
candidate:2 1 UDP 2130706431 10.0.0.5 54322 typ host
```

Modern browsers (Chrome 75+, Firefox 78+, Safari) mitigate host candidate leaks by replacing local IP addresses with ephemeral mDNS names (e.g., `a1b2c3d4.local`) when media permissions (camera/microphone) have not been granted. However, server reflexive candidates (your public IP) remain exposed regardless of mDNS.

**Server reflexive candidates** are your public IP as seen by a STUN server. The browser sends a STUN request to a public server, which replies with your public IP address. This is the leak everyone talks about: your proxy shows one IP but WebRTC reveals your real one, along with your NAT type, external port mapping, and ISP information.

```javascript
// Server reflexive candidate (your real public IP)
candidate:4 1 UDP 1694498815 203.0.113.45 54321 typ srflx raddr 192.168.1.100 rport 54321
```

**Relay candidates** are TURN server addresses used as fallback when direct P2P fails. The relay candidate may still contain your real IP in the `raddr` (related address) field, depending on the TURN server implementation.

```javascript
// Relay candidate (TURN server address)
candidate:5 1 UDP 16777215 198.51.100.10 61234 typ relay raddr 203.0.113.45 rport 54321
```

### The STUN Protocol

STUN (Session Traversal Utilities for NAT, RFC 8489) is a simple request-response protocol over UDP. Its job is straightforward: the client asks "what IP do you see me as?" and the server replies with the client's public IP and port.

The client sends a Binding Request containing a magic cookie (`0x2112A442`, a fixed value defined by the RFC) and a random 12-byte transaction ID. The server responds with a Binding Success Response that includes an `XOR-MAPPED-ADDRESS` attribute containing the client's public IP and port as seen from the server's perspective.

The IP address in the response is XOR'ed with the magic cookie (for IPv6 addresses, with the magic cookie followed by the transaction ID). This is not for security but for NAT compatibility: some NAT devices incorrectly modify IP addresses in packet payloads, and XOR'ing obfuscates the address to prevent this interference.

Common public STUN servers used by browsers include `stun.l.google.com:19302` (Google), `stun1.l.google.com:19302` (Google), `stun.services.mozilla.com` (Mozilla), and `stun.stunprotocol.org:3478`.

### Why Proxies Cannot Stop WebRTC Leaks

WebRTC leaks happen for several reinforcing reasons. First, WebRTC uses UDP, and most proxies (HTTP, HTTPS CONNECT, SOCKS4) only handle TCP. Only SOCKS5 supports UDP, and even then the browser must be explicitly configured to route WebRTC through it.

Second, WebRTC is a browser API that operates below the HTTP layer. It directly accesses the OS network stack, bypassing proxy settings configured for HTTP/HTTPS. STUN queries go directly to the network interface, and the OS routing table determines their path, not the browser's proxy configuration. Only VPN-level routing can intercept them.

Third, WebRTC enumerates all network interfaces (physical ethernet, Wi-Fi, VPN adapters, VM bridges), including interfaces not used for regular browsing. This leaks your internal network topology.

Finally, web pages can read ICE candidates via JavaScript using the `RTCPeerConnection.onicecandidate` event, extract IP addresses from candidate strings with a simple regex, and send your real IP to their tracking server.

### Preventing WebRTC Leaks in Pydoll

Pydoll provides multiple strategies for preventing WebRTC IP leaks.

**Method 1: Force WebRTC to only use proxied routes (recommended)**

```python
from pydoll.browser import Chrome
from pydoll.browser.options import ChromiumOptions

options = ChromiumOptions()
options.webrtc_leak_protection = True  # Adds --force-webrtc-ip-handling-policy=disable_non_proxied_udp
```

Pydoll provides a convenient `webrtc_leak_protection` property that manages the underlying Chrome flag for you. This disables UDP if no proxy supports it, forces WebRTC to use TURN relays only (no direct P2P), and prevents STUN queries to public servers. The trade-off is higher latency for video calls since direct P2P connections are disabled.

**Method 2: Disable WebRTC entirely**

```python
options.add_argument('--disable-features=WebRTC')
```

This completely disables the WebRTC API, eliminating any possibility of IP leaks through this vector. The trade-off is that all WebRTC-dependent sites (video conferencing, voice calls) will break. Note that this flag should be tested with your specific Chrome version, as feature flag names can vary between releases.

**Method 3: Restrict WebRTC via browser preferences**

```python
options.browser_preferences = {
    'webrtc': {
        'ip_handling_policy': 'disable_non_proxied_udp',
        'multiple_routes_enabled': False,
        'nonproxied_udp_enabled': False,
        'allow_legacy_tls_protocols': False
    }
}
```

This achieves the same effect as Method 1 but through preferences rather than command-line flags. Setting `multiple_routes_enabled` to `False` prevents WebRTC from using multiple network paths, and setting `nonproxied_udp_enabled` to `False` blocks UDP that does not go through the proxy.

**Method 4: Use a SOCKS5 proxy with UDP support**

```python
options.add_argument('--proxy-server=socks5://proxy.example.com:1080')
options.add_argument('--force-webrtc-ip-handling-policy=default_public_interface_only')
```

SOCKS5 can proxy UDP via its `UDP ASSOCIATE` command, allowing WebRTC's STUN queries to go through the proxy. This requires a SOCKS5 proxy that actually supports UDP relay, which not all do.

!!! warning "SOCKS5 Authentication"
    Chrome does not support SOCKS5 authentication inline (e.g., `socks5://user:pass@host:port`) via the `--proxy-server` flag. Pydoll provides a built-in `SOCKS5Forwarder` that works around this limitation by running a local unauthenticated SOCKS5 proxy that forwards traffic to the remote authenticated proxy, handling the username/password handshake on Chrome's behalf. See [Proxy Configuration](../../features/configuration/proxy.md) for usage details.

### Testing for WebRTC Leaks

You can test manually by visiting [browserleaks.com/webrtc](https://browserleaks.com/webrtc) and checking whether your real IP appears in the "Public IP Address" section. If you see your real IP instead of your proxy IP, you are leaking.

For automated testing with Pydoll:

```python
import asyncio
from pydoll.browser import Chrome
from pydoll.browser.options import ChromiumOptions

async def test_webrtc_leak():
    options = ChromiumOptions()
    options.add_argument('--proxy-server=http://proxy.example.com:8080')
    options.add_argument('--force-webrtc-ip-handling-policy=disable_non_proxied_udp')

    async with Chrome(options=options) as browser:
        tab = await browser.start()
        await tab.go_to('https://browserleaks.com/webrtc')

        await asyncio.sleep(3)

        ips = await tab.execute_script('''
            return Array.from(document.querySelectorAll('.ip-address'))
                .map(el => el.textContent.trim());
        ''')

        print("Detected IPs:", ips)
        # Should only show proxy IP, not your real IP

asyncio.run(test_webrtc_leak())
```

!!! danger "Always Test WebRTC Leaks"
    Never assume your proxy configuration prevents WebRTC leaks. Always verify with [browserleaks.com/webrtc](https://browserleaks.com/webrtc) or [ipleak.net](https://ipleak.net). Even a single WebRTC leak instantly compromises your entire proxy setup, since the website now knows your real location, ISP, and network topology.

### How Websites Exploit WebRTC Leaks

Websites can intentionally trigger WebRTC to extract your real IP using a few lines of JavaScript:

```javascript
const pc = new RTCPeerConnection({
    iceServers: [{urls: 'stun:stun.l.google.com:19302'}]
});

pc.createDataChannel('');
pc.createOffer().then(offer => pc.setLocalDescription(offer));

pc.onicecandidate = (event) => {
    if (event.candidate) {
        const ipRegex = /([0-9]{1,3}(\.[0-9]{1,3}){3})/;
        const ipMatch = event.candidate.candidate.match(ipRegex);

        if (ipMatch) {
            const realIP = ipMatch[1];
            fetch(`/track?real_ip=${realIP}&proxy_ip=${window.clientIP}`);
        }
    }
};
```

This code creates an RTCPeerConnection, triggers ICE candidate gathering (which contacts STUN servers), extracts IP addresses from the candidates with a regex, and sends your real IP to a tracking server. Disabling WebRTC or forcing proxied-only routes as described above prevents this.

## Summary

Proxies operate at specific layers of the network stack: HTTP at Layer 7, SOCKS at Layer 5. The layer determines what the proxy can see, modify, and hide. TCP fingerprints (window size, options, TTL) leak from lower layers and reveal your real OS even through a proxy. UDP traffic, including WebRTC and DNS, often bypasses proxies unless explicitly configured. WebRTC is the most common source of IP leakage, and only SOCKS5 or a VPN can proxy UDP traffic effectively. Modern browsers also use QUIC (HTTP/3 over UDP), which adds another potential bypass vector.

**Next steps:**

- [HTTP/HTTPS Proxies](./http-proxies.md): Application-layer proxying
- [SOCKS Proxies](./socks-proxies.md): Session-layer, protocol-agnostic proxying
- [Network Fingerprinting](../fingerprinting/network-fingerprinting.md): TCP/IP and TLS fingerprinting techniques
- [Proxy Configuration](../../features/configuration/proxy.md): Practical Pydoll proxy setup

## References

- RFC 793: Transmission Control Protocol (TCP) - https://tools.ietf.org/html/rfc793
- RFC 768: User Datagram Protocol (UDP) - https://tools.ietf.org/html/rfc768
- RFC 8489: Session Traversal Utilities for NAT (STUN) - https://tools.ietf.org/html/rfc8489
- RFC 8445: Interactive Connectivity Establishment (ICE) - https://tools.ietf.org/html/rfc8445
- RFC 8656: Traversal Using Relays around NAT (TURN) - https://tools.ietf.org/html/rfc8656
- RFC 6528: Defending Against Sequence Number Attacks - https://tools.ietf.org/html/rfc6528
- RFC 9000: QUIC: A UDP-Based Multiplexed and Secure Transport - https://tools.ietf.org/html/rfc9000
- W3C WebRTC 1.0: Real-Time Communication Between Browsers - https://www.w3.org/TR/webrtc/
- BrowserLeaks: WebRTC Leak Test - https://browserleaks.com/webrtc
- IPLeak: Comprehensive Leak Testing - https://ipleak.net


================================================
FILE: docs/en/deep-dive/network/proxy-detection.md
================================================
# Proxy Detection

Proxy detection is a probabilistic process. Websites combine dozens of signals to assess whether a connection is proxied, ranging from simple IP reputation lookups to TCP/IP stack analysis and behavioral profiling. No single signal provides definitive proof, but combining enough weak signals produces high-confidence decisions.

This document covers the main detection techniques, how they work at a technical level, and what they mean for browser automation with Pydoll.

!!! info "Module Navigation"
    - [SOCKS Proxies](./socks-proxies.md): Session-layer proxying
    - [HTTP/HTTPS Proxies](./http-proxies.md): Application-layer proxying
    - [Network Fundamentals](./network-fundamentals.md): TCP/IP, UDP, WebRTC

    For fingerprinting details, see [Network Fingerprinting](../fingerprinting/network-fingerprinting.md) and [Browser Fingerprinting](../fingerprinting/browser-fingerprinting.md).

## IP Reputation

IP reputation analysis is the most widely deployed proxy detection technique. It combines publicly available data (ASN records, WHOIS, geolocation databases) with proprietary intelligence to classify IP addresses into risk categories.

### ASN Classification

Every IP address belongs to an Autonomous System (AS), identified by an ASN. The type of AS that owns an IP is the strongest single indicator of whether it is a proxy.

IPs belonging to cloud and hosting providers (AWS, DigitalOcean, OVH, Hetzner) are flagged as high risk because real users do not browse the web from datacenter servers. IPs from residential ISPs (Comcast, Deutsche Telekom, BT) are low risk because they look like normal home connections. Mobile carrier IPs (Verizon Wireless, AT&T Mobility) are the lowest risk because they are the hardest to distinguish from real mobile users.

Some ASNs are associated with known proxy infrastructure, though this is more nuanced than it might seem. Large residential proxy providers like BrightData or Smartproxy do not operate their own ASNs; they route traffic through real residential IPs belonging to ISP ASNs. This is precisely what makes residential proxies harder to detect than datacenter proxies.

Detection systems query ASN databases (Team Cymru, RIPE NCC, ARIN) and commercial IP intelligence APIs to classify each connecting IP. Datacenter IPs are detected with roughly 95%+ accuracy because the ASN classification is unambiguous. Residential proxy detection is much harder (roughly 40-70% accuracy) because the IPs genuinely belong to ISPs. Mobile proxy detection is the most difficult (roughly 20-40% accuracy) because mobile carrier NAT makes many real users share IPs.

This accuracy gradient is why residential and mobile proxies command 10-100x the price of datacenter proxies.

### Known Proxy Databases

Beyond ASN classification, specialized databases track IPs that have been observed participating in proxy networks. Services like IPQualityScore, proxycheck.io, and Spur.us maintain real-time databases of known proxy, VPN, and Tor exit node IPs. The Tor exit node list is publicly available at [check.torproject.org](https://check.torproject.org/torbulkexitlist).

These databases also track behavioral signals: IPs that rotate frequently (typical of proxy pools), IPs with abnormally high concurrent session counts (a residential IP normally has 1-5 concurrent connections, not 100+), and IPs previously associated with bot-like activity.

### Geolocation Consistency

Proxies often reveal themselves through geographic inconsistencies. The IP address points to one location, but browser-reported signals point to another.

The most common mismatches are between the IP's geolocation and the browser's timezone (collected via JavaScript's `Intl.DateTimeFormat().resolvedOptions().timeZone`), between the IP's country and the `Accept-Language` header, and between the current session's location and a previous session's location. A user appearing in Los Angeles with a browser timezone of `Europe/Berlin` is suspicious. A user appearing in Tokyo 10 minutes after their last session in New York would have had to travel at a physically impossible speed.

Detection systems also check whether the IP's geolocation matches the locale configuration of the browser. A US datacenter IP with `Accept-Language: zh-CN` and timezone `Asia/Shanghai` strongly suggests a Chinese user routing through a US proxy.

!!! note "False Positives"
    Legitimate scenarios trigger geolocation alarms: travelers using VPNs, expats with browser settings from their home country, corporate users connecting through company VPNs, and multilingual users with non-default language preferences. Sophisticated systems use risk scoring rather than binary blocking to account for these cases.

## HTTP Header Analysis

HTTP headers are the simplest detection vector. Transparent and anonymous proxies add headers like `Via`, `X-Forwarded-For`, `X-Real-IP`, and `Forwarded` (RFC 7239) that directly reveal proxy usage. Elite proxies strip these headers, but their absence alone is not proof of a direct connection.

Detection goes beyond looking for proxy-specific headers. Missing headers that real browsers always send (like `Accept-Language`, `Accept-Encoding`, or a realistic `User-Agent`) are suspicious. Header ordering matters too: browsers send headers in a consistent, version-specific order, and proxies or automation tools that construct headers manually often get the order wrong.

The legacy `Proxy-Connection: keep-alive` header, sent by some older clients when routing through a proxy, is another classic detection signal.

### Proxy Anonymity Levels

Proxies are traditionally classified into three anonymity levels based on their header behavior:

| Level | Behavior | Detection |
|-------|----------|-----------|
| Transparent | Forwards your real IP in `X-Forwarded-For`, adds `Via` header | Trivial |
| Anonymous | Hides your IP but adds `Via` or other proxy headers | Easy |
| Elite | Strips all proxy-identifying headers | Requires deeper analysis |

This classification dates from an era when header analysis was the primary detection method. Modern detection systems use IP reputation, fingerprinting, and behavioral analysis, making the transparent/anonymous/elite distinction less meaningful. An elite proxy with a datacenter IP is detected instantly through ASN lookup. A transparent proxy on a residential IP might still slip under the radar on less sophisticated sites.

## Network Fingerprinting

Network-layer fingerprinting operates below the proxy layer, which means it can detect proxies even when the proxy itself is configured perfectly.

### TCP/IP Fingerprinting

Every operating system has a unique TCP stack implementation that reveals itself during the TCP handshake. The initial window size, TCP options order, TTL (Time To Live), and window scale factor are all set by the kernel, not the browser, and cannot be changed by a proxy.

Detection systems compare these TCP characteristics against the `User-Agent` header. If the User-Agent claims Windows 10 but the TCP fingerprint shows Linux characteristics (TTL of 64, window size of 29200), the mismatch is a strong proxy indicator. Windows uses a default TTL of 128 and modern builds typically show a window size of 65535, while Linux uses TTL 64 and window sizes around 29200.

TTL analysis adds another layer. The TTL decreases by 1 at each network hop. If a Windows connection arrives with a TTL of 128, the client is likely on the same network. If it arrives with a TTL of 115, it has crossed roughly 13 hops. If the TTL value does not align with the expected hop count for the IP's geographic location, proxy routing is likely.

For detailed TCP fingerprint values and their implications, see [Network Fingerprinting](../fingerprinting/network-fingerprinting.md).

### TLS Fingerprinting (JA3/JA4)

The TLS ClientHello message is transmitted in plaintext and contains enough parameters to uniquely identify the client application: TLS version, supported cipher suites, extensions, elliptic curves, and signature algorithms. The JA3 fingerprint is an MD5 hash of five ClientHello fields (TLS version, cipher suites, extensions, elliptic curves, and elliptic curve point formats) concatenated in a specific order. JA4 is a newer, more granular alternative.

Each browser version produces a distinctive JA3/JA4 fingerprint. Detection systems maintain databases of known fingerprints for Chrome, Firefox, Safari, and other browsers. If the JA3 fingerprint does not match any known browser, or does not match the browser claimed in the User-Agent, the connection is flagged.

An important nuance: SOCKS5 proxies and HTTP CONNECT tunnels pass the TLS ClientHello through unmodified, so the target server sees the real browser fingerprint. The proxy does not alter TLS parameters in these configurations. Only MITM proxies (which terminate and re-establish TLS) change the fingerprint, and in that case the fingerprint belongs to the proxy software, not a real browser, which is itself a detection signal.

### HTTP/2 Fingerprinting

HTTP/2 connections expose fingerprinting signals that are distinct from TLS. The SETTINGS frame sent at the beginning of an HTTP/2 connection contains parameters like `HEADER_TABLE_SIZE`, `MAX_CONCURRENT_STREAMS`, `INITIAL_WINDOW_SIZE`, and `MAX_HEADER_LIST_SIZE`. Each browser uses different default values for these settings.

The order and priority of pseudo-headers (`:method`, `:authority`, `:scheme`, `:path`), the HPACK compression behavior, and stream priority weights also vary between browsers. Tools like [browserleaks.com/http2](https://browserleaks.com/http2) show what your HTTP/2 fingerprint looks like.

Automation frameworks and proxy software that implement their own HTTP/2 stacks often produce fingerprints that do not match any real browser, making this an effective detection vector.

### Latency-Based Detection

The network latency between a client and a server reveals information about the physical network path. If the IP geolocates to New York but the round-trip time suggests a path through Asia, the connection is likely proxied.

Detection systems measure RTT (round-trip time) during the TCP handshake and compare it against expected latencies for the IP's geographic location. They may also issue JavaScript-based timing challenges that measure latency from the browser's perspective, then compare this with the server-observed latency. A significant discrepancy between the two suggests an intermediary (proxy) in the path.

Clock skew analysis adds another dimension: by measuring the client's clock offset via JavaScript (`Date.now()`) or HTTP `Date` headers, detection systems can infer the client's actual timezone and compare it against the IP's expected timezone.

## Behavioral Detection

The most advanced detection systems go beyond network and protocol analysis to examine user behavior. This includes request timing (are requests evenly spaced, suggesting automation?), mouse movement patterns (analyzed via JavaScript event listeners), scrolling behavior, keyboard input cadence, and overall browsing patterns.

Machine learning models trained on millions of real user sessions can distinguish human behavior from automation with high accuracy. These models typically combine 50+ features including navigation patterns, session duration distribution, click positions, form interaction timing, and JavaScript execution characteristics.

Pydoll's humanized interactions (Bezier curve mouse movement, Fitts's Law timing, realistic typing) are designed specifically to pass behavioral analysis. See [Evasion Techniques](../fingerprinting/evasion-techniques.md) for the full multi-layer evasion strategy.

## Multi-Signal Risk Scoring

Modern detection systems do not rely on any single technique. They combine all available signals into a risk score, typically 0-100, and apply thresholds that vary by industry and context.

The weight of each signal category varies, but a rough approximation is that IP reputation accounts for the largest share (it is the cheapest and most reliable signal), followed by network fingerprinting (TCP/IP, TLS, HTTP/2), header and protocol analysis, behavioral scoring, and consistency checks (geolocation, timezone, language).

Thresholds depend on the business context. Banking sites block aggressively (risk score above 50), e-commerce sites present CAPTCHAs at moderate scores (above 70), and content sites tend to be more permissive (blocking only above 80) since they rely on ad impressions.

The implication for automation is that passing one layer of detection is not enough. A residential IP (good IP reputation) with a mismatched TCP fingerprint and robotic behavior will still be flagged. Effective evasion requires consistency across all layers.

## Detection by Proxy Type

| Proxy Type | Detection Difficulty | Primary Detection Methods |
|------------|----------------------|---------------------------|
| Transparent HTTP | Trivial | HTTP headers (`Via`, `X-Forwarded-For`) |
| Anonymous HTTP | Easy | HTTP headers + IP reputation |
| Elite HTTP (datacenter) | Medium | IP reputation (ASN analysis) |
| Datacenter SOCKS5 | Medium | IP reputation (ASN analysis) |
| Residential proxies | Difficult | Behavioral analysis, connection patterns, latency |
| Mobile proxies | Very difficult | Mostly behavioral, limited network signals |
| Rotating proxies | Difficult | Session inconsistencies, IP rotation patterns |

## Evasion Principles

Effective evasion is about consistency across all detection layers, not perfecting any single one.

Use residential or mobile IPs when stealth matters. They are harder to detect because the IPs genuinely belong to ISPs, and the cost premium reflects this advantage. Match the browser's geolocation signals (timezone, language, locale) to the proxy IP's location. Maintain session persistence by not rotating IPs mid-session, which creates detectable discontinuities. Ensure your TCP/IP fingerprint matches your User-Agent claim by running automation on the same OS you are impersonating. Use Pydoll's humanized interactions to pass behavioral analysis. And always test for leaks (WebRTC, DNS, timezone) before running automation at scale.

The goal is not to make detection impossible but to make it expensive and uncertain. Force the detection system to use multiple correlated signals, blend in with legitimate traffic patterns, and create plausible deniability.

!!! warning "No Proxy is Undetectable"
    With sufficient resources, any proxy can be detected. Even top-tier residential proxies achieve roughly 70-90% success rates against sophisticated anti-bot systems like Akamai, Cloudflare Enterprise, and DataDome. The practical question is whether detection is economically worthwhile for the target site.

**Next steps:**

- [Network Fingerprinting](../fingerprinting/network-fingerprinting.md): TCP/IP and TLS fingerprinting in detail
- [Browser Fingerprinting](../fingerprinting/browser-fingerprinting.md): Canvas, WebGL, HTTP/2 fingerprinting
- [Evasion Techniques](../fingerprinting/evasion-techniques.md): Multi-layer evasion strategy
- [Proxy Configuration](../../features/configuration/proxy.md): Practical Pydoll proxy setup

## References

- MaxMind GeoIP2: https://www.maxmind.com/en/geoip2-services-and-databases
- IPQualityScore Proxy Detection: https://www.ipqualityscore.com/proxy-vpn-tor-detection-service
- Spur.us (Anonymous IP Detection): https://spur.us/
- Team Cymru IP to ASN Mapping: https://www.team-cymru.com/ip-asn-mapping
- Salesforce Engineering: TLS Fingerprinting with JA3 and JA3S - https://engineering.salesforce.com/tls-fingerprinting-with-ja3-and-ja3s-247362855967/
- Akamai: Passive Fingerprinting of HTTP/2 Clients (Black Hat EU 2017) - https://blackhat.com/docs/eu-17/materials/eu-17-Shuster-Passive-Fingerprinting-Of-HTTP2-Clients-wp.pdf
- Incolumitas: TCP/IP Fingerprinting for VPN and Proxy Detection - https://incolumitas.com/2021/03/13/tcp-ip-fingerprinting-for-vpn-and-proxy-detection/
- Incolumitas: Detecting Proxies and VPNs with Latencies - https://incolumitas.com/2021/06/07/detecting-proxies-and-vpn-with-latencies/
- BrowserLeaks HTTP/2 Fingerprint: https://browserleaks.com/http2
- BrowserLeaks IP: https://browserleaks.com/ip
- RFC 7239: Forwarded HTTP Extension - https://www.rfc-editor.org/rfc/rfc7239.html
- RFC 9110: HTTP Semantics - https://www.rfc-editor.org/rfc/rfc9110.html


================================================
FILE: docs/en/deep-dive/network/proxy-legal.md
================================================
# Legal and Ethical Considerations

This document provides **general information** about the legal and ethical landscape of proxy usage and web automation. Laws vary widely by jurisdiction and use case. This is **not legal advice**. Always consult qualified legal counsel for your specific situation.

!!! info "Module Navigation"
    - **[← Building Proxies](./build-proxy.md)** - Implementation and advanced topics
    - **[← Proxy Detection](./proxy-detection.md)** - Anonymity and evasion
    - **[← Network & Security Overview](./index.md)** - Module introduction
    
    For responsible automation, see **[Behavioral Captcha Bypass](../../features/advanced/behavioral-captcha-bypass.md)** and **[Human-Like Interactions](../../features/automation/human-interactions.md)**.

!!! danger "Legal Disclaimer"
    This document provides **educational information only**. It is **not legal advice**. Laws regarding web scraping, automation, and proxy usage vary by jurisdiction and are subject to interpretation. Consult qualified legal counsel before engaging in activities that may have legal implications.

## Legal and Ethical Considerations

Proxy usage sits at the intersection of privacy, security, and compliance. Understanding the legal landscape is essential for responsible automation.

### Regulatory Compliance

Different jurisdictions have varying rules regarding proxy usage and data collection:

| Region | Key Regulation | Proxy Implications |
|--------|----------------|-------------------|
| **European Union** | GDPR | IP addresses are personal data; proxy exit nodes in EU must comply |
| **United States** | CFAA, State Laws | Circumventing access controls may violate computer fraud laws |
| **China** | Cybersecurity Law | VPN/proxy usage heavily regulated; only approved services permitted |
| **Russia** | VPN Law | VPN providers must register and log user activity |
| **Australia** | Privacy Act | Data collection through proxies subject to privacy principles |

**GDPR-specific considerations:**

**IP addresses as personal data (Article 4):**

When scraping EU-based websites through proxies:

- Your proxy's EU IP is considered personal data
- Websites must handle it per GDPR requirements  
- You must have a lawful basis for data collection
- Data minimization principle applies

**Lawful bases for processing (Article 6):**

1. **Consent** - Hard to obtain for scraping
2. **Contract** - Legitimate if you're a customer
3. **Legal obligation** - Rare for scraping use cases
4. **Vital interests** - Not applicable to scraping
5. **Public task** - Not applicable to scraping
6. **Legitimate interests** - Most applicable for scraping (balance test required)

### Terms of Service and Access Restrictions

Proxies don't exempt you from website ToS:

**Common ToS violations:**

1. **Automated Access**: Many sites prohibit bots/scrapers regardless of IP
2. **Rate Limiting Circumvention**: Using rotating proxies to bypass rate limits
3. **Geographic Restrictions**: Bypassing geo-blocks may violate content licensing agreements
4. **Account Sharing**: Using proxies to mask multiple users as one

**Legal precedent examples:**

```python
# Notable cases (simplified, not legal advice)
cases = {
    'hiQ Labs v. LinkedIn (2022)': {
        'issue': 'Scraping public data after access revoked',
        'outcome': 'Scraping publicly available data generally permitted',
        'caveat': 'But circumventing technological barriers may violate CFAA'
    },
    
    'QVC v. Resultly (2016)': {
        'issue': 'Aggressive scraping causing server load',
        'outcome': 'Preliminary injunction denied; court found no intent to cause damage under the CFAA',
        'implication': 'Volume and impact matter, not just technical access'
    }
}
```

### Ethical Guidelines for Proxy Usage

Beyond legal compliance, consider these ethical principles:

**1. Respect robots.txt**
```python
# Even with proxies, honor site guidelines
async def ethical_scraping(url):
    # Check robots.txt regardless of proxy anonymity
    if not is_allowed_by_robots(url):
        return None  # Respect the site's wishes
```

**2. Rate Limiting**
```python
# Don't abuse proxy rotation to overwhelm servers
MINIMUM_DELAY = 1.0  # seconds between requests
MAX_CONCURRENT = 5   # concurrent connections per site

# Bad: Rotating proxies to scrape at 1000 req/sec
# Good: Respectful scraping even with proxy rotation
```

**3. Transparency**
```python
# Identify yourself in User-Agent when appropriate
headers = {
    'User-Agent': 'MyBot/1.0 (contact@example.com)',  # Honest identification
    # Not: 'Mozilla/5.0...'  # Deceptive when not a browser
}
```

**4. Data Minimization**
```python
# Collect only what you need
# Just because you can scrape everything doesn't mean you should
data_to_collect = {
    'product_name': True,
    'price': True,
    'user_emails': False,      # PII - don't collect unless necessary
    'user_addresses': False,   # PII - privacy concerns
}
```

### Compliance Checklist

Before deploying proxy-based automation:

- [ ] **Legal Review**: Consult legal counsel for your jurisdiction
- [ ] **ToS Compliance**: Review target website terms of service
- [ ] **Data Protection**: Ensure GDPR/CCPA compliance if handling personal data
- [ ] **Access Rights**: Verify you have permission to access the data
- [ ] **Rate Limiting**: Implement respectful request rates
- [ ] **Error Handling**: Handle 429 (Too Many Requests) appropriately
- [ ] **Logging**: Maintain audit trails for compliance purposes
- [ ] **Data Retention**: Implement appropriate data retention/deletion policies
- [ ] **Security**: Protect collected data with appropriate measures
- [ ] **Transparency**: Be honest about your scraping activities when questioned

!!! warning "This is Not Legal Advice"
    This section provides general information only. Proxy usage legality varies by jurisdiction, context, and specific circumstances. Always consult qualified legal counsel for your specific situation.

!!! tip "Responsible Proxy Usage"
    The most defensible proxy usage is:
    
    - **Transparent**: You can explain why you're doing it
    - **Necessary**: You have a legitimate reason (research, monitoring, etc.)
    - **Proportional**: Your methods match your needs (not excessive)
    - **Documented**: You keep records of your activities
    - **Compliant**: You follow all applicable laws and ToS

### When to Avoid Proxies

Some scenarios where proxy usage is problematic:

| Scenario | Risk | Alternative |
|----------|------|-------------|
| **Banking/Financial Sites** | Fraud detection, account suspension | Use legitimate access only |
| **Government Portals** | Legal penalties, security investigations | Direct access from authorized locations |
| **Healthcare Data** | HIPAA violations, severe penalties | Use authorized API access |
| **Internal Corporate Systems** | Policy violations, termination | Follow company IT policies |
| **E-commerce Account Creation** | Fraud flags, permanent bans | Use single, verified identity |

## Conclusion

Understanding proxy architecture deeply enables you to:

**Make Informed Decisions:**

- Choose the right proxy type for your use case
- Understand security implications
- Identify when proxies are necessary vs optional

**Troubleshoot Effectively:**

- Debug connection issues
- Identify DNS leaks or IP leakage
- Diagnose performance problems

**Optimize Performance:**

- Configure appropriate timeouts
- Implement connection pooling
- Monitor proxy health

**Build Better Automation:**

- Combine proxies with anti-detection techniques
- Implement robust error handling
- Scale proxy usage efficiently

The proxy landscape is complex, but with this foundation, you're equipped to navigate it successfully.

## Further Reading

- **[RFC 1928](https://tools.ietf.org/html/rfc1928)**: SOCKS5 Protocol specification
- **[RFC 1929](https://tools.ietf.org/html/rfc1929)**: SOCKS5 Username/Password Authentication
- **[RFC 9110](https://www.rfc-editor.org/rfc/rfc9110.html)**: HTTP Semantics, including the CONNECT method (supersedes RFC 2616 and RFC 7231)
- **[RFC 5389](https://tools.ietf.org/html/rfc5389)**: STUN Protocol
- **[RFC 9298](https://tools.ietf.org/html/rfc9298)**: CONNECT-UDP (HTTP/3 proxying)
- **[Proxy Configuration Guide](../../features/configuration/proxy.md)**: Practical Pydoll proxy usage, authentication, rotation, and testing
- **[Request Interception](../../features/network/interception.md)**: How Pydoll implements proxy authentication internally
- **[Network Capabilities Deep Dive](./network-capabilities.md)**: How Pydoll handles network operations

!!! tip "Experimentation"
    The best way to truly understand proxies is to:
    
    1. Set up your own proxy server (see [Building Proxies](./build-proxy.md) for a reference implementation)
    2. Capture traffic with Wireshark to see raw packets
    3. Test different proxy types with real automation
    4. Intentionally create leaks and learn to detect them
    
    Hands-on experience solidifies theoretical knowledge!


================================================
FILE: docs/en/deep-dive/network/socks-proxies.md
================================================
# SOCKS Protocol Architecture

SOCKS (SOCKet Secure) is a proxying protocol that operates between the transport and application layers of the network stack (commonly described as Layer 5 in the OSI model). Unlike HTTP proxies, which parse and understand HTTP traffic, SOCKS proxies forward raw TCP and UDP connections without inspecting their content. This protocol-agnostic design makes SOCKS the preferred choice for privacy-focused automation: the proxy never needs to parse your requests, inject headers, or terminate TLS connections.

This document covers how SOCKS works at the protocol level, the differences between SOCKS4 and SOCKS5, authentication handling in Chrome, DNS resolution behavior, and practical configuration in Pydoll.

!!! info "Module Navigation"
    - [HTTP/HTTPS Proxies](./http-proxies.md): Application-layer proxying
    - [Network Fundamentals](./network-fundamentals.md): TCP/IP, UDP, OSI model
    - [Network & Security Overview](./index.md): Module introduction
    - [Proxy Detection](./proxy-detection.md): Anonymity levels and detection evasion
    - [Building Proxies](./build-proxy.md): SOCKS5 implementation from scratch

    For practical configuration, see [Proxy Configuration](../../features/configuration/proxy.md).

## How SOCKS Differs from HTTP Proxies

The fundamental difference lies in what each proxy can see and do. An HTTP proxy operates at the application layer and understands HTTP: it can read URLs, headers, cookies, and request bodies (for unencrypted traffic), modify them in transit, cache responses, and inject its own headers like `Via` and `X-Forwarded-For`. This is powerful for content filtering but means you must trust the proxy operator with your application data.

A SOCKS proxy operates below the application layer. It sees only the destination address, port, and the volume of data being transferred. It does not parse, modify, or even understand what protocol is flowing through it. HTTP, HTTPS, FTP, SSH, WebSocket, or any custom protocol all look the same to a SOCKS proxy: just bytes being relayed between two endpoints.

This has a direct practical implication. When you send an HTTPS request through a SOCKS5 proxy, the proxy sees `example.com:443` and the encrypted TLS stream. It cannot read the URL, headers, cookies, or response content. It does not add identifying headers. It does not need to terminate TLS. The encrypted tunnel runs end-to-end between your browser and the target server.

However, it is important to understand what SOCKS does not provide. SOCKS is a proxying protocol, not an encryption protocol. The name "SOCKet Secure" refers to secure firewall traversal, not cryptographic security. If you send unencrypted HTTP traffic through a SOCKS5 proxy, the proxy operator can read the bytes passing through, even though the proxy is not designed to inspect them. For actual encryption, you need TLS/HTTPS on top of SOCKS, or an encrypted tunnel (SSH, VPN) wrapping the SOCKS connection.

!!! note "Trust Model"
    With HTTP proxies, you trust the proxy operator not to log your browsing history, steal tokens, modify responses, or perform MITM attacks. With SOCKS5, you trust the proxy only to forward packets correctly and not log connection metadata. The attack surface is smaller, but it is not zero.

## SOCKS4 vs SOCKS5

SOCKS has two versions in common use. SOCKS4 was developed by NEC in the early 1990s as an informal standard with no RFC. SOCKS5 was standardized as RFC 1928 in 1996 to address SOCKS4's limitations.

| Feature | SOCKS4 | SOCKS5 |
|---------|--------|--------|
| Standard | No official RFC (de facto, 1992) | RFC 1928 (1996) |
| Authentication | Identification only (USERID field, no password) | Multiple methods (none, username/password, GSSAPI) |
| IP version | IPv4 only | IPv4 and IPv6 |
| UDP support | No | Yes (UDP ASSOCIATE command) |
| DNS resolution | Client-side (SOCKS4A extension adds server-side) | Server-side when using domain names (ATYP=0x03) |
| Protocol support | TCP only | TCP and UDP |

SOCKS5 is superior in every practical way. Use SOCKS4 only if the proxy does not support SOCKS5.

## The SOCKS5 Handshake

The SOCKS5 connection process follows RFC 1928 and consists of three phases: method negotiation, optional authentication, and the connection request.

```mermaid
sequenceDiagram
    participant Client
    participant SOCKS5 as SOCKS5 Proxy
    participant Server as Target Server

    Note over Client,SOCKS5: Phase 1: Method Negotiation
    Client->>SOCKS5: Hello [VER=5, NMETHODS, METHODS]
    SOCKS5->>Client: Method Selected [VER=5, METHOD]

    Note over Client,SOCKS5: Phase 2: Authentication (if required)
    Client->>SOCKS5: Auth Request [VER=1, ULEN, UNAME, PLEN, PASSWD]
    SOCKS5->>Client: Auth Response [VER=1, STATUS]

    Note over Client,SOCKS5: Phase 3: Connection Request
    Client->>SOCKS5: Connect [VER=5, CMD=CONNECT, DST.ADDR, DST.PORT]
    SOCKS5->>Server: Establish TCP connection
    Server-->>SOCKS5: Connection established
    SOCKS5->>Client: Reply [VER=5, REP=SUCCESS, BND.ADDR, BND.PORT]

    Note over Client,Server: Data relay (proxied)
    Client->>SOCKS5: Application data
    SOCKS5->>Server: Forward data
    Server->>SOCKS5: Response data
    SOCKS5->>Client: Forward response
```

### Phase 1: Method Negotiation

The client opens a TCP connection to the proxy and sends a greeting containing the protocol version (always `0x05` for SOCKS5) and a list of authentication methods it supports.

```python
# Client Hello
[
    0x05,        # VER: Protocol version (5)
    0x02,        # NMETHODS: Number of methods offered
    0x00, 0x02   # METHODS: No auth (0x00) and Username/Password (0x02)
]
```

The proxy responds with the method it selects. If the proxy requires authentication and the client offered `0x02` (username/password), the proxy selects it. If no acceptable method was offered, the proxy responds with `0xFF` and closes the connection.

```python
# Server response
[
    0x05,   # VER: Protocol version (5)
    0x02    # METHOD: Username/Password selected
]
```

Method codes defined by RFC 1928: `0x00` = no authentication, `0x01` = GSSAPI, `0x02` = username/password (RFC 1929), `0x03-0x7F` = IANA assigned, `0x80-0xFE` = reserved for private methods, `0xFF` = no acceptable methods.

### Phase 2: Authentication

If the proxy selected method `0x02`, the client sends credentials following RFC 1929. The subnegotiation uses its own version number (`0x01`, not `0x05`).

```python
# Client authentication
[
    0x01,              # VER: Subnegotiation version (1)
    len(username),     # ULEN: Username length (max 255)
    *username_bytes,   # UNAME: Username
    len(password),     # PLEN: Password length (max 255)
    *password_bytes    # PASSWD: Password
]

# Server response
[
    0x01,   # VER: Subnegotiation version (1)
    0x00    # STATUS: 0 = success, non-zero = failure
]
```

Credentials are transmitted in plaintext during this handshake. This is inherent to the SOCKS5 protocol (RFC 1929). For sensitive environments, wrap the SOCKS connection in an SSH tunnel or VPN.

### Phase 3: Connection Request

After authentication succeeds (or if no authentication was required), the client sends a connection request specifying the command, destination address, and port.

```python
[
    0x05,          # VER: Protocol version (5)
    0x01,          # CMD: 1=CONNECT, 2=BIND, 3=UDP ASSOCIATE
    0x00,          # RSV: Reserved
    0x03,          # ATYP: 1=IPv4 (4 bytes), 3=Domain (length+name), 4=IPv6 (16 bytes)
    len(domain),   # Domain length (only for ATYP=0x03)
    *domain_bytes, # Domain name
    *port_bytes    # Port (2 bytes, big-endian)
]
```

The address type (ATYP) determines the format: `0x01` means 4 bytes of IPv4 address follow, `0x04` means 16 bytes of IPv6, and `0x03` means a length byte followed by the domain name. When the client sends a domain name (ATYP=0x03), the proxy resolves DNS on its side, which prevents DNS leaks to the client's local network.

The proxy connects to the destination and responds with a reply:

```python
[
    0x05,       # VER: Protocol version (5)
    0x00,       # REP: 0x00=success, 0x01-0x08=various errors
    0x00,       # RSV: Reserved
    0x01,       # ATYP: Address type of bound address
    *bind_addr, # BND.ADDR: Address the proxy bound to
    *bind_port  # BND.PORT: Port the proxy bound to
]
```

Reply codes: `0x00` succeeded, `0x01` general failure, `0x02` connection not allowed, `0x03` network unreachable, `0x04` host unreachable, `0x05` connection refused, `0x06` TTL expired, `0x07` command not supported, `0x08` address type not supported.

After a successful reply, the proxy begins relaying data bidirectionally. The entire SOCKS5 handshake is a binary protocol, making it more efficient than text-based HTTP but harder to debug without hex dumps.

## UDP Support

SOCKS5 supports UDP proxying through the `UDP ASSOCIATE` command (CMD=0x03). This works differently from TCP proxying: the client sends a UDP ASSOCIATE request over the TCP control connection, and the proxy responds with a relay address and port. The client then sends UDP datagrams to this relay, and the proxy forwards them to their destinations.

```mermaid
sequenceDiagram
    participant Client
    participant SOCKS5
    participant UDP_Server as UDP Server

    Note over Client,SOCKS5: TCP control connection (handshake + auth)
    Client->>SOCKS5: UDP ASSOCIATE request (CMD=0x03)
    SOCKS5->>Client: Relay address and port

    Note over Client,SOCKS5: UDP data transfer
    Client->>SOCKS5: UDP datagram to relay
    SOCKS5->>UDP_Server: Forward datagram
    UDP_Server->>SOCKS5: Response datagram
    SOCKS5->>Client: Forward response

    Note over Client,SOCKS5: TCP control connection stays open
```

Each UDP datagram sent through the relay includes a small header with the destination address and port:

```python
[
    0x00, 0x00,    # RSV: Reserved
    0x00,          # FRAG: Fragment number (0 = no fragmentation)
    0x01,          # ATYP: Address type
    *dst_addr,     # DST.ADDR: Destination address
    *dst_port,     # DST.PORT: Destination port
    *data          # DATA: Application data
]
```

The TCP control connection must remain open for the duration of the UDP association. If it closes, the proxy drops the UDP relay.

!!! warning "UDP in Chrome"
    Chrome does not use SOCKS5 UDP ASSOCIATE for any traffic. Even when configured with a SOCKS5 proxy, Chrome only proxies TCP connections. WebRTC, DNS-over-UDP, and other UDP traffic are not routed through the SOCKS5 proxy. This means WebRTC IP leaks are still possible with SOCKS5 in Chrome. Use `--force-webrtc-ip-handling-policy=disable_non_proxied_udp` or Pydoll's `webrtc_leak_protection = True` to mitigate this. For more details, see [Network Fundamentals: WebRTC and IP Leakage](./network-fundamentals.md#webrtc-and-ip-leakage).

!!! tip "Modern UDP Proxying Alternatives"
    For scenarios requiring full UDP support beyond what Chrome's SOCKS5 implementation provides, consider Shadowsocks (encrypted SOCKS-like protocol with native UDP), WireGuard (VPN with excellent performance), or V2Ray/VMess (flexible proxy framework with comprehensive UDP handling).

## DNS Resolution

A common misconception is that HTTP proxies leak DNS queries while SOCKS5 proxies do not. The reality in Chrome is more nuanced.

When Chrome is configured with any proxy (HTTP, HTTPS, or SOCKS5), it sends hostnames to the proxy rather than resolving DNS locally. For HTTP proxies, the hostname appears in the `CONNECT host:443` request. For SOCKS5, it appears in the connection request with ATYP=0x03 (domain name). In both cases, the proxy resolves DNS on its side, and Chrome does not make local DNS queries for proxied traffic.

The real DNS privacy difference between the two proxy types is not who resolves DNS, but what the proxy sees at the application layer. An HTTP proxy sees the full URL for unencrypted requests and the hostname for CONNECT requests. A SOCKS5 proxy sees only the destination hostname and port as opaque connection parameters.

However, there is an important caveat: Chrome's DNS prefetcher can make local DNS queries for hostnames found in page content, even when a proxy is configured. This can leak the domains you are browsing to your local DNS resolver. To prevent this, disable DNS prefetching or use the flag `--host-resolver-rules="MAP * ~NOTFOUND , EXCLUDE 127.0.0.1"`.

!!! note "`socks5://` vs `socks5h://`"
    Many tools outside Chrome distinguish between `socks5://` (client resolves DNS) and `socks5h://` (proxy resolves DNS, the "h" stands for hostname). Chrome always resolves DNS proxy-side for SOCKS5, behaving like `socks5h://` regardless of which scheme you use. But if you use tools like `curl`, Firefox, or Python libraries alongside Pydoll, the distinction matters: always use `socks5h://` to prevent DNS leaks.

## SOCKS5 and MITM Resistance

SOCKS5 is often described as "MITM-resistant." This is true in a specific sense: because SOCKS5 does not understand or interact with TLS, it has no mechanism to terminate a TLS connection and re-encrypt it. A SOCKS5 proxy simply relays encrypted bytes without modification.

An HTTP proxy, by contrast, can perform TLS termination (MITM) by presenting its own certificate to the client, decrypting the traffic, inspecting or modifying it, and re-encrypting it toward the server. This requires the client to trust the proxy's CA certificate, and it is detectable through certificate pinning and Certificate Transparency logs. The normal behavior of an HTTP proxy with HTTPS (using CONNECT) is to create a transparent tunnel without termination, but the architectural possibility of MITM exists.

With SOCKS5, TLS termination is not possible at the protocol level. The proxy cannot inject itself into the TLS handshake because it does not parse the application data flowing through it. The end-to-end encryption between client and server is preserved by design.

It is worth noting that TLS is what provides the actual cryptographic protection, not SOCKS5 itself. If you send unencrypted HTTP through a SOCKS5 proxy, the proxy operator can read everything. The security advantage of SOCKS5 is architectural (it does not require or enable TLS termination), not cryptographic.

## TLS and Browser Fingerprinting Through SOCKS5

An important limitation to understand: SOCKS5 does not change your browser's fingerprint. The TLS handshake (ClientHello) passes through the SOCKS5 proxy byte-for-byte, which means the target server sees your browser's exact JA3/JA4 fingerprint. The same applies to HTTP/2 SETTINGS frames, browser-specific header ordering, and all other application-layer fingerprinting signals.

SOCKS5 hides your IP address and prevents the proxy from injecting identifying headers. It does not help with any form of browser or behavioral fingerprinting. For a complete evasion strategy, you need to address fingerprinting at multiple layers. See [Evasion Techniques](../fingerprinting/evasion-techniques.md) for details.

## SOCKS5 Authentication in Chrome

Chrome does not support SOCKS5 username/password authentication. This is a longstanding limitation tracked as [Chromium Issue #40323993](https://issues.chromium.org/issues/40323993). When Chrome performs the SOCKS5 method negotiation, it only offers method `0x00` (no authentication). If the proxy requires authentication, the connection fails silently.

This is fundamentally different from HTTP proxy authentication. HTTP proxies authenticate via HTTP status codes (`407 Proxy Authentication Required`), which Chrome handles through the Fetch domain in CDP. Pydoll intercepts these `Fetch.authRequired` events and responds with stored credentials automatically. SOCKS5 authentication, on the other hand, happens during a binary protocol handshake at the session layer, before any HTTP traffic exists. There is no HTTP 407, no `Fetch.authRequired` event, and no way for CDP-based tools to inject credentials into this process.

Configuring `--proxy-server=socks5://user:pass@proxy:1080` does not work. Chrome silently ignores the embedded credentials.

### Pydoll's SOCKS5Forwarder

The standard solution is a local proxy forwarder: a lightweight SOCKS5 server running on localhost that accepts unauthenticated connections from Chrome and forwards them to the remote proxy with full authentication.

```mermaid
sequenceDiagram
    participant Chrome
    participant Forwarder as Local Forwarder<br/>(127.0.0.1:1081)
    participant Remote as Remote SOCKS5 Proxy<br/>(proxy:1080)
    participant Server as Destination Server

    Note over Chrome,Forwarder: No authentication
    Chrome->>Forwarder: SOCKS5 Hello [methods: 0x00]
    Forwarder->>Chrome: Method selected [0x00]
    Chrome->>Forwarder: CONNECT example.com:443

    Note over Forwarder,Remote: With authentication
    Forwarder->>Remote: SOCKS5 Hello [methods: 0x02]
    Remote->>Forwarder: Method selected [0x02]
    Forwarder->>Remote: Auth [username, password]
    Remote->>Forwarder: Auth OK
    Forwarder->>Remote: CONNECT example.com:443
    Remote->>Server: TCP connection
    Remote->>Forwarder: Connect OK

    Forwarder->>Chrome: Connect OK

    Note over Chrome,Server: Bidirectional data relay
    Chrome->>Forwarder: TLS + application data
    Forwarder->>Remote: Forward
    Remote->>Server: Forward
    Server->>Remote: Response
    Remote->>Forwarder: Forward
    Forwarder->>Chrome: Forward
```

Pydoll provides a built-in `SOCKS5Forwarder` in the `pydoll.utils` module. It is a pure-Python, zero-dependency async implementation that handles the full SOCKS5 handshake with the remote proxy, including username/password authentication (RFC 1929), IPv4, IPv6, and domain address types.

```python
import asyncio
from pydoll.utils import SOCKS5Forwarder
from pydoll.browser.chromium import Chrome
from pydoll.browser.options import ChromiumOptions

async def main():
    forwarder = SOCKS5Forwarder(
        remote_host='proxy.example.com',
        remote_port=1080,
        username='myuser',
        password='mypass',
        local_port=1081,  # Use 0 for auto-assigned port
    )
    async with forwarder:
        options = ChromiumOptions()
        options.add_argument(f'--proxy-server=socks5://127.0.0.1:{forwarder.local_port}')

        async with Chrome(options=options) as browser:
            tab = await browser.start()
            await tab.go_to('https://httpbin.org/ip')

asyncio.run(main())
```

The forwarder can also run as a standalone CLI tool for testing or use with other applications:

```bash
python -m pydoll.utils.socks5_proxy_forwarder \
    --remote-host proxy.example.com \
    --remote-port 1080 \
    --username myuser \
    --password mypass \
    --local-port 1081
```

The forwarder binds to `127.0.0.1` by default, making it accessible only from your machine. Never bind to `0.0.0.0` in production, as this would expose an unauthenticated SOCKS5 proxy to the network. Credentials are never logged in plaintext. The forwarder adds sub-millisecond latency since all communication happens over the local loopback interface.

!!! tip "Restricted Environments"
    Some environments (Docker containers, serverless platforms, hardened VMs) may restrict binding to local ports. Use `local_port=0` to let the OS assign an available port. If local binding is completely blocked, consider using an HTTP CONNECT proxy instead, which Chrome supports natively with authentication via Pydoll's ProxyManager.

## Practical Configuration

**Basic SOCKS5 (no authentication):**

```python
from pydoll.browser.chromium import Chrome
from pydoll.browser.options import ChromiumOptions

options = ChromiumOptions()
options.add_argument('--proxy-server=socks5://proxy.example.com:1080')

async with Chrome(options=options) as browser:
    tab = await browser.start()
    await tab.go_to('https://example.com')
```

**SOCKS5 with authentication (via SOCKS5Forwarder):**

See the [SOCKS5Forwarder section](#pydolls-socks5forwarder) above.

**Preventing leaks:**

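For a complete SOCKS5 setup, you should also prevent WebRTC leaks and disable QUIC, which runs over UDP and is therefore not carried by the SOCKS5 proxy in Chrome. To prevent DNS prefetch leaks as well, see the flag described in [DNS Resolution](#dns-resolution).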

```python
options = ChromiumOptions()
options.add_argument('--proxy-server=socks5://proxy.example.com:1080')
options.webrtc_leak_protection = True  # Prevents WebRTC IP leaks
options.add_argument('--disable-quic')  # Forces HTTP/2 over TCP through proxy
```

**Testing your setup:**

Always verify your proxy configuration with leak tests. Visit [browserleaks.com/ip](https://browserleaks.com/ip) to confirm your IP, [browserleaks.com/webrtc](https://browserleaks.com/webrtc) to check for WebRTC leaks, and [dnsleaktest.com](https://dnsleaktest.com/) to verify DNS is not leaking.

## Summary

SOCKS5 provides protocol-agnostic proxying with a smaller trust surface than HTTP proxies. It does not parse, modify, or inject anything into your traffic. DNS resolution happens proxy-side in Chrome. TLS encryption is preserved end-to-end. The main limitations in Chrome are the lack of native SOCKS5 authentication (solved by Pydoll's `SOCKS5Forwarder`) and the absence of UDP proxying (mitigated by disabling WebRTC or using the appropriate browser flags).

SOCKS5 does not change your browser's TLS fingerprint, HTTP/2 settings, or any application-layer characteristics. For complete evasion, combine SOCKS5 with browser fingerprint management and behavioral simulation.

**Next steps:**

- [Proxy Detection](./proxy-detection.md): How even SOCKS5 proxies can be detected
- [Building Proxies](./build-proxy.md): Implement your own SOCKS5 server
- [Proxy Configuration](../../features/configuration/proxy.md): Practical Pydoll proxy setup
- [Evasion Techniques](../fingerprinting/evasion-techniques.md): Multi-layer evasion strategy

## References

- RFC 1928: SOCKS Protocol Version 5 (1996) - https://datatracker.ietf.org/doc/html/rfc1928
- RFC 1929: Username/Password Authentication for SOCKS V5 (1996) - https://datatracker.ietf.org/doc/html/rfc1929
- RFC 1961: GSS-API Authentication Method for SOCKS V5 (1996) - https://datatracker.ietf.org/doc/html/rfc1961
- RFC 3089: SOCKS-based IPv6/IPv4 Gateway Mechanism (2001) - https://datatracker.ietf.org/doc/html/rfc3089
- Chromium Proxy Documentation - https://chromium.googlesource.com/chromium/src/+/689912289c/net/docs/proxy.md
- Chromium Issue #40323993: SOCKS5 Authentication - https://issues.chromium.org/issues/40323993
- BrowserLeaks: WebRTC Leak Test - https://browserleaks.com/webrtc
- DNS Leak Test - https://dnsleaktest.com/
- IPLeak: Comprehensive Leak Testing - https://ipleak.net


================================================
FILE: docs/en/features/advanced/behavioral-captcha-bypass.md
================================================
# Cloudflare Turnstile Interaction

Pydoll provides native support for interacting with Cloudflare Turnstile captchas by performing realistic browser clicks. This is **not a bypass or circumvention**. It simply automates the same click action a human would perform on the captcha checkbox.

!!! warning "What This Feature Actually Does"
    This feature **clicks** on the Cloudflare Turnstile captcha checkbox using standard browser interactions. That's it:
    
    - **NO**: Magic bypass or circumvention
    - **NO**: Challenge solving (image selection, puzzles, etc.)
    - **NO**: Score manipulation or fingerprint spoofing
    - **YES**: Just a realistic click on the captcha container
    
    **Success depends entirely on your environment** (IP reputation, browser fingerprint, behavior patterns). Pydoll provides the mechanism to click; your environment determines if the click is accepted.

!!! info "What Is Cloudflare Turnstile?"
    Cloudflare Turnstile is a modern captcha system that analyzes browser environment and behavioral signals to determine if you're human. It typically shows as a checkbox that users must click. The system analyzes:
    
    - **IP reputation**: Is your IP address flagged or suspicious?
    - **Browser fingerprint**: Does your browser look legitimate?
    - **Behavioral patterns**: Do you behave like a human?
    
    When the trust score is high enough, the checkbox click is accepted. When it's too low, Turnstile may show a challenge (which Pydoll **cannot solve**) or block you entirely. For image or puzzle challenges, consider using **[CapSolver](https://dashboard.capsolver.com/passport/register?inviteCode=WPhTbOsbXEpc)**.

## Quick Start

### Context Manager (Recommended)

The context manager waits for the captcha to appear, clicks it, and waits for resolution before continuing:

```python
import asyncio
from pydoll.browser.chromium import Chrome
from pydoll.browser.options import ChromiumOptions

async def turnstile_example():
    options = ChromiumOptions()
    options.add_argument('--disable-blink-features=AutomationControlled')
    
    async with Chrome(options=options) as browser:
        tab = await browser.start()
        
        # Context manager handles captcha automatically
        async with tab.expect_and_bypass_cloudflare_captcha():
            await tab.go_to('https://site-with-turnstile.com')
        
        # This code only runs after captcha is clicked
        print("Turnstile captcha interaction complete!")
        
        # Continue with your automation
        content = await tab.find(id='protected-content')
        print(await content.text)

asyncio.run(turnstile_example())
```

### Background Processing

Enable automatic captcha clicking in the background:

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def background_turnstile():
    async with Chrome() as browser:
        tab = await browser.start()
        
        # Enable automatic clicking before navigating
        await tab.enable_auto_solve_cloudflare_captcha()
        
        # Navigate to protected site
        await tab.go_to('https://site-with-turnstile.com')
        
        # Wait for captcha to be processed in background
        await asyncio.sleep(5)
        
        print("Page loaded with background captcha handling")
        
        # Disable when no longer needed
        await tab.disable_auto_solve_cloudflare_captcha()

asyncio.run(background_turnstile())
```

## Customizing Captcha Interaction

### How It Works

Pydoll automatically detects Cloudflare Turnstile by traversing the page's shadow DOM. It looks for a shadow root containing `challenges.cloudflare.com`, navigates into its cross-origin iframe, finds the inner shadow root, and clicks the actual checkbox element. No manual selector configuration is needed.

### Timing Configuration

The captcha shadow root doesn't always appear immediately. Adjust the timeout to match the site's behavior:

```python
async def timing_configuration_example():
    async with Chrome() as browser:
        tab = await browser.start()

        async with tab.expect_and_bypass_cloudflare_captcha(
            time_to_wait_captcha=10   # Wait up to 10 seconds for captcha to appear (default: 5)
        ):
            await tab.go_to('https://site-with-slow-turnstile.com')

        print("Captcha interaction complete with custom timing!")

asyncio.run(timing_configuration_example())
```

**Parameter Reference:**

| Parameter | Type | Default | Description |
|-----------|------|---------|-------------|
| `time_to_wait_captcha` | `float` | `5` | Maximum seconds to wait for captcha to appear |

!!! info "Why Timing Matters"
    Some sites load the captcha asynchronously. If the Cloudflare shadow root doesn't appear within `time_to_wait_captcha`, the interaction is skipped.

## Other Captcha Systems

### reCAPTCHA v3 (Invisible)

reCAPTCHA v3 is **completely invisible** and requires **no interaction**. Just navigate normally:

```python
async def recaptcha_v3_example():
    options = ChromiumOptions()
    options.add_argument('--disable-blink-features=AutomationControlled')
    
    async with Chrome(options=options) as browser:
        tab = await browser.start()
        
        # No special handling needed - just navigate
        await tab.go_to('https://site-with-recaptcha-v3.com')
        
        # reCAPTCHA v3 runs in background, analyzing your behavior
        await asyncio.sleep(3)
        
        # Continue with form submission
        submit_button = await tab.find(id='submit-btn')
        await submit_button.click()

asyncio.run(recaptcha_v3_example())
```

!!! note "reCAPTCHA v3 Success Factors"
    Since reCAPTCHA v3 is entirely passive (no interaction), success depends on:
    
    - **IP reputation**: Use residential proxies with good reputation
    - **Browser fingerprint**: Configure realistic browser preferences
    - **Behavioral patterns**: Spend time on page, scroll naturally, type realistically
    
    If your score is too low, some sites may show a reCAPTCHA v2 challenge (which Pydoll **cannot solve**).

## What Determines Success?

The success of captcha interaction depends **entirely on your environment**, not on Pydoll. The captcha system analyzes:

### 1. IP Reputation (Most Critical)

| IP Type | Trust Level | Expected Behavior |
|---------|-------------|-------------------|
| **Residential IP (clean)** | High | Generally accepted without challenges |
| **Mobile IP** | High | Generally accepted without challenges |
| **Datacenter IP** | Low | Often blocked or challenged |
| **Previously blocked IP** | Very Low | Almost always blocked or challenged |

!!! danger "IP Reputation is Everything"
    **No tool can overcome a bad IP address.** If your IP is flagged, you will be blocked or challenged regardless of how realistic your browser looks.
    
    Use residential proxies with good reputation for best results.

### 2. Browser Fingerprint

Configure your browser to look legitimate:

```python
import asyncio
import time
from pydoll.browser.chromium import Chrome
from pydoll.browser.options import ChromiumOptions

async def stealth_configuration():
    options = ChromiumOptions()
    
    # Stealth arguments
    options.add_argument('--disable-blink-features=AutomationControlled')
    options.add_argument('--window-size=1920,1080')
    
    # Realistic browser preferences
    current_time = int(time.time())
    options.browser_preferences = {
        'profile': {
            'last_engagement_time': str(current_time - (3 * 60 * 60)),  # 3 hours ago
            'exited_cleanly': True,
            'exit_type': 'Normal',
        },
        'safebrowsing': {'enabled': True},
    }
    
    async with Chrome(options=options) as browser:
        tab = await browser.start()
        
        async with tab.expect_and_bypass_cloudflare_captcha():
            await tab.go_to('https://site-with-turnstile.com')

asyncio.run(stealth_configuration())
```

### 3. Behavioral Patterns

Captcha systems analyze how you interact with the page:

```python
async def realistic_behavior():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://site-with-turnstile.com')
        
        # Simulate human behavior before captcha appears
        await asyncio.sleep(2)  # Read page content
        await tab.execute_script('window.scrollBy(0, 300)')  # Scroll
        await asyncio.sleep(1)
        
        # Now interact with captcha
        async with tab.expect_and_bypass_cloudflare_captcha():
            # The captcha interaction happens here
            pass
        
        print("Captcha passed with realistic behavior!")

asyncio.run(realistic_behavior())
```

!!! tip "Behavioral Fingerprinting"
    For in-depth understanding of how behavioral patterns affect captcha success, see **[Behavioral Fingerprinting](../../deep-dive/fingerprinting/behavioral-fingerprinting.md)**. This guide explains:
    
    - Mouse movement patterns and detection
    - Keystroke timing analysis
    - Scroll behavior physics
    - Event sequence analysis
    
    Understanding these concepts can help you build more realistic automation that achieves higher success rates.

## Troubleshooting

### Captcha Not Being Clicked

**Symptoms**: Captcha appears but is never clicked, page stays on challenge.

**Possible Causes:**

1. **Timing too short**: Captcha hasn't loaded yet when Pydoll tries to click
2. **Shadow root not found**: The Cloudflare Turnstile shadow root hasn't appeared in the DOM yet

**Solutions:**

```python
async def troubleshooting_example():
    async with Chrome() as browser:
        tab = await browser.start()

        # Increase the wait time
        async with tab.expect_and_bypass_cloudflare_captcha(
            time_to_wait_captcha=15  # More time to find captcha
        ):
            await tab.go_to('https://problematic-site.com')

asyncio.run(troubleshooting_example())
```

### Captcha Clicked but Shows Challenge

**Symptoms**: Checkbox shows checkmark briefly, then presents an image/puzzle challenge.

**Root Cause**: Your environment's trust score is too low.

**Solutions:**

- Use residential proxies with good reputation
- Configure realistic browser fingerprint
- Add more realistic behavioral patterns (scrolling, mouse movement, delays)
- **Note**: Pydoll cannot solve the challenge itself. If you need automated captcha solving, consider integrating with **[CapSolver](https://dashboard.capsolver.com/passport/register?inviteCode=WPhTbOsbXEpc)**

### "Access Denied" or Immediate Block

**Symptoms**: Site immediately shows "Access Denied" or blocks you without showing captcha.

**Root Cause**: **Your IP address is flagged.**

**Solutions:**

- Use a different residential proxy with good reputation
- Rotate IPs between requests
- Test your IP at `https://www.cloudflare.com/cdn-cgi/trace`
- **Note**: No amount of browser configuration will fix a flagged IP

### Works Locally but Fails in Docker/CI

**Symptoms**: Captcha interaction works on your machine but fails in Docker/CI environments.

**Root Cause**: Datacenter IPs are heavily scrutinized by captcha systems.

**Solutions:**

1. **Run Chrome in headed mode on a virtual display (Xvfb)** (for full rendering):
   ```dockerfile
   FROM python:3.11-slim
   
   RUN apt-get update && apt-get install -y \
       chromium \
       chromium-driver \
       xvfb \
       && rm -rf /var/lib/apt/lists/*
   
   ENV DISPLAY=:99
   
   CMD Xvfb :99 -screen 0 1920x1080x24 & python your_script.py
   ```

2. **Use a residential proxy** even in CI/CD:
   ```python
   options = ChromiumOptions()
   options.add_argument('--proxy-server=http://user:pass@residential-proxy.com:8080')
   ```

## Best Practices

1. **Use residential proxies**: IP reputation is the most critical factor
2. **Configure stealth options**: Remove automation indicators
3. **Add behavioral patterns**: Scroll, wait, move mouse before clicking
4. **Adjust timing**: Give captcha time to load before attempting click
5. **Handle failures gracefully**: Have fallback logic when captcha cannot be passed
6. **Test your environment**: Verify IP reputation and browser fingerprint before automation

## Ethical Guidelines

!!! danger "Terms of Service and Legal Compliance"
    Interacting with captchas may violate a website's Terms of Service even if technically possible. **Always check and respect ToS** before automating any website.
    
    This feature is provided for **legitimate automation purposes only**:
    
    **Appropriate use cases:**
    - Automated testing of your own applications
    - Monitoring services you have permission to monitor
    - Research and security analysis with proper authorization
    
    **Inappropriate use cases:**
    - Scraping content you don't have permission to access
    - Circumventing paywalls or subscription systems
    - Denial-of-service attacks or aggressive scraping
    - Any activity that violates Terms of Service

## See Also

- **[Browser Options](../configuration/browser-options.md)** - Stealth configuration
- **[Browser Preferences](../configuration/browser-preferences.md)** - Advanced fingerprinting
- **[Proxy Configuration](../configuration/proxy.md)** - Setting up proxies
- **[Behavioral Fingerprinting](../../deep-dive/fingerprinting/behavioral-fingerprinting.md)** - Understanding behavioral detection
- **[Human-Like Interactions](../automation/human-interactions.md)** - Realistic behavior patterns

---

**Remember**: Pydoll provides the mechanism to click on captchas, but your environment (IP, fingerprint, behavior) determines success. This is not a magic solution, it's a tool that works when used in the right environment with proper configuration. For challenges that require image recognition or puzzle solving, consider using **[CapSolver](https://dashboard.capsolver.com/passport/register?inviteCode=WPhTbOsbXEpc)** — use code **PYDOLL** for an extra 6% balance bonus.


================================================
FILE: docs/en/features/advanced/decorators.md
================================================
# Retry Decorator

Web scraping is inherently unpredictable. Networks fail, pages load slowly, elements appear and disappear, rate limits kick in, and CAPTCHAs show up unexpectedly. The `@retry` decorator provides a robust, battle-tested solution for handling these inevitable failures gracefully.

## Why Use the Retry Decorator?

In production scraping, failures aren't exceptions, they're the norm. Instead of letting your entire scraping job crash because of a temporary network hiccup or a missing element, the retry decorator allows you to:

- **Recover automatically** from transient failures
- **Implement sophisticated retry strategies** with exponential backoff
- **Execute recovery logic** before retrying (refresh page, switch proxy, restart browser)
- **Keep your business logic clean** without polluting it with error handling code

## Quick Start

```python
import asyncio
from pydoll.browser.chromium import Chrome
from pydoll.decorators import retry
from pydoll.exceptions import WaitElementTimeout, NetworkError

@retry(max_retries=3, exceptions=[WaitElementTimeout, NetworkError])
async def scrape_product_page(url: str):
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to(url)
        
        # This might fail due to network issues or slow loading
        product_title = await tab.find(class_name='product-title', timeout=5)
        return await product_title.text

asyncio.run(scrape_product_page('https://example.com/product/123'))
```

If `scrape_product_page` fails with a `WaitElementTimeout` or `NetworkError`, it will automatically retry up to 3 times before giving up.

## Best Practice: Always Specify Exceptions

!!! warning "Critical Best Practice"
    **ALWAYS** specify which exceptions should trigger a retry. Using the default `exceptions=Exception` will catch **everything**, including bugs in your code that should fail immediately.

**Bad (catches everything, including bugs):**

```python
@retry(max_retries=3)  # DON'T DO THIS
async def scrape_data():
    data = response['items'][0]  # If 'items' doesn't exist, retries won't help!
    return data
```

**Good (only retries on expected failures):**

```python
from pydoll.exceptions import ElementNotFound, WaitElementTimeout, NetworkError

@retry(
    max_retries=3,
    exceptions=[ElementNotFound, WaitElementTimeout, NetworkError]
)
async def scrape_data():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com')
        return await tab.find(id='data-container', timeout=10)
```

By specifying exceptions, you ensure that:

- **Logic errors fail fast** (typos, wrong selectors, code bugs)
- **Only recoverable errors are retried** (network issues, timeouts, missing elements)
- **Debugging is easier** (you know exactly what went wrong)

## Parameters

### max_retries

Maximum number of retry attempts before giving up.

```python
from pydoll.exceptions import WaitElementTimeout

@retry(max_retries=5, exceptions=[WaitElementTimeout])
async def fetch_data():
    # Will try up to 5 times total
    pass
```

### exceptions

Exception types that should trigger a retry. Can be a single exception or a list.

```python
from pydoll.exceptions import (
    ElementNotFound,
    WaitElementTimeout,
    NetworkError,
    ElementNotInteractable
)

# Single exception
@retry(exceptions=[WaitElementTimeout])
async def example1():
    pass

# Multiple exceptions
@retry(exceptions=[WaitElementTimeout, NetworkError, ElementNotFound, ElementNotInteractable])
async def example2():
    pass
```

!!! tip "Common Scraping Exceptions"
    For web scraping with Pydoll, you'll typically want to retry on:

    - `WaitElementTimeout` - Timeout waiting for element to appear
    - `ElementNotFound` - Element doesn't exist in DOM
    - `ElementNotVisible` - Element exists but is not visible
    - `ElementNotInteractable` - Element cannot receive interaction
    - `NetworkError` - Network connectivity issues
    - `ConnectionFailed` - Failed to connect to browser
    - `PageLoadTimeout` - Page load timed out
    - `ClickIntercepted` - Click was intercepted by another element

### delay

Time to wait between retry attempts (in seconds).

```python
from pydoll.exceptions import WaitElementTimeout

@retry(max_retries=3, exceptions=[WaitElementTimeout], delay=2.0)
async def scrape_with_delay():
    # Waits 2 seconds between each retry
    pass
```

### exponential_backoff

When `True`, increases the delay exponentially with each retry attempt.

```python
from pydoll.exceptions import NetworkError

@retry(
    max_retries=5,
    exceptions=[NetworkError],
    delay=1.0,
    exponential_backoff=True
)
async def scrape_with_backoff():
    # Attempt 1: fails → wait 1 second
    # Attempt 2: fails → wait 2 seconds
    # Attempt 3: fails → wait 4 seconds
    # Attempt 4: fails → wait 8 seconds
    # Attempt 5: fails → raise exception
    pass
```

**What is Exponential Backoff?**

Exponential backoff is a retry strategy where the wait time between attempts increases exponentially. Instead of hammering a server with requests every second, you give it progressively more time to recover:

- **After attempt 1 fails**: Wait `delay` seconds (e.g., 1s)
- **After attempt 2 fails**: Wait `delay * 2` seconds (e.g., 2s)
- **After attempt 3 fails**: Wait `delay * 4` seconds (e.g., 4s)
- **After attempt 4 fails**: Wait `delay * 8` seconds (e.g., 8s)

This is especially useful when:

- Dealing with **rate limits** (give the server time to reset)
- Handling **temporary server overload** (don't make it worse)
- Waiting for **slow-loading dynamic content**
- Avoiding **detection as a bot** (natural-looking retry patterns)

### on_retry

A callback function executed after each failed attempt, before the next retry. Must be an **async function**.

```python
from pydoll.exceptions import WaitElementTimeout

@retry(
    max_retries=3,
    exceptions=[WaitElementTimeout],
    on_retry=my_recovery_function
)
async def scrape_data():
    pass
```

The callback can be:

- **A standalone async function**
- **An instance method of the same class** (receives `self` automatically)

## The on_retry Callback: Your Recovery Mechanism

The `on_retry` callback is where the real magic happens. This is your opportunity to **restore the application state** before the next retry attempt.

### Standalone Function

```python
import asyncio
from pydoll.decorators import retry
from pydoll.exceptions import WaitElementTimeout

async def log_retry():
    print("Retry attempt failed, waiting before next attempt...")
    await asyncio.sleep(1)

@retry(max_retries=3, exceptions=[WaitElementTimeout], on_retry=log_retry)
async def scrape_page():
    # Your scraping logic
    pass
```

### Class Method

When using the decorator inside a class, the callback can be an instance method of that class. It will automatically receive `self` as the first argument.

```python
import asyncio
from pydoll.decorators import retry
from pydoll.exceptions import WaitElementTimeout

class DataCollector:
    def __init__(self):
        self.retry_count = 0
    
    # IMPORTANT: Define callback BEFORE the decorated method
    async def log_retry(self):
        self.retry_count += 1
        print(f"Attempt {self.retry_count} failed, retrying...")
        await asyncio.sleep(1)
    
    @retry(
        max_retries=3,
        exceptions=[WaitElementTimeout],
        on_retry=log_retry  # No 'self.' prefix needed
    )
    async def fetch_data(self):
        # Your scraping logic here
        pass
```

!!! warning "Method Definition Order Matters"
    When using `on_retry` with class methods, **you must define the callback method BEFORE the decorated method** in your class definition. Python needs to know about the callback when the decorator is applied.

    **Wrong (will fail):**

    ```python
    class Scraper:
        @retry(on_retry=handle_retry)  # handle_retry doesn't exist yet!
        async def scrape(self):
            pass
        
        async def handle_retry(self):  # Defined too late
            pass
    ```

    **Correct:**

    ```python
    class Scraper:
        async def handle_retry(self):  # Defined first
            pass
        
        @retry(on_retry=handle_retry)  # Now it exists
        async def scrape(self):
            pass
    ```

## Real-World Use Cases

### 1. Page Refresh and State Recovery

**This is the most powerful use of `on_retry`**: recovering from failures by refreshing the page and restoring your application state. This example demonstrates why the retry decorator is so valuable for production scraping.

```python
from pydoll.browser.chromium import Chrome
from pydoll.decorators import retry
from pydoll.exceptions import ElementNotFound, WaitElementTimeout
from pydoll.constants import Key
import asyncio

class DataScraper:
    def __init__(self):
        self.browser = None
        self.tab = None
        self.current_page = 1
    
    async def recover_from_failure(self):
        """Refresh page and restore state before retry"""
        print(f"Recovering... refreshing page {self.current_page}")
        
        if self.tab:
            # Refresh the page to recover from stale elements or bad state
            await self.tab.refresh()
            await asyncio.sleep(2)  # Wait for page to load
            
            # Restore state: navigate back to the correct page
            if self.current_page > 1:
                page_input = await self.tab.find(id='page-number')
                await page_input.insert_text(str(self.current_page))
                await self.tab.keyboard.press(Key.ENTER)
                await asyncio.sleep(1)
    
    @retry(
        max_retries=3,
        exceptions=[ElementNotFound, WaitElementTimeout],
        on_retry=recover_from_failure,
        delay=1.0
    )
    async def scrape_page_data(self):
        """Scrape data from the current page"""
        if not self.browser:
            self.browser = Chrome()
            self.tab = await self.browser.start()
            await self.tab.go_to('https://example.com/data')
        
        # Navigate to specific page
        page_input = await self.tab.find(id='page-number')
        await page_input.insert_text(str(self.current_page))
        await self.tab.keyboard.press(Key.ENTER)
        await asyncio.sleep(1)
        
        # Scrape data (might fail if elements become stale)
        items = await self.tab.find(class_name='data-item', find_all=True)
        return [await item.text for item in items]
    
    async def scrape_multiple_pages(self, start_page: int, end_page: int):
        """Scrape multiple pages with automatic retry on failures"""
        results = []
        for page_num in range(start_page, end_page + 1):
            self.current_page = page_num
            data = await self.scrape_page_data()
            results.extend(data)
        return results

# Usage
async def main():
    scraper = DataScraper()
    try:
        # Scrape pages 1-10 with automatic recovery on failures
        all_data = await scraper.scrape_multiple_pages(1, 10)
        print(f"Scraped {len(all_data)} items")
    finally:
        if scraper.browser:
            await scraper.browser.stop()
```

**What makes this powerful:**

- `recover_from_failure()` actually **restores the state** by refreshing and navigating back
- The `scrape_page_data()` method stays clean, focused only on scraping logic
- If elements become stale or disappear, the retry mechanism handles recovery automatically
- The browser persists across retries via `self.browser` and `self.tab`

### 2. Modal Dialog Recovery

Sometimes a modal or overlay appears unexpectedly and blocks your automation. Close it and retry.

```python
import asyncio
from pydoll.browser.chromium import Chrome
from pydoll.decorators import retry
from pydoll.exceptions import ElementNotFound

class ModalAwareScraper:
    def __init__(self):
        self.tab = None
    
    async def close_modals(self):
        """Close any blocking modals before retry"""
        print("Checking for blocking modals...")
        
        # Try to find and close common modals
        modal_close = await self.tab.find(
            class_name='modal-close',
            timeout=2,
            raise_exc=False
        )
        if modal_close:
            print("Found modal, closing it...")
            await modal_close.click()
            await asyncio.sleep(0.5)
    
    @retry(
        max_retries=3,
        exceptions=[ElementNotFound],
        on_retry=close_modals,
        delay=0.5
    )
    async def click_button(self, button_id: str):
        button = await self.tab.find(id=button_id)
        await button.click()
```

### 3. Browser Restart and Proxy Rotation

For heavy scraping jobs, you might need to completely restart the browser and switch proxies after failures.

```python
import asyncio
from pydoll.browser.chromium import Chrome
from pydoll.browser.options import ChromiumOptions
from pydoll.decorators import retry
from pydoll.exceptions import NetworkError, PageLoadTimeout

class RobustScraper:
    def __init__(self):
        self.browser = None
        self.tab = None
        self.proxy_list = [
            'proxy1.example.com:8080',
            'proxy2.example.com:8080',
            'proxy3.example.com:8080',
        ]
        self.current_proxy_index = 0
    
    async def restart_with_new_proxy(self):
        """Restart browser with a different proxy"""
        print("Restarting browser with new proxy...")
        
        # Close current browser
        if self.browser:
            await self.browser.stop()
            await asyncio.sleep(2)
        
        # Rotate to next proxy
        self.current_proxy_index = (self.current_proxy_index + 1) % len(self.proxy_list)
        proxy = self.proxy_list[self.current_proxy_index]
        
        print(f"Using proxy: {proxy}")
        
        # Start new browser with new proxy
        options = ChromiumOptions()
        options.add_argument(f'--proxy-server={proxy}')
        
        self.browser = Chrome(options=options)
        self.tab = await self.browser.start()
    
    @retry(
        max_retries=3,
        exceptions=[NetworkError, PageLoadTimeout],
        on_retry=restart_with_new_proxy,
        delay=5.0,
        exponential_backoff=True
    )
    async def scrape_protected_site(self, url: str):
        if not self.browser:
            await self.restart_with_new_proxy()
        
        await self.tab.go_to(url)
        await asyncio.sleep(3)
        
        # Your scraping logic here
        content = await self.tab.find(id='content')
        return await content.text
```

### 4. Network Idle Detection with Retry

Wait for all network activity to complete, with retry logic if the page never stabilizes.

```python
import asyncio
from pydoll.browser.chromium import Chrome
from pydoll.decorators import retry
from pydoll.exceptions import TimeoutException

class NetworkAwareScraper:
    def __init__(self):
        self.tab = None
    
    async def reload_page(self):
        """Reload page if network never stabilized"""
        print("Page didn't stabilize, reloading...")
        if self.tab:
            await self.tab.refresh()
            await asyncio.sleep(2)
    
    @retry(
        max_retries=2,
        exceptions=[TimeoutException],
        on_retry=reload_page,
        delay=3.0
    )
    async def wait_for_page_ready(self):
        """Wait for all network requests to complete"""
        await self.tab.enable_network_events()
        
        # Poll until the network is idle, giving up after max_wait seconds
        waited = 0
        max_wait = 10
        network_idle = False

        while waited < max_wait:
            # Check if any requests are in flight and set network_idle
            # accordingly (implementation depends on your event tracking)
            if network_idle:
                return
            await asyncio.sleep(0.5)
            waited += 0.5

        raise TimeoutException("Network never stabilized")
```

### 5. CAPTCHA Detection and Recovery

Detect when a CAPTCHA appears and take appropriate action.

```python
import asyncio
from pydoll.browser.chromium import Chrome
from pydoll.decorators import retry
from pydoll.exceptions import ElementNotFound

class CaptchaScraper:
    def __init__(self):
        self.tab = None
        self.captcha_count = 0
    
    async def handle_captcha(self):
        """Handle CAPTCHA by waiting or switching strategy"""
        self.captcha_count += 1
        print(f"CAPTCHA detected (count: {self.captcha_count})")
        
        if self.captcha_count > 2:
            print("Too many CAPTCHAs, might need to change strategy...")
            # Could switch to a different approach here
        
        # Wait longer between attempts
        await asyncio.sleep(30)
        
        # Refresh the page
        await self.tab.refresh()
        await asyncio.sleep(5)
    
    @retry(
        max_retries=3,
        exceptions=[ElementNotFound],
        on_retry=handle_captcha,
        delay=10.0,
        exponential_backoff=True
    )
    async def scrape_protected_content(self, url: str):
        if not self.tab:
            browser = Chrome()
            self.tab = await browser.start()
        
        await self.tab.go_to(url)
        
        # Check for CAPTCHA
        captcha = await self.tab.find(
            class_name='g-recaptcha',
            timeout=2,
            raise_exc=False
        )
        
        if captcha:
            raise ElementNotFound("CAPTCHA detected")
        
        # Normal scraping logic
        content = await self.tab.find(class_name='article-content')
        return await content.text
```

## Advanced Patterns

### Combining Multiple Recovery Strategies

```python
import asyncio
from pydoll.browser.chromium import Chrome
from pydoll.decorators import retry
from pydoll.exceptions import ElementNotFound, WaitElementTimeout, NetworkError

class AdvancedScraper:
    def __init__(self):
        self.tab = None
        self.attempt = 0
        self.strategies = [
            self.strategy_refresh,
            self.strategy_clear_cache,
            self.strategy_restart_browser,
        ]
    
    async def strategy_refresh(self):
        """Strategy 1: Simple refresh"""
        print("Strategy 1: Refreshing page")
        await self.tab.refresh()
        await asyncio.sleep(2)
    
    async def strategy_clear_cache(self):
        """Strategy 2: Clear cache and refresh"""
        print("Strategy 2: Clearing cache")
        await self.tab.execute_command('Network.clearBrowserCache')
        await self.tab.refresh()
        await asyncio.sleep(3)
    
    async def strategy_restart_browser(self):
        """Strategy 3: Full browser restart"""
        print("Strategy 3: Restarting browser")
        if self.tab:
            await self.tab._browser.stop()
        
        browser = Chrome()
        self.tab = await browser.start()
    
    async def adaptive_recovery(self):
        """Try different recovery strategies based on attempt number"""
        strategy_index = min(self.attempt, len(self.strategies) - 1)
        strategy = self.strategies[strategy_index]
        
        print(f"Attempt {self.attempt + 1}: Using {strategy.__name__}")
        await strategy()
        
        self.attempt += 1
    
    @retry(
        max_retries=3,
        exceptions=[ElementNotFound, WaitElementTimeout, NetworkError],
        on_retry=adaptive_recovery,
        delay=2.0
    )
    async def scrape_with_adaptive_retry(self, url: str):
        await self.tab.go_to(url)
        return await self.tab.find(id='target-content')
```

### Custom Exception for Specific Failure

```python
import asyncio
from pydoll.decorators import retry
from pydoll.exceptions import PydollException

class RateLimitError(PydollException):
    """Raised when rate limit is detected"""
    message = "API rate limit exceeded"

class APIScraper:
    """Fetch JSON from an API through the browser, backing off when rate limited."""

    def __init__(self, tab=None):
        # Tab whose browser context is used for the requests below.
        # It must be assigned before fetch_api_data() is called.
        self.tab = tab

    async def wait_for_rate_limit_reset(self):
        """Wait longer when rate limited"""
        print("Rate limit detected, waiting 60 seconds...")
        await asyncio.sleep(60)

    @retry(
        max_retries=5,
        exceptions=[RateLimitError],
        on_retry=wait_for_rate_limit_reset,
        delay=10.0,
        exponential_backoff=True
    )
    async def fetch_api_data(self, endpoint: str):
        """Request `endpoint` and return its parsed JSON body.

        Raises:
            RateLimitError: when the server answers 429, which triggers the
                retry decorator above.
        """
        response = await self.tab.request.get(endpoint)

        # The response object exposes the HTTP status as `status_code`
        if response.status_code == 429:  # Too Many Requests
            raise RateLimitError("API rate limit exceeded")

        return response.json()
```

## Best Practices Summary

1. **Always specify exceptions explicitly** - Never use the default `exceptions=Exception`
2. **Use exponential backoff for external services** - Give servers time to recover
3. **Keep retry counts reasonable** - Usually 3-5 attempts is enough
4. **Log retry attempts** - Use `on_retry` to log what's happening
5. **Define callbacks before decorated methods** - Order matters in class definitions
6. **Make callbacks async** - The decorator requires async callbacks
7. **Restore state in callbacks** - Use `on_retry` to navigate back to where you were
8. **Consider the cost of retries** - Each retry consumes time and resources
9. **Combine with other error handling** - Retries don't replace try/except blocks
10. **Test your retry logic** - Ensure recovery callbacks actually work

## Learn More

- **[Exception Handling](../core-concepts.md#error-handling)** - Understanding Pydoll exceptions
- **[Network Events](../network/monitoring.md)** - Track and handle network failures
- **[Browser Options](../configuration/browser-options.md)** - Configure proxies and other settings
- **[Event System](event-system.md)** - Build reactive retry strategies

The retry decorator is a powerful tool that turns fragile scraping scripts into production-ready applications. By combining it with thoughtful recovery strategies, you can build scrapers that gracefully handle the chaos of the real web.


================================================
FILE: docs/en/features/advanced/event-system.md
================================================
# Event System

Pydoll's event system allows you to listen and react to browser activities in real-time. This is essential for building dynamic automation, monitoring network requests, detecting page changes, and creating reactive workflows.

!!! info "Deep Dive Available"
    This guide focuses on practical usage. For architectural details and internal implementation, see [Event Architecture Deep Dive](../../deep-dive/event-architecture.md).

## Prerequisites

Before working with events, you need to enable the corresponding CDP domain:

```python
from pydoll.browser.chromium import Chrome

async with Chrome() as browser:
    tab = await browser.start()
    
    # Enable the domain before listening to events
    await tab.enable_page_events()     # For page lifecycle events
    await tab.enable_network_events()  # For network activity
    await tab.enable_dom_events()      # For DOM changes
```

!!! warning "Events Won't Fire Without Enabling"
    If you register a callback but forget to enable the domain, your callback will never be triggered. Always enable the domain first!

## Basic Event Listening

The `on()` method registers event listeners:

```python
from pydoll.protocol.page.events import PageEvent, LoadEventFiredEvent

async def handle_page_load(event: LoadEventFiredEvent):
    print(f"Page loaded at {event['params']['timestamp']}")

# Register the callback
await tab.enable_page_events()
callback_id = await tab.on(PageEvent.LOAD_EVENT_FIRED, handle_page_load)
```

### Event Structure

All events follow the same structure:

```python
{
    'method': 'Page.loadEventFired',  # Event name
    'params': {                        # Event-specific data
        'timestamp': 123456.789
    }
}
```

Access event data through `event['params']`:

```python
from pydoll.protocol.network.events import RequestWillBeSentEvent

async def handle_request(event: RequestWillBeSentEvent):
    url = event['params']['request']['url']
    method = event['params']['request']['method']
    print(f"{method} {url}")
```

### Using Type Hints for Better IDE Support

Use type hints with event parameter types to get autocomplete for event keys:

```python
from pydoll.protocol.network.events import NetworkEvent, RequestWillBeSentEvent
from pydoll.protocol.page.events import PageEvent, LoadEventFiredEvent

# With type hints - IDE knows all available keys!
async def handle_request(event: RequestWillBeSentEvent):
    # IDE will autocomplete 'params', 'request', 'url', etc.
    url = event['params']['request']['url']
    method = event['params']['request']['method']
    timestamp = event['params']['timestamp']
    print(f"{method} {url} at {timestamp}")

async def handle_load(event: LoadEventFiredEvent):
    # IDE knows this event has 'timestamp' in params
    timestamp = event['params']['timestamp']
    print(f"Page loaded at {timestamp}")

await tab.enable_network_events()
await tab.on(NetworkEvent.REQUEST_WILL_BE_SENT, handle_request)

await tab.enable_page_events()
await tab.on(PageEvent.LOAD_EVENT_FIRED, handle_load)
```

!!! tip "Type Hints for Event Parameters"
    All event types are defined in `pydoll.protocol.<domain>.events`. Using them gives you:
    
    - **Autocomplete**: IDE suggests available keys in `event['params']`
    - **Type safety**: Catch typos before running code
    - **Documentation**: See what data each event provides
    
    Event types follow the pattern: `<EventName>Event` (e.g., `RequestWillBeSentEvent`, `ResponseReceivedEvent`)

## Common Event Domains

### Page Events

Monitor page lifecycle and dialogs:

```python
from pydoll.protocol.page.events import PageEvent, JavascriptDialogOpeningEvent

await tab.enable_page_events()

# Page loaded
await tab.on(PageEvent.LOAD_EVENT_FIRED, lambda e: print("Page loaded!"))

# DOM ready
await tab.on(PageEvent.DOM_CONTENT_EVENT_FIRED, lambda e: print("DOM ready!"))

# JavaScript dialog
async def handle_dialog(event: JavascriptDialogOpeningEvent):
    message = event['params']['message']
    dialog_type = event['params']['type']
    print(f"Dialog ({dialog_type}): {message}")
    
    # Handle it automatically
    if await tab.has_dialog():
        await tab.handle_dialog(accept=True)

await tab.on(PageEvent.JAVASCRIPT_DIALOG_OPENING, handle_dialog)
```

### Network Events

Monitor requests and responses:

```python
from pydoll.protocol.network.events import (
    NetworkEvent,
    RequestWillBeSentEvent,
    ResponseReceivedEvent,
    LoadingFailedEvent
)

await tab.enable_network_events()

# Track requests
async def log_request(event: RequestWillBeSentEvent):
    request = event['params']['request']
    print(f"→ {request['method']} {request['url']}")

await tab.on(NetworkEvent.REQUEST_WILL_BE_SENT, log_request)

# Track responses
async def log_response(event: ResponseReceivedEvent):
    response = event['params']['response']
    print(f"← {response['status']} {response['url']}")

await tab.on(NetworkEvent.RESPONSE_RECEIVED, log_response)

# Track failures
async def log_failure(event: LoadingFailedEvent):
    # Network.loadingFailed carries no URL: 'type' is the resource type
    # (Document, Script, XHR, ...). Use 'requestId' to correlate the failure
    # with the URL seen in the matching requestWillBeSent event.
    resource_type = event['params']['type']
    error = event['params']['errorText']
    print(f"[FAILED] {resource_type} - {error}")

await tab.on(NetworkEvent.LOADING_FAILED, log_failure)
```

### DOM Events

React to DOM changes:

```python
from pydoll.protocol.dom.events import DomEvent, AttributeModifiedEvent

await tab.enable_dom_events()

# Track attribute changes
async def on_attribute_change(event: AttributeModifiedEvent):
    node_id = event['params']['nodeId']
    attr_name = event['params']['name']
    attr_value = event['params']['value']
    print(f"Node {node_id}: {attr_name}={attr_value}")

await tab.on(DomEvent.ATTRIBUTE_MODIFIED, on_attribute_change)

# Track document updates
await tab.on(DomEvent.DOCUMENT_UPDATED, lambda e: print("Document updated!"))
```

## Temporary Callbacks

Use `temporary=True` for one-time listeners:

```python
from pydoll.protocol.page.events import PageEvent

# This will only fire once and then auto-remove
await tab.on(
    PageEvent.LOAD_EVENT_FIRED,
    lambda e: print("First load!"),
    temporary=True
)

await tab.go_to("https://example.com")  # Fires callback
await tab.refresh()                      # Callback won't fire again
```

!!! tip "Perfect for One-Time Setup"
    Temporary callbacks are ideal for initialization tasks that should only happen once.

## Accessing Tab in Callbacks

Use `functools.partial` to pass the tab to your callbacks:

```python
from functools import partial
from pydoll.protocol.network.events import NetworkEvent, ResponseReceivedEvent

async def process_response(tab, event: ResponseReceivedEvent):
    # Now we can use the tab object!
    request_id = event['params']['requestId']
    
    # Get response body
    body = await tab.get_network_response_body(request_id)
    print(f"Response body: {body[:100]}...")

await tab.enable_network_events()
await tab.on(
    NetworkEvent.RESPONSE_RECEIVED,
    partial(process_response, tab)
)
```

!!! info "Why Use Partial?"
    The event system only passes the event data to callbacks. `partial` lets you bind additional parameters like the tab instance.

## Managing Callbacks

### Removing Callbacks

```python
from pydoll.protocol.page.events import PageEvent

# Save the callback ID
callback_id = await tab.on(PageEvent.LOAD_EVENT_FIRED, my_callback)

# Remove it later
await tab.remove_callback(callback_id)
```

### Clearing All Callbacks

```python
# Remove all registered callbacks for this tab
await tab.clear_callbacks()
```

## Practical Examples

### Monitor API Calls

```python
import asyncio
from functools import partial
from pydoll.protocol.network.events import NetworkEvent, ResponseReceivedEvent

async def monitor_api_calls(tab):
    collected_data = []
    
    # Type hint helps IDE autocomplete event keys
    async def capture_api_response(tab, data_list, event: ResponseReceivedEvent):
        url = event['params']['response']['url']
        
        # Filter only API calls
        if '/api/' not in url:
            return
        
        request_id = event['params']['requestId']
        body = await tab.get_network_response_body(request_id)
        
        data_list.append({
            'url': url,
            'body': body,
            'status': event['params']['response']['status']
        })
        print(f"Captured API call: {url}")
    
    await tab.enable_network_events()
    await tab.on(
        NetworkEvent.RESPONSE_RECEIVED,
        partial(capture_api_response, tab, collected_data)
    )
    
    # Navigate and collect
    await tab.go_to("https://example.com")
    await asyncio.sleep(3)  # Wait for requests to complete
    
    return collected_data
```

### Wait for Specific Event

```python
import asyncio
from pydoll.protocol.page.events import PageEvent, FrameNavigatedEvent

async def wait_for_navigation():
    navigation_done = asyncio.Event()
    
    async def on_navigated(event: FrameNavigatedEvent):
        navigation_done.set()
    
    await tab.enable_page_events()
    await tab.on(PageEvent.FRAME_NAVIGATED, on_navigated, temporary=True)
    
    # Trigger navigation
    button = await tab.find(id='next-page')
    await button.click()
    
    # Wait for it to complete
    await navigation_done.wait()
    print("Navigation completed!")
```

### Network Idle Detection

```python
import asyncio
from pydoll.protocol.network.events import (
    NetworkEvent,
    RequestWillBeSentEvent,
    LoadingFinishedEvent,
    LoadingFailedEvent
)

async def wait_for_network_idle(tab, timeout=5):
    """Wait until no tracked request is in flight, or until `timeout` seconds pass.

    Args:
        tab: Tab to observe; its network events are enabled by this function.
        timeout: Maximum number of seconds to wait for the idle signal.

    The listeners registered here are always removed before returning.
    """
    in_flight = 0
    idle_event = asyncio.Event()

    async def on_request(event: RequestWillBeSentEvent):
        nonlocal in_flight
        in_flight += 1
        # New activity: the network is no longer idle
        idle_event.clear()

    async def on_finished(event: LoadingFinishedEvent | LoadingFailedEvent):
        nonlocal in_flight
        # A request that started before the listeners were registered still
        # reports completion here; clamp so the counter never goes negative
        # (a negative counter would prevent the idle signal from ever firing).
        in_flight = max(in_flight - 1, 0)

        if in_flight == 0:
            idle_event.set()

    await tab.enable_network_events()
    req_id = await tab.on(NetworkEvent.REQUEST_WILL_BE_SENT, on_request)
    fin_id = await tab.on(NetworkEvent.LOADING_FINISHED, on_finished)
    fail_id = await tab.on(NetworkEvent.LOADING_FAILED, on_finished)

    try:
        await asyncio.wait_for(idle_event.wait(), timeout=timeout)
        print("Network is idle!")
    except asyncio.TimeoutError:
        print(f"Network still active after {timeout}s")
    finally:
        # Cleanup
        await tab.remove_callback(req_id)
        await tab.remove_callback(fin_id)
        await tab.remove_callback(fail_id)
```

### Dynamic Content Scraping

```python
import asyncio
import json
from functools import partial
from pydoll.protocol.network.events import NetworkEvent, ResponseReceivedEvent

async def scrape_infinite_scroll(tab, max_items=100, max_idle_scrolls=5):
    """Collect items from a product API while scrolling an infinite-scroll page.

    Args:
        tab: Tab used for navigation and network monitoring.
        max_items: Stop once this many items have been collected.
        max_idle_scrolls: Stop after this many consecutive scrolls that
            produced no new items, so the loop ends when the site runs out
            of content before `max_items` is reached.

    Returns:
        A list with at most `max_items` collected items.
    """
    items = []

    async def capture_products(tab, items_list, event: ResponseReceivedEvent):
        url = event['params']['response']['url']

        # Look for product API endpoint
        if '/products' not in url:
            return

        request_id = event['params']['requestId']
        body = await tab.get_network_response_body(request_id)

        try:
            data = json.loads(body)
            if 'items' in data:
                items_list.extend(data['items'])
                print(f"Collected {len(data['items'])} items (total: {len(items_list)})")
        except json.JSONDecodeError:
            # Not a JSON payload; ignore it
            pass

    await tab.enable_network_events()
    await tab.on(
        NetworkEvent.RESPONSE_RECEIVED,
        partial(capture_products, tab, items)
    )

    await tab.go_to("https://example.com/products")

    # Scroll to trigger infinite loading
    idle_scrolls = 0
    while len(items) < max_items and idle_scrolls < max_idle_scrolls:
        count_before = len(items)
        await tab.execute_script("window.scrollTo(0, document.body.scrollHeight)")
        await asyncio.sleep(1)

        # Count consecutive scrolls that brought nothing new
        if len(items) == count_before:
            idle_scrolls += 1
        else:
            idle_scrolls = 0

    return items[:max_items]
```

## Event Reference Tables

### Available Domains

| Domain | Enable Method | Common Use Cases |
|--------|--------------|------------------|
| Page | `enable_page_events()` | Page lifecycle, navigation, dialogs |
| Network | `enable_network_events()` | Request/response monitoring, API tracking |
| DOM | `enable_dom_events()` | DOM structure changes, attribute modifications |
| Fetch | `enable_fetch_events()` | Request interception and modification |
| Runtime | `enable_runtime_events()` | Console messages, JavaScript exceptions |

### Key Page Events

| Event | When It Fires | Use Case |
|-------|---------------|----------|
| `LOAD_EVENT_FIRED` | Page load complete | Wait for full page load |
| `DOM_CONTENT_EVENT_FIRED` | DOM ready | Start DOM manipulation |
| `JAVASCRIPT_DIALOG_OPENING` | Alert/confirm/prompt | Auto-handle dialogs |
| `FRAME_NAVIGATED` | Navigation complete | Track SPA navigation |
| `FILE_CHOOSER_OPENED` | File input clicked | Automated file uploads |

### Key Network Events

| Event | When It Fires | Use Case |
|-------|---------------|----------|
| `REQUEST_WILL_BE_SENT` | Before request sent | Log outgoing requests (use Fetch events to modify them) |
| `RESPONSE_RECEIVED` | Response headers received | Capture API responses |
| `LOADING_FINISHED` | Response body loaded | Get full response data |
| `LOADING_FAILED` | Request failed | Track errors and retries |
| `WEB_SOCKET_CREATED` | WebSocket opened | Monitor real-time connections |

### Key DOM Events

| Event | When It Fires | Use Case |
|-------|---------------|----------|
| `DOCUMENT_UPDATED` | DOM rebuilt | Refresh element references |
| `ATTRIBUTE_MODIFIED` | Element attribute changed | Track dynamic attribute changes |
| `CHILD_NODE_INSERTED` | New element added | Detect dynamically added content |
| `CHILD_NODE_REMOVED` | Element removed | Detect removed content |

### Event Type Reference

All event types and their parameter structures are defined in the protocol modules:

| Domain | Import Path | Example Types |
|--------|-------------|---------------|
| Page | `pydoll.protocol.page.events` | `LoadEventFiredEvent`, `FrameNavigatedEvent`, `JavascriptDialogOpeningEvent` |
| Network | `pydoll.protocol.network.events` | `RequestWillBeSentEvent`, `ResponseReceivedEvent`, `LoadingFinishedEvent` |
| DOM | `pydoll.protocol.dom.events` | `DocumentUpdatedEvent`, `AttributeModifiedEvent`, `ChildNodeInsertedEvent` |
| Fetch | `pydoll.protocol.fetch.events` | `RequestPausedEvent`, `AuthRequiredEvent` |
| Runtime | `pydoll.protocol.runtime.events` | `ConsoleAPICalledEvent`, `ExceptionThrownEvent` |

Each event type is a `TypedDict` that defines the exact structure of the event, including all available keys in the `params` dictionary.

## Best Practices

### 1. Always Enable Domains First

```python
from pydoll.protocol.network.events import NetworkEvent

# Good
await tab.enable_network_events()
await tab.on(NetworkEvent.RESPONSE_RECEIVED, callback)

# Bad: events emitted before the domain is enabled are missed
await tab.on(NetworkEvent.RESPONSE_RECEIVED, callback)
await tab.enable_network_events()
```

### 2. Clean Up When Done

```python
from pydoll.protocol.network.events import NetworkEvent

# Enable for specific task
await tab.enable_network_events()
callback_id = await tab.on(NetworkEvent.REQUEST_WILL_BE_SENT, log_request)

# Do your work...
await tab.go_to("https://example.com")

# Clean up
await tab.remove_callback(callback_id)
await tab.disable_network_events()
```

### 3. Use Early Filtering

```python
from pydoll.protocol.network.events import RequestWillBeSentEvent

# Good: filter early
async def handle_api_request(event: RequestWillBeSentEvent):
    url = event['params']['request']['url']
    if '/api/' not in url:
        return  # Exit early
    
    # Process only API requests
    process_request(event)

# Bad: processes everything
async def handle_all_requests(event: RequestWillBeSentEvent):
    url = event['params']['request']['url']
    process_request(event)
    if '/api/' in url:
        do_extra_work(event)
```

### 4. Handle Errors Gracefully

```python
from pydoll.protocol.network.events import ResponseReceivedEvent

async def safe_callback(event: ResponseReceivedEvent):
    try:
        request_id = event['params']['requestId']
        body = await tab.get_network_response_body(request_id)
        process_body(body)
    except KeyError:
        # Event might not have requestId
        pass
    except Exception as e:
        print(f"Error in callback: {e}")
        # Continue without breaking event loop
```

## Performance Considerations

!!! warning "High-Frequency Events"
    DOM events can fire **very frequently** on dynamic pages. Use filtering and debouncing to avoid performance issues.

### Event Volume by Domain

| Domain | Event Frequency | Performance Impact |
|--------|----------------|-------------------|
| Page | Low | Minimal |
| Network | Moderate-High | Moderate |
| DOM | Very High | High |
| Fetch | Moderate | Moderate |

### Optimization Tips

1. **Enable only what you need**: Don't enable all domains at once
2. **Use temporary callbacks**: Auto-cleanup when possible
3. **Filter early**: Check conditions before expensive operations
4. **Disable when done**: Free up resources
5. **Avoid heavy processing**: Keep callbacks fast, offload work to separate tasks

```python
import asyncio
from pydoll.protocol.network.events import ResponseReceivedEvent

# Good: fast callback, offload heavy work
# The event loop only keeps weak references to tasks, so hold a strong
# reference until each task finishes or it may be garbage-collected mid-run.
background_tasks = set()

async def handle_response(event: ResponseReceivedEvent):
    if should_process(event):
        task = asyncio.create_task(heavy_processing(event))  # Don't block
        background_tasks.add(task)
        task.add_done_callback(background_tasks.discard)

# Bad: blocks event loop
async def handle_response(event: ResponseReceivedEvent):
    await heavy_processing(event)  # Blocks other events
```

## Common Patterns

### Context Manager for Events

```python
from contextlib import asynccontextmanager
from pydoll.protocol.network.events import NetworkEvent, RequestWillBeSentEvent

@asynccontextmanager
async def monitor_requests(tab):
    """Context manager to monitor requests during a block."""
    requests = []
    
    async def capture(event: RequestWillBeSentEvent):
        requests.append(event['params']['request'])
    
    await tab.enable_network_events()
    cb_id = await tab.on(NetworkEvent.REQUEST_WILL_BE_SENT, capture)
    
    try:
        yield requests
    finally:
        await tab.remove_callback(cb_id)
        await tab.disable_network_events()

# Usage
async with monitor_requests(tab) as requests:
    await tab.go_to("https://example.com")
    # All requests are captured

print(f"Captured {len(requests)} requests")
```

### Conditional Event Registration

```python
from pydoll.protocol.network.events import NetworkEvent
from pydoll.protocol.dom.events import DomEvent

async def setup_monitoring(tab, track_network=False, track_dom=False):
    """Enable only specified monitoring."""
    callbacks = []
    
    if track_network:
        await tab.enable_network_events()
        cb = await tab.on(NetworkEvent.REQUEST_WILL_BE_SENT, log_request)
        callbacks.append(('network', cb))
    
    if track_dom:
        await tab.enable_dom_events()
        cb = await tab.on(DomEvent.ATTRIBUTE_MODIFIED, log_dom_change)
        callbacks.append(('dom', cb))
    
    return callbacks
```

## Further Reading

- **[Event Architecture Deep Dive](../../deep-dive/event-architecture.md)** - Internal implementation and WebSocket communication
- **[Network Monitoring](../network/monitoring.md)** - Advanced network analysis techniques
- **[Reactive Automation](reactive-automation.md)** - Building event-driven workflows

!!! tip "Start Simple"
    Begin with Page events to understand the basics, then move to Network and DOM events as needed. The event system is powerful but can be overwhelming at first.


================================================
FILE: docs/en/features/advanced/remote-connections.md
================================================
# Remote Connections & Hybrid Automation

Pydoll allows you to connect to already-running browsers via WebSocket, enabling remote control and hybrid automation scenarios. This is perfect for CI/CD pipelines, containerized environments, debugging sessions, and integrating Pydoll with existing CDP tooling.

!!! info "Zero Setup Required"
    Unlike traditional automation that launches browsers, remote connections let you control browsers that are already running. No process management needed!

## Why Remote Connections?

Remote connections unlock powerful automation scenarios:

| Use Case | Benefit |
|----------|---------|
| **CI/CD Pipelines** | Connect to browser containers without managing processes |
| **Docker Environments** | Control browsers running in separate containers |
| **Remote Debugging** | Automate browsers on remote servers or VMs |
| **Hybrid Tooling** | Integrate Pydoll with your existing CDP infrastructure |
| **Development** | Attach to your local browser for quick testing |
| **Multi-Tool Automation** | Share browser sessions between different tools |

## Setting Up a Remote Browser Server

!!! tip "Already Have a Remote Browser Service?"
    If you're using a cloud browser service (BrowserStack, Selenium Grid, LambdaTest, etc.) or already have a Chrome instance running with a WebSocket URL, you can **skip this entire section** and jump directly to [Connection Methods](#connection-methods) to learn how to connect with Pydoll.

Before you can connect remotely, you need to start Chrome with debugging enabled and properly configured to accept external connections.

### Basic Server Setup (Linux)

Start Chrome with remote debugging on a server:

```bash
# Basic setup - only accessible from localhost
google-chrome \
  --remote-debugging-port=9222 \
  --headless=new \
  --no-sandbox \
  --disable-dev-shm-usage \
  --user-data-dir=/tmp/chrome-profile

# Server setup - accessible from other machines
google-chrome \
  --remote-debugging-port=9222 \
  --remote-debugging-address=0.0.0.0 \
  --headless=new \
  --no-sandbox \
  --disable-dev-shm-usage \
  --user-data-dir=/tmp/chrome-profile
```

!!! warning "Security Critical"
    Using `--remote-debugging-address=0.0.0.0` makes the debugging port accessible from **any network interface**. This is necessary for remote connections but creates a significant security risk if exposed to the internet.

### Recommended Server Configuration

```bash
# Production-ready configuration
google-chrome \
  --remote-debugging-port=9222 \
  --remote-debugging-address=0.0.0.0 \
  --headless=new \
  --no-sandbox \
  --disable-dev-shm-usage \
  --disable-gpu \
  --disable-software-rasterizer \
  --disable-extensions \
  --disable-background-networking \
  --disable-background-timer-throttling \
  --disable-client-side-phishing-detection \
  --disable-popup-blocking \
  --disable-prompt-on-repost \
  --disable-sync \
  --metrics-recording-only \
  --no-first-run \
  --safebrowsing-disable-auto-update \
  --user-data-dir=/tmp/chrome-remote-$(date +%s)
```

**Key flags explained:**

| Flag | Purpose |
|------|---------|
| `--remote-debugging-port=9222` | Enable CDP on port 9222 |
| `--remote-debugging-address=0.0.0.0` | Allow external connections (security risk!) |
| `--headless=new` | Run without GUI (server mode) |
| `--no-sandbox` | Required in Docker/containers (security tradeoff) |
| `--disable-dev-shm-usage` | Prevent /dev/shm memory issues in containers |
| `--disable-gpu` | No GPU acceleration (recommended for headless) |
| `--user-data-dir=/tmp/...` | Isolated profile per instance |

!!! warning "About --no-sandbox Flag"
    The `--no-sandbox` flag disables Chrome's security sandbox, which isolates the browser process from the system. This flag is **required** in most Docker/container environments due to kernel capability restrictions, but it comes with security implications:
    
    - **Risk**: Removes isolation between browser and system
    - **When to use**: Docker containers, restricted environments
    - **Mitigation**: Ensure container-level isolation (namespaces, cgroups) and avoid running as root
    
    Consider using `--no-sandbox` only when absolutely necessary and implement additional security layers at the container level.

### Docker Setup

Create a containerized Chrome server:

!!! tip "Using Pre-built Images"
    For production, consider using official pre-built images instead of building your own:
    
    - **Selenium Images**: `selenium/standalone-chrome` (includes WebDriver)
    - **Zenika Alpine Chrome**: `zenika/alpine-chrome` (lightweight, ~200MB)
    - **Browserless**: `browserless/chrome` (production-ready with monitoring)
    
    These images are regularly updated, security-tested, and optimized for container environments.

**Dockerfile (Custom Build):**
```dockerfile
FROM ubuntu:22.04

# Install Chrome
RUN apt-get update && apt-get install -y \
    wget \
    gnupg \
    ca-certificates \
    && wget -q -O - https://dl.google.com/linux/linux_signing_key.pub | apt-key add - \
    && echo "deb [arch=amd64] http://dl.google.com/linux/chrome/deb/ stable main" >> /etc/apt/sources.list.d/google.list \
    && apt-get update \
    && apt-get install -y google-chrome-stable \
    && rm -rf /var/lib/apt/lists/*

# Expose debugging port
EXPOSE 9222

# Start Chrome with remote debugging
CMD ["google-chrome", \
     "--remote-debugging-port=9222", \
     "--remote-debugging-address=0.0.0.0", \
     "--headless=new", \
     "--no-sandbox", \
     "--disable-dev-shm-usage", \
     "--disable-gpu", \
     "--user-data-dir=/tmp/chrome-profile"]
```

**docker-compose.yml:**
```yaml
services:
  chrome-server:
    build: .
    ports:
      - "127.0.0.1:9222:9222"
    
    # Uncomment the line below ONLY if you need remote access 
    # AND have secured the port with a firewall or proxy.
    # - "9222:9222"

    shm_size: '2gb'  # Critical: Chrome uses /dev/shm for shared memory
                      # Default Docker shm_size (64MB) is insufficient
    restart: unless-stopped
    environment:
      - DISPLAY=:99
    networks:
      - automation-network
    # Optional: Resource limits for production
    # deploy:
    #   resources:
    #     limits:
    #       cpus: '2'
    #       memory: 4G

  automation-client:
    image: python:3.11
    depends_on:
      - chrome-server
    volumes:
      - ./:/app
    working_dir: /app
    command: python automation_script.py
    environment:
      - CHROME_WS=ws://chrome-server:9222/devtools/browser
    networks:
      - automation-network

networks:
  automation-network:
    driver: bridge
```

**Usage:**
```bash
# Start the stack
docker-compose up -d

# Check Chrome is running
curl http://localhost:9222/json/version

# Connect from automation client (inside Docker network)
# ws://chrome-server:9222/devtools/browser/...
```

### Systemd Service (Linux Server)

Create a persistent Chrome service:

**/etc/systemd/system/chrome-remote.service:**
```ini
[Unit]
Description=Chrome Remote Debugging Server
After=network.target

[Service]
Type=simple
User=chrome-user
Group=chrome-user
Environment="DISPLAY=:99"
ExecStart=/usr/bin/google-chrome \
    --remote-debugging-port=9222 \
    --remote-debugging-address=0.0.0.0 \
    --headless=new \
    --no-sandbox \
    --disable-dev-shm-usage \
    --disable-gpu \
    --user-data-dir=/var/lib/chrome-remote
Restart=always
RestartSec=10

[Install]
WantedBy=multi-user.target
```

**Setup and management:**
```bash
# Create dedicated user
sudo useradd -r -s /bin/false chrome-user
sudo mkdir -p /var/lib/chrome-remote
sudo chown chrome-user:chrome-user /var/lib/chrome-remote

# Install and enable service
sudo systemctl daemon-reload
sudo systemctl enable chrome-remote
sudo systemctl start chrome-remote

# Check status
sudo systemctl status chrome-remote

# View logs
sudo journalctl -u chrome-remote -f

# Restart service
sudo systemctl restart chrome-remote
```

### Network Security Configuration

#### Firewall Rules (iptables)

```bash
# Allow only specific IPs to access port 9222
sudo iptables -A INPUT -p tcp --dport 9222 -s 192.168.1.100 -j ACCEPT
sudo iptables -A INPUT -p tcp --dport 9222 -j DROP

# Save rules
# The shell performs the redirect as the calling user, not as root,
# so write the file through `sudo tee` instead of `>`.
sudo iptables-save | sudo tee /etc/iptables/rules.v4 > /dev/null
```

#### Firewall Rules (ufw)

```bash
# ufw evaluates rules in the order they were added and stops at the first
# match, so the allow rules must come before the catch-all deny.

# Allow specific IP
sudo ufw allow from 192.168.1.100 to any port 9222

# Allow specific subnet
sudo ufw allow from 192.168.1.0/24 to any port 9222

# Deny all other access to port 9222
sudo ufw deny 9222

# Enable firewall
sudo ufw enable
```

#### Nginx Reverse Proxy (with Authentication)

Protect Chrome debugging with HTTP authentication:

**/etc/nginx/sites-available/chrome-remote:**
```nginx
server {
    listen 80;
    server_name chrome.example.com;

    # Basic authentication
    auth_basic "Chrome Remote Debugging";
    auth_basic_user_file /etc/nginx/.htpasswd;

    location / {
        proxy_pass http://localhost:9222;
        proxy_http_version 1.1;
        proxy_set_header Upgrade $http_upgrade;
        proxy_set_header Connection "upgrade";
        proxy_set_header Host $host;
        proxy_set_header X-Real-IP $remote_addr;
        proxy_set_header X-Forwarded-For $proxy_add_x_forwarded_for;
        proxy_read_timeout 86400;
    }
}
```

**Setup:**
```bash
# Create password file
sudo htpasswd -c /etc/nginx/.htpasswd admin

# Enable site
sudo ln -s /etc/nginx/sites-available/chrome-remote /etc/nginx/sites-enabled/
sudo nginx -t
sudo systemctl reload nginx

# Connect with authentication
# ws://admin:password@chrome.example.com/devtools/browser/...
```

### Connecting from Another Computer

Once your server is configured, connect from your client machine:

```python
import asyncio
import aiohttp
from pydoll.browser.chromium import Chrome

async def connect_to_remote_server():
    """Connect to Chrome running on a remote server."""
    # Server IP and port
    server_ip = "192.168.1.100"
    server_port = 9222

    async with aiohttp.ClientSession() as session:
        # 1. Query the server for browser info and its WebSocket URL
        url = f"http://{server_ip}:{server_port}/json/version"
        
        async with session.get(url) as response:
            data = await response.json()
            ws_url = data['webSocketDebuggerUrl']
            
            print(f"Server info:")
            print(f"  Browser: {data.get('Browser')}")
            print(f"  Protocol: {data.get('Protocol-Version')}")
            print(f"  WebSocket: {ws_url}")
    
    # 2. Connect to the browser
    chrome = Chrome()
    tab = await chrome.connect(ws_url)
    
    print(f"\n[SUCCESS] Connected to remote Chrome server!")
    
    # 3. Use normally
    await tab.go_to('https://example.com')
    title = await tab.execute_script('return document.title')
    print(f"Page title: {title}")
    
    # 4. Cleanup
    await chrome.close()

asyncio.run(connect_to_remote_server())
```

### Testing Your Server Setup

```bash
# 1. Check if Chrome is running
ps aux | grep chrome

# 2. Check if port is listening
netstat -tulpn | grep 9222
# Or
ss -tulpn | grep 9222

# 3. Test local access
curl http://localhost:9222/json/version

# 4. Test remote access (from client machine)
curl http://SERVER_IP:9222/json/version

# 5. Check WebSocket URL
curl http://SERVER_IP:9222/json/version | jq -r '.webSocketDebuggerUrl'

# 6. List all available targets (tabs/pages)
curl http://SERVER_IP:9222/json/list
```

### Multi-Instance Setup

Run multiple Chrome instances on different ports:

```bash
#!/bin/bash
# start-chrome-pool.sh

for port in 9222 9223 9224 9225; do
    google-chrome \
        --remote-debugging-port=$port \
        --remote-debugging-address=0.0.0.0 \
        --headless=new \
        --no-sandbox \
        --disable-dev-shm-usage \
        --user-data-dir=/tmp/chrome-$port &
    
    echo "Started Chrome on port $port"
done

echo "Chrome pool ready. Ports: 9222-9225"
```

**Python client with pool:**
```python
import asyncio
from pydoll.browser.chromium import Chrome
import aiohttp

async def connect_to_pool(server_ip: str, ports: list[int]):
    """Connect to multiple Chrome instances."""
    tasks = []
    
    for port in ports:
        task = connect_to_instance(server_ip, port)
        tasks.append(task)
    
    results = await asyncio.gather(*tasks)
    return results

async def connect_to_instance(server_ip: str, port: int):
    """Connect to a single Chrome instance."""
    # Get WebSocket URL
    async with aiohttp.ClientSession() as session:
        url = f"http://{server_ip}:{port}/json/version"
        async with session.get(url) as response:
            data = await response.json()
            ws_url = data['webSocketDebuggerUrl']
    
    # Connect
    chrome = Chrome()
    tab = await chrome.connect(ws_url)
    
    # Run automation
    await tab.go_to('https://example.com')
    title = await tab.execute_script('return document.title')
    
    print(f"Port {port}: {title}")
    
    await chrome.close()
    return title

# Usage
asyncio.run(connect_to_pool('192.168.1.100', [9222, 9223, 9224, 9225]))
```

## Connection Methods

Pydoll provides two approaches for remote connections, each suited for different scenarios.

### Method 1: Browser-Level Connection

Connect to a running browser using its WebSocket endpoint and get access to all opened tabs:

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def connect_to_remote_browser():
    chrome = Chrome()
    
    # Connect to remote browser via WebSocket
    tab = await chrome.connect('ws://localhost:9222/devtools/browser/XXXX')
    
    # The tab returned is the first available tab
    print(f"Connected to tab: {await tab.execute_script('return document.title')}")
    
    # You can get all other tabs too
    all_tabs = await chrome.get_opened_tabs()
    print(f"Total tabs available: {len(all_tabs)}")
    
    # Use the tab normally
    await tab.go_to('https://example.com')
    element = await tab.find(id='main-content')
    text = await element.text
    print(f"Content: {text}")
    
    # Cleanup
    await chrome.close()

asyncio.run(connect_to_remote_browser())
```

!!! tip "Getting the WebSocket URL"
    Start Chrome with debugging enabled:
    ```bash
    # Linux/Mac
    google-chrome --remote-debugging-port=9222
    
    # Windows
    "C:\Program Files\Google\Chrome\Application\chrome.exe" --remote-debugging-port=9222
    ```
    
    **For local connections** (same machine):
    
    - Visit `http://localhost:9222/json/version` in your browser to get the WebSocket URL in the `webSocketDebuggerUrl` field
    - Or query it programmatically with `aiohttp`, as shown in the "Connecting from Another Computer" example
    - For quick debugging, you can also check `browser._connection_port` after starting a local browser instance
    
    **For remote connections** (different machine):
    
    - Query `http://SERVER_IP:9222/json/version` from your client machine
    - Use the `webSocketDebuggerUrl` from the response, replacing `localhost` with the actual server IP if needed

### Method 2: Direct Element Control (Hybrid Approach)

If you already have your own CDP integration or low-level tooling, you can wrap existing elements with Pydoll's high-level API:

```python
import asyncio
import json
from pydoll.connection.connection_handler import ConnectionHandler
from pydoll.elements.web_element import WebElement

async def custom_cdp_integration():
    """Use Pydoll alongside your custom CDP implementation."""
    # Your existing CDP setup has found an element
    page_ws = 'ws://localhost:9222/devtools/page/ABC123'
    
    # You've used Runtime.evaluate to find an element
    # and got its objectId
    element_object_id = '{\"injectedScriptId\":1,\"id\":1}'
    
    # Create Pydoll connection
    connection = ConnectionHandler(ws_address=page_ws)
    
    # Wrap the element
    button = WebElement(
        object_id=element_object_id,
        connection_handler=connection
    )
    
    # Use Pydoll's high-level methods
    await button.wait_until(is_visible=True, timeout=5)
    await button.wait_until(is_interactable=True)
    
    # Click with realistic offset
    await button.click(x_offset=5, y_offset=5)
    
    # Get computed properties easily
    is_enabled = await button.is_enabled()
    bounds = await button.bounds
    
    print(f"Button clicked! Enabled: {is_enabled}, Bounds: {bounds}")
    
    # Cleanup
    await connection.close()

asyncio.run(custom_cdp_integration())
```

!!! tip "Object ID Format"
    The `objectId` is a string returned by CDP commands like `Runtime.evaluate` or `DOM.resolveNode`. It's usually a JSON string with fields like `injectedScriptId` and `id`.


!!! info "Best of Both Worlds"
    This hybrid approach lets you leverage your existing CDP infrastructure while benefiting from Pydoll's ergonomic element API for interactions, waits, and property access.

## Security Considerations

!!! danger "Production Environments"
    Remote debugging ports expose **full control** over the browser, including:
    
    - Access to all pages and data
    - Ability to execute arbitrary JavaScript
    - Cookie and session access
    - File system access via downloads
    
    **Never expose debugging ports to the internet without proper authentication and network security!**

### Recommended Security Practices

| Practice | Why | How |
|----------|-----|-----|
| **SSH Tunnels** | Encrypt traffic and authenticate | `ssh -L 9222:localhost:9222 user@host` |
| **VPN** | Network-level security | Connect via corporate/private VPN |
| **Firewall Rules** | Restrict access | Allow only specific IPs |
| **Docker Networks** | Container isolation | Use private Docker networks |
| **No Public Exposure** | Prevent attacks | Never bind to `0.0.0.0` in production |

## Further Reading

- **[Event System](event-system.md)** - Monitor remote browser events
- **[Network Monitoring](../network/monitoring.md)** - Track requests in remote browsers
- **[Browser Options](../configuration/browser-options.md)** - Configure local browsers before starting

!!! tip "Start Local, Scale Remote"
    Develop your automation locally with `browser.start()` for quick iterations, then deploy with `browser.connect()` for production CI/CD pipelines and containerized environments.


================================================
FILE: docs/en/features/automation/file-operations.md
================================================
# File Operations

File uploads are one of the most challenging aspects of browser automation. Traditional tools often struggle with OS-level file dialogs, requiring complex workarounds or external libraries. Pydoll provides two straightforward approaches for handling file uploads, each suited for different scenarios.

## Upload Methods

Pydoll supports two primary methods for file uploads:

1. **Direct file input** (`set_input_files()`): Fast and direct, works with `<input type="file">` elements
2. **File chooser context manager** (`expect_file_chooser()`): Intercepts the file dialog, works with any upload trigger

## Direct File Input

The simplest approach is using `set_input_files()` directly on file input elements. This method is fast, reliable, and bypasses the OS file dialog entirely.

### Basic Usage

```python
import asyncio
from pathlib import Path
from pydoll.browser.chromium import Chrome

async def direct_file_upload():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com/upload')
        
        # Find the file input element
        file_input = await tab.find(tag_name='input', type='file')
        
        # Set the file directly
        file_path = Path('path/to/document.pdf')
        await file_input.set_input_files(file_path)
        
        # Submit the form
        submit_button = await tab.find(id='submit-button')
        await submit_button.click()
        
        print("File uploaded successfully!")

asyncio.run(direct_file_upload())
```

!!! tip "Path vs String"
    While `Path` objects from `pathlib` are recommended as best practice for better path handling and cross-platform compatibility, you can also use plain strings if preferred:
    ```python
    await file_input.set_input_files('path/to/document.pdf')  # Also works!
    ```

### Multiple Files

For inputs that accept multiple files (`<input type="file" multiple>`), pass a list of file paths:

```python
import asyncio
from pathlib import Path
from pydoll.browser.chromium import Chrome

async def upload_multiple_files():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com/multi-upload')
        
        file_input = await tab.find(tag_name='input', type='file')
        
        # Upload multiple files at once
        files = [
            Path('documents/report.pdf'),
            Path('images/screenshot.png'),
            Path('data/results.csv')
        ]
        await file_input.set_input_files(files)
        
        # Process as normal
        upload_btn = await tab.find(id='upload-btn')
        await upload_btn.click()

asyncio.run(upload_multiple_files())
```

### Dynamic Path Resolution

`Path` objects make it easy to build paths dynamically and handle cross-platform compatibility:

```python
import asyncio
from pathlib import Path
from pydoll.browser.chromium import Chrome

async def upload_with_dynamic_paths():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com/upload')
        
        file_input = await tab.find(tag_name='input', type='file')
        
        # Build paths dynamically
        project_dir = Path(__file__).parent
        file_path = project_dir / 'uploads' / 'data.json'

        await file_input.set_input_files(file_path)
        # Or use home directory
        user_file = Path.home() / 'Documents' / 'report.pdf'
        await file_input.set_input_files(user_file)

asyncio.run(upload_with_dynamic_paths())
```

!!! tip "When to Use Direct File Input"
    Use `set_input_files()` when:
    
    - The file input is directly accessible in the DOM
    - You want maximum speed and simplicity
    - The upload doesn't trigger a file chooser dialog
    - You're working with standard `<input type="file">` elements

## File Chooser Context Manager

Some websites hide the file input and use custom buttons or drag-and-drop areas that trigger the OS file chooser dialog. For these cases, use the `expect_file_chooser()` context manager.

### How It Works

The `expect_file_chooser()` context manager:

1. Enables file chooser interception
2. Waits for the file chooser dialog to open
3. Automatically sets the files when the dialog appears
4. Cleans up after the operation completes

### Basic Usage

```python
import asyncio
from pathlib import Path
from pydoll.browser.chromium import Chrome

async def file_chooser_upload():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com/custom-upload')
        
        # Prepare the file path
        file_path = Path.cwd() / 'document.pdf'
        
        # Use context manager to handle file chooser
        async with tab.expect_file_chooser(files=file_path):
            # Click the custom upload button
            upload_button = await tab.find(class_name='custom-upload-btn')
            await upload_button.click()
            # File is automatically set when dialog opens
        
        # Continue with your automation
        print("File selected via chooser!")

asyncio.run(file_chooser_upload())
```

### Multiple Files with File Chooser

```python
import asyncio
from pathlib import Path
from pydoll.browser.chromium import Chrome

async def multiple_files_chooser():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com/gallery-upload')
        
        # Prepare multiple files
        photos_dir = Path.home() / 'photos'
        files = [
            photos_dir / 'img1.jpg',
            photos_dir / 'img2.jpg',
            photos_dir / 'img3.jpg'
        ]
        
        async with tab.expect_file_chooser(files=files):
            # Trigger upload via custom button
            add_photos_btn = await tab.find(text='Add Photos')
            await add_photos_btn.click()
        
        print(f"{len(files)} files selected!")

asyncio.run(multiple_files_chooser())
```

### Dynamic File Selection

```python
import asyncio
from pathlib import Path
from pydoll.browser.chromium import Chrome

async def dynamic_file_selection():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com/batch-upload')
        
        # Find all CSV files in a directory using Path.glob()
        data_dir = Path('data')
        csv_files = list(data_dir.glob('*.csv'))
        
        async with tab.expect_file_chooser(files=csv_files):
            upload_area = await tab.find(class_name='drop-zone')
            await upload_area.click()
        
        print(f"Selected {len(csv_files)} CSV files")

asyncio.run(dynamic_file_selection())
```

!!! tip "When to Use File Chooser"
    Use `expect_file_chooser()` when:
    
    - The file input is hidden or not directly accessible
    - Custom buttons trigger the file chooser dialog
    - Working with drag-and-drop upload areas
    - The site uses JavaScript to open file dialogs

## Comparison: Direct vs File Chooser

| Feature | `set_input_files()` | `expect_file_chooser()` |
|---------|---------------------|-------------------------|
| **Speed** | ⚡ Instant | 🕐 Waits for dialog |
| **Complexity** | Simple | Requires context manager |
| **Requirements** | Visible file input | Any upload trigger |
| **Use Case** | Standard forms | Custom upload UIs |
| **Event Handling** | Not needed | Uses page events |

## Complete Example

Here's a comprehensive example combining both approaches:

```python
import asyncio
from pathlib import Path
from pydoll.browser.chromium import Chrome

async def comprehensive_upload_example():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com/upload-form')
        
        # Scenario 1: Direct input for profile picture (single file)
        avatar_input = await tab.find(id='avatar-upload')
        avatar_path = Path.home() / 'Pictures' / 'profile.jpg'
        await avatar_input.set_input_files(avatar_path)
        
        # Wait a bit for preview to load
        await asyncio.sleep(1)
        
        # Scenario 2: File chooser for document upload
        document_path = Path.cwd() / 'documents' / 'resume.pdf'
        async with tab.expect_file_chooser(files=document_path):
            # Custom styled button that triggers file chooser
            upload_btn = await tab.find(class_name='btn-upload-document')
            await upload_btn.click()
        
        # Wait for upload confirmation
        await asyncio.sleep(2)
        
        # Scenario 3: Multiple files via file chooser
        certs_dir = Path('certs')
        certificates = [
            certs_dir / 'certificate1.pdf',
            certs_dir / 'certificate2.pdf',
            certs_dir / 'certificate3.pdf'
        ]
        async with tab.expect_file_chooser(files=certificates):
            add_certs_btn = await tab.find(text='Add Certificates')
            await add_certs_btn.click()
        
        # Submit the complete form
        submit_button = await tab.find(type='submit')
        await submit_button.click()
        
        # Wait for success message
        success_msg = await tab.find(class_name='success-message', timeout=10)
        message_text = await success_msg.text
        print(f"Upload result: {message_text}")

asyncio.run(comprehensive_upload_example())
```

!!! info "Method Summary"
    This example demonstrates the flexibility of Pydoll's file upload system:
    
    - **Single files**: Pass `Path` or `str` directly (no list needed)
    - **Multiple files**: Pass a list of `Path` or `str` objects
    - **Direct input**: Fast for visible `<input>` elements
    - **File chooser**: Works with custom upload buttons and hidden inputs

## Learn More

For deeper understanding of the file upload mechanisms:

- **[Event System](../advanced/event-system.md)**: Learn about the page events used by `expect_file_chooser()`
- **[Deep Dive: Tab Domain](../../deep-dive/tab-domain.md#file-chooser-handling)**: Technical details on file chooser interception
- **[Deep Dive: Event System](../../deep-dive/event-system.md#file-chooser-events)**: How file chooser events work under the hood

File operations in Pydoll eliminate one of the biggest pain points in browser automation, providing clean, reliable methods for both simple and complex upload scenarios.


================================================
FILE: docs/en/features/automation/human-interactions.md
================================================
# Human-Like Interactions

One of the key differentiators between successful automation and easily-detected bots is how realistic the interactions are. Pydoll provides sophisticated tools to make your automation virtually indistinguishable from human behavior.

!!! info "Feature Status"
    **Already Implemented:**

    - **Humanized Keyboard**: Variable typing speed, realistic typos with auto-correction (pass `humanize=True`)
    - **Humanized Scroll**: Physics-based scrolling with momentum, friction, jitter, and overshoot (pass `humanize=True`)
    - **Humanized Mouse**: Bezier curve paths, Fitts's Law timing, minimum-jerk velocity, tremor, and overshoot (pass `humanize=True`)

    **Coming Soon:**

    - **Automatic random click offsets**: Optional parameter to automatically randomize click positions within elements
    - **Hover behavior**: Realistic delays and movement when hovering over elements

## Why Human-Like Interactions Matter

Modern websites employ sophisticated bot detection techniques:

- **Event timing analysis**: Detecting impossibly fast or perfectly timed actions
- **Mouse movement tracking**: Identifying straight-line movements or instant teleportation
- **Keyboard patterns**: Spotting instant text insertion without individual keystrokes
- **Click positions**: Detecting clicks always at exact center of elements
- **Action sequences**: Identifying non-human patterns in user behavior

Pydoll helps you avoid detection by providing realistic interaction methods that mimic real user behavior.

## Realistic Mouse Movement

The Mouse API (`tab.mouse`) provides humanized cursor control with multiple layers of realism. When `humanize=True`, mouse movements follow natural Bezier curve paths with Fitts's Law timing, minimum-jerk velocity profiles, physiological tremor, and overshoot correction.

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def humanized_mouse():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com')

        # Move with natural curved path
        await tab.mouse.move(500, 300, humanize=True)

        # Click with realistic movement, offset, and timing
        await tab.mouse.click(500, 300, humanize=True)

        # Drag with natural movement
        await tab.mouse.drag(100, 200, 500, 400, humanize=True)

asyncio.run(humanized_mouse())
```

Key techniques applied during humanized mouse operations:

- **Bezier curve paths**: Curved trajectories with asymmetric control points (more curvature early in the movement)
- **Fitts's Law timing**: Movement duration scales with distance: `MT = a + b × log₂(D/W + 1)`
- **Minimum-jerk velocity**: Bell-shaped speed profile, slow start, peak in the middle, slow end
- **Physiological tremor**: Gaussian noise (σ ≈ 1px) scaled inversely with velocity
- **Overshoot and correction**: ~70% chance of overshooting fast movements by 3–12%, then correcting back

!!! info "Dedicated Mouse Control Documentation"
    For comprehensive mouse control documentation, including all methods, custom timing configuration, position tracking, and debug mode, see **[Mouse Control](mouse-control.md)**.

## Realistic Clicking

### Basic Click with Simulated Mouse Events

The `click()` method simulates real mouse press and release events, unlike JavaScript-based clicking:

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def realistic_clicking():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com')
        
        button = await tab.find(id="submit-button")
        
        # Basic realistic click
        await button.click()
        
        # The click includes:
        # - Mouse move to element
        # - Mouse press event
        # - Configurable hold time
        # - Mouse release event

asyncio.run(realistic_clicking())
```

### Click with Position Offset

Real users rarely click at the exact center of elements. Use offsets to vary click positions:

!!! info "Current State: Manual Offset Calculation"
    Currently, you must manually calculate and randomize click offsets for each interaction. Future versions will include an optional parameter to automatically randomize click positions within element bounds.

```python
import asyncio
import random
from pydoll.browser.chromium import Chrome

async def click_with_offset():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com/form')
        
        submit_button = await tab.find(tag_name="button", type="submit")
        
        # Click slightly off-center (more natural)
        await submit_button.click(
            x_offset=5,   # 5 pixels right of center
            y_offset=-3   # 3 pixels above center
        )
        
        # Currently: Manually vary the offset for each click to appear more human
        for item in await tab.find(class_name="clickable-item", find_all=True):
            offset_x = random.randint(-10, 10)
            offset_y = random.randint(-10, 10)
            await item.click(x_offset=offset_x, y_offset=offset_y)
            await asyncio.sleep(random.uniform(0.5, 2.0))

asyncio.run(click_with_offset())
```

### Adjustable Click Hold Time

Vary the duration of mouse button press to simulate different click styles:

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def variable_hold_time():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com')
        
        button = await tab.find(class_name="action-button")
        
        # Quick click (default is 0.1s)
        await button.click(hold_time=0.05)
        
        # Normal click
        await button.click(hold_time=0.1)
        
        # Slower, more deliberate click
        await button.click(hold_time=0.2)
        
        # Simulate user hesitation
        await asyncio.sleep(0.8)
        await button.click(hold_time=0.15)

asyncio.run(variable_hold_time())
```

### When to Use click() vs click_using_js()

Understanding the difference is crucial for avoiding detection:

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def click_methods_comparison():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com')
        
        button = await tab.find(id="interactive-button")
        
        # Method 1: click() - Simulates real mouse events
        # ✅ Triggers all mouse events (mousedown, mouseup, click)
        # ✅ Respects element positioning
        # ✅ More realistic and harder to detect
        # ❌ Requires element to be visible and in viewport
        await button.click()
        
        # Method 2: click_using_js() - Uses JavaScript click()
        # ✅ Works on hidden elements
        # ✅ Faster execution
        # ✅ Bypasses visual overlays
        # ❌ May be detected as automation
        # ❌ Doesn't trigger same event sequence as real user
        await button.click_using_js()

asyncio.run(click_methods_comparison())
```

!!! tip "Best Practice: Prefer Mouse Events"
    Use `click()` for user-facing interactions to maintain realism. Reserve `click_using_js()` for backend operations, hidden elements, or when speed is critical and detection isn't a concern.

## Realistic Text Input

Pydoll's keyboard API provides two typing modes to balance speed and stealth.

!!! info "Understanding Typing Modes"
    | Mode | Parameters | Behavior | Use Case |
    |------|------------|----------|----------|
    | **Default (Fast)** | `humanize=False` | Fixed 50ms intervals, no typos | Speed-critical, low-risk scenarios (default) |
    | **Humanized** | `humanize=True` | Variable timing, ~2% typo rate with auto-correction | **Anti-bot evasion** |

    The `interval` parameter is deprecated. Pass `humanize=True` for realistic typing.

### Natural Typing with Humanization

When `humanize=True` is passed, `type_text()` uses humanized mode, simulating realistic human typing with variable speeds and occasional typos that are automatically corrected:

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def natural_typing():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com/login')
        
        username_field = await tab.find(id="username")
        password_field = await tab.find(id="password")

        # Variable speed: 30-120ms between keystrokes
        # ~2% typo rate with realistic correction behavior
        await username_field.type_text("john.doe@example.com", humanize=True)
        await password_field.type_text("MyC0mpl3xP@ssw0rd!", humanize=True)

asyncio.run(natural_typing())
```

### Fast Input for Non-Visible Fields

For fields that don't require realism (like hidden fields or backend operations), use `insert_text()`:

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def fast_vs_realistic_input():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com/form')
        
        username = await tab.find(id="username")
        await username.click()
        await username.type_text("john_doe", humanize=True)
        
        hidden_field = await tab.find(id="hidden-token")
        await hidden_field.insert_text("very-long-generated-token-12345678")
        
        comment = await tab.find(id="comment-box")
        await comment.click()
        await comment.type_text("This looks like human input!", humanize=True)

asyncio.run(fast_vs_realistic_input())
```

!!! info "Advanced Keyboard Control"
    For comprehensive keyboard control documentation, including special keys, key combinations, modifiers, and complete key reference tables, see **[Keyboard Control](keyboard-control.md)**.

## Realistic Page Scrolling

Pydoll provides a dedicated scroll API that waits for scroll completion before proceeding, making your automations more realistic and reliable.

!!! info "Understanding Scroll Modes"
    Pydoll's scroll API offers **three distinct modes**:

    | Mode | Parameters | Behavior | Use Case |
    |------|------------|----------|----------|
    | **Smooth (Default)** | `smooth=True` | CSS-based animation, predictable | General browsing simulation (default) |
    | **Humanized** | `humanize=True` | Physics engine with momentum, jitter, overshoot | **Anti-bot evasion** |
    | **Instant** | `smooth=False` | Teleports to position immediately | Speed-critical operations |

    Pass `humanize=True` for physics-based humanized scrolling to evade bot detection.

### Basic Directional Scrolling

Use the `scroll.by()` method to scroll the page in any direction with precise control:

```python
import asyncio
from pydoll.browser.chromium import Chrome
from pydoll.constants import ScrollPosition

async def basic_scrolling():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com/long-page')
        
        # Humanized - physics engine with Bezier curves
        # Includes: momentum, friction, jitter, micro-pauses, overshoot
        await tab.scroll.by(ScrollPosition.DOWN, 500, humanize=True)
        await tab.scroll.by(ScrollPosition.UP, 300, humanize=True)

        # CSS-based animation - looks nice but predictable timing
        await tab.scroll.by(ScrollPosition.DOWN, 500, humanize=False, smooth=True)

        # Teleports instantly - fastest but easily detectable
        await tab.scroll.by(ScrollPosition.DOWN, 1000, humanize=False, smooth=False)

asyncio.run(basic_scrolling())
```

### Scrolling to Specific Positions

Navigate to the top or bottom of the page with control over realism:

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def scroll_to_positions():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com/article')
        
        # Read the beginning of the article
        await asyncio.sleep(2.0)
        
        # Humanized scroll (physics engine, anti-bot evasion)
        await tab.scroll.to_bottom(humanize=True)
        await asyncio.sleep(1.5)
        await tab.scroll.to_top(humanize=True)

        # CSS smooth scroll (predictable animation)
        await tab.scroll.to_bottom(humanize=False, smooth=True)
        await asyncio.sleep(1.5)
        await tab.scroll.to_top(humanize=False, smooth=True)

asyncio.run(scroll_to_positions())
```

!!! tip "Choosing the Right Mode"
    - **`humanize=True`**: Best for anti-bot evasion
    - **Default** (`smooth=True`): Good for demos, screenshots, and general automation
    - **`smooth=False`**: Maximum speed when stealth is not a concern

### Human-Like Scrolling Patterns

Pydoll's scroll engine uses **Cubic Bezier curves** to simulate the physics of human scrolling. This includes:

- **Momentum**: Initial burst of speed followed by gradual deceleration.
- **Friction**: Natural slowing down based on "physical" resistance.
- **Micro-pauses**: Brief stops during long scrolls, mimicking reading or eye movement.
- **Overshoot**: Occasional scrolling past the target and correcting back.

This behavior is automatically enabled when you use `humanize=True`.

```python
import asyncio
import random
from pydoll.browser.chromium import Chrome
from pydoll.constants import ScrollPosition

async def human_like_scrolling():
    """Simulate natural scrolling patterns while reading an article."""
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com/article')
        
        # User starts reading from top
        await asyncio.sleep(random.uniform(2.0, 4.0))
        
        # Gradually scroll while reading
        # The scroll engine handles the physics (acceleration/deceleration)
        for _ in range(random.randint(5, 8)):
            # Varied scroll distances (simulates reading speed)
            scroll_distance = random.randint(300, 600)
            await tab.scroll.by(
                ScrollPosition.DOWN, 
                scroll_distance, 
                humanize=True # Enables Bezier curve physics
            )
            
            # Pause to "read" content
            await asyncio.sleep(random.uniform(2.0, 5.0))
        
        # Quick scroll to check the end
        await tab.scroll.to_bottom(humanize=True)
        await asyncio.sleep(random.uniform(1.0, 2.0))
        
        # Scroll back to top to re-read something
        await tab.scroll.to_top(humanize=True)

asyncio.run(human_like_scrolling())
```

### Scrolling Elements into View

Use `scroll_into_view()` to ensure elements are visible before taking page screenshots:

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def scroll_for_screenshots():
    """Scroll elements into view before capturing page screenshots."""
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com/product')
        
        # Scroll to pricing section before taking full page screenshot
        pricing_section = await tab.find(id="pricing")
        await pricing_section.scroll_into_view()
        await tab.take_screenshot(path="page_with_pricing.png")
        
        # Scroll to reviews section before screenshot
        reviews = await tab.find(class_name="reviews")
        await reviews.scroll_into_view()
        await tab.take_screenshot(path="page_with_reviews.png")
        
        # Scroll to footer to capture complete page state
        footer = await tab.find(tag_name="footer")
        await footer.scroll_into_view()
        await tab.take_screenshot(path="page_with_footer.png")
        
        # Note: click() already scrolls automatically, so no need for:
        # await button.scroll_into_view()  # Unnecessary!
        # await button.click()  # This already scrolls the button into view

asyncio.run(scroll_for_screenshots())
```

### Handling Infinite Scroll Content

Implement scrolling patterns to load lazy-loaded content:

```python
import asyncio
import random
from pydoll.browser.chromium import Chrome
from pydoll.constants import ScrollPosition

async def infinite_scroll_loading():
    """Load content on infinite scroll pages."""
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com/feed')
        
        items_loaded = 0
        max_scrolls = 10
        
        for scroll_num in range(max_scrolls):
            # Scroll to bottom to trigger loading
            await tab.scroll.to_bottom(smooth=True)
            
            # Wait for content to load
            await asyncio.sleep(random.uniform(2.0, 3.0))
            
            # Check if new items were loaded
            items = await tab.find(class_name="feed-item", find_all=True)
            new_count = len(items)
            
            if new_count == items_loaded:
                print("No more content to load")
                break
            
            items_loaded = new_count
            print(f"Scroll {scroll_num + 1}: {items_loaded} items loaded")
            
            # Small scroll up (human behavior)
            if random.random() > 0.7:
                await tab.scroll.by(ScrollPosition.UP, 200, smooth=True)
                await asyncio.sleep(random.uniform(0.5, 1.0))

asyncio.run(infinite_scroll_loading())
```

!!! success "Automatic Completion Waiting"
    Unlike `execute_script("window.scrollBy(...)")` which returns immediately, the `scroll` API uses CDP's `awaitPromise` parameter to wait for the browser's `scrollend` event. This ensures your subsequent actions only execute after scrolling completely finishes.

## Combining Techniques for Maximum Realism

### Complete Form Filling Example

Here's a comprehensive example combining all human-like interaction techniques. **This demonstrates the current manual approach** for achieving maximum realism. Future versions will automate much of this randomization:

```python
import asyncio
import random
from pydoll.browser.chromium import Chrome
from pydoll.constants import Key

async def human_like_form_filling():
    """Fill a form with maximum realism to avoid detection."""
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com/registration')
        
        # Wait a bit (user reading the page)
        await asyncio.sleep(random.uniform(1.5, 3.0))
        
        # Fill first name with variable typing speed
        first_name = await tab.find(id="first-name")
        await first_name.click(
            x_offset=random.randint(-5, 5),
            y_offset=random.randint(-5, 5)
        )
        await asyncio.sleep(random.uniform(0.2, 0.5))
        
        # Manual character-by-character typing with randomized delays
        # (This will be automated in future versions)
        name_text = "John"
        for char in name_text:
            await first_name.type_text(char, interval=0)
            await asyncio.sleep(random.uniform(0.08, 0.22))
        
        # Tab to next field
        await asyncio.sleep(random.uniform(0.3, 0.8))
        await first_name.press_keyboard_key(Key.TAB)
        
        # Fill last name
        await asyncio.sleep(random.uniform(0.2, 0.5))
        last_name = await tab.find(id="last-name")
        await last_name.type_text("Doe", interval=random.uniform(0.1, 0.18))
        
        # Tab to email
        await asyncio.sleep(random.uniform(0.4, 1.0))
        await last_name.press_keyboard_key(Key.TAB)
        
        # Fill email with realistic pauses
        await asyncio.sleep(random.uniform(0.2, 0.5))
        email = await tab.find(id="email")
        
        email_text = "john.doe@example.com"
        for i, char in enumerate(email_text):
            await email.type_text(char, interval=0)
            # Longer pause at @ and . symbols (natural)
            if char in ['@', '.']:
                await asyncio.sleep(random.uniform(0.2, 0.4))
            else:
                await asyncio.sleep(random.uniform(0.08, 0.2))
        
        # Simulate user reviewing what they typed
        await asyncio.sleep(random.uniform(1.0, 2.5))
        
        # Accept terms checkbox with offset
        terms_checkbox = await tab.find(id="accept-terms")
        await terms_checkbox.click(
            x_offset=random.randint(-3, 3),
            y_offset=random.randint(-3, 3),
            hold_time=random.uniform(0.08, 0.15)
        )
        
        # Pause before submitting (user reviewing form)
        await asyncio.sleep(random.uniform(1.5, 3.0))
        
        # Click submit with realistic parameters
        submit_button = await tab.find(tag_name="button", type="submit")
        await submit_button.click(
            x_offset=random.randint(-8, 8),
            y_offset=random.randint(-5, 5),
            hold_time=random.uniform(0.1, 0.2)
        )
        
        print("Form submitted with human-like behavior")

asyncio.run(human_like_form_filling())
```

## Best Practices for Avoiding Detection

!!! tip "Manual Randomization Currently Required"
    The following best practices represent the **current state of Pydoll**, where you must manually implement randomization. While this requires more code, it gives you fine-grained control over behavior. Future versions will automate these patterns while maintaining the same level of realism.

### 1. Always Add Random Delays

```python
import asyncio
import random
from pydoll.browser.chromium import Chrome

# Bad: Predictable timing
await element1.click()
await element2.click()
await element3.click()

# Good: Variable timing (currently required)
await element1.click()
await asyncio.sleep(random.uniform(0.5, 1.5))
await element2.click()
await asyncio.sleep(random.uniform(0.8, 2.0))
await element3.click()
```

### 2. Vary Click Positions

```python
import asyncio
import random
from pydoll.browser.chromium import Chrome

# Bad: Always center clicks
for button in buttons:
    await button.click()

# Good: Varied positions (currently manual)
for button in buttons:
    await button.click(
        x_offset=random.randint(-10, 10),
        y_offset=random.randint(-10, 10)
    )
```

### 3. Simulate Natural User Behavior

```python
import asyncio
import random
from pydoll.browser.chromium import Chrome
from pydoll.constants import ScrollPosition

async def natural_user_simulation(tab):
    # User arrives at page
    await tab.go_to('https://example.com')
    
    # User reads page content (1-3 seconds)
    await asyncio.sleep(random.uniform(1.0, 3.0))
    
    # User scrolls down to see more
    await tab.scroll.by(ScrollPosition.DOWN, 300, smooth=True)
    await asyncio.sleep(random.uniform(0.5, 1.5))
    
    # User finds and clicks button
    button = await tab.find(class_name="cta-button")
    await button.click(
        x_offset=random.randint(-5, 5),
        y_offset=random.randint(-5, 5)
    )
    
    # User waits for content to load
    await asyncio.sleep(random.uniform(0.8, 1.5))
```

### 4. Combine Multiple Techniques

```python
import asyncio
import random
from pydoll.browser.chromium import Chrome
from pydoll.constants import ScrollPosition

async def advanced_stealth_automation():
    """Combine multiple techniques for maximum stealth."""
    async with Chrome() as browser:
        tab = await browser.start()
        
        # Use human-like page load waiting
        await tab.go_to('https://example.com/sensitive-page')
        await asyncio.sleep(random.uniform(2.0, 4.0))
        
        # Scroll realistically with the dedicated API
        for _ in range(random.randint(2, 4)):
            scroll_amount = random.randint(200, 500)
            await tab.scroll.by(ScrollPosition.DOWN, scroll_amount, smooth=True)
            await asyncio.sleep(random.uniform(0.8, 2.0))
        
        # Find element with timeout (simulating user search)
        target = await tab.find(
            class_name="target-element",
            timeout=random.randint(3, 7)
        )
        
        # Click with all realistic parameters
        await target.click(
            x_offset=random.randint(-12, 12),
            y_offset=random.randint(-8, 8),
            hold_time=random.uniform(0.09, 0.18)
        )
        
        # Human reaction time
        await asyncio.sleep(random.uniform(0.5, 1.2))

asyncio.run(advanced_stealth_automation())
```

## Performance vs Realism Trade-offs

Sometimes you need to balance speed with realism:

```python
import asyncio
import random
from pydoll.browser.chromium import Chrome

async def balanced_automation():
    """Choose appropriate realism level based on context."""
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com/scraping-target')
        
        # Phase 1: Initial interaction (high realism)
        # This is when detection systems are most active
        login_button = await tab.find(text="Login")
        await asyncio.sleep(random.uniform(1.0, 2.0))
        await login_button.click(
            x_offset=random.randint(-5, 5),
            y_offset=random.randint(-5, 5)
        )
        
        await asyncio.sleep(random.uniform(0.5, 1.0))
        
        username = await tab.find(id="username")
        await username.type_text("user@example.com", interval=0.12)
        
        await asyncio.sleep(random.uniform(0.3, 0.7))
        
        password = await tab.find(id="password")
        await password.type_text("password123", interval=0.10)
        
        submit = await tab.find(type="submit")
        await asyncio.sleep(random.uniform(0.8, 1.5))
        await submit.click()
        
        # Phase 2: Authenticated data extraction (lower realism, higher speed)
        # Less scrutiny after successful authentication
        await asyncio.sleep(2)
        
        # Fast navigation through pages
        items = await tab.find(class_name="data-item", find_all=True)
        
        for item in items:
            # Quick click without offsets
            await item.click_using_js()
            await asyncio.sleep(0.3)  # Minimal delay
            
            # Extract data
            title = await tab.find(class_name="title")
            data = await title.text
            
            # Fast navigation
            await tab.execute_script("window.history.back()")
            await asyncio.sleep(0.5)

asyncio.run(balanced_automation())
```

## Monitoring and Adjusting

Test your automation's realism:

```python
import asyncio
import random
import time
from pydoll.browser.chromium import Chrome

async def test_interaction_timing():
    """Log timing to ensure realistic patterns."""
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com/test-page')
        
        # Measure and log interaction timing
        elements = await tab.find(class_name="clickable", find_all=True)
        
        timings = []
        last_time = time.time()
        
        for i, element in enumerate(elements):
            await element.click(
                x_offset=random.randint(-8, 8),
                y_offset=random.randint(-8, 8)
            )
            
            current_time = time.time()
            elapsed = current_time - last_time
            timings.append(elapsed)
            
            print(f"Click {i+1}: {elapsed:.3f}s since last action")
            last_time = current_time
            
            await asyncio.sleep(random.uniform(0.5, 2.0))
        
        # Analyze timing distribution (skipped when no elements were clicked)
        if timings:
            avg_time = sum(timings) / len(timings)
            print(f"\nAverage time between actions: {avg_time:.3f}s")
            print(f"Min: {min(timings):.3f}s, Max: {max(timings):.3f}s")
        
        # Good: Variable timing with realistic average (1-2 seconds)
        # Bad: Constant timing or unrealistically fast (<0.1s)

asyncio.run(test_interaction_timing())
```

## Learn More

For more information about element interaction methods:

- **[Element Finding](../element-finding.md)**: Locate elements to interact with
- **[WebElement Domain](../../deep-dive/webelement-domain.md)**: Deep dive into WebElement capabilities
- **[File Operations](file-operations.md)**: Upload files and handle downloads

Master human-like interactions, and your automation will be more reliable, harder to detect, and more closely mirror real user behavior.


================================================
FILE: docs/en/features/automation/iframes.md
================================================
# Working with IFrames

Modern web pages embed content from other documents using `<iframe>`. In previous versions of Pydoll you had to convert an iframe into a `Tab` using `tab.get_frame()` and keep track of CDP targets manually. **That is no longer necessary.**  
An iframe now behaves like any other `WebElement`: you can call `find()`, `query()`, `execute_script()`, `inner_html`, `text`, and all element helpers directly—Pydoll will transparently execute the request inside the correct browsing context.

!!! info "Simpler mental model"
    Treat an iframe exactly like a div: locate it once and use it as the starting point for new element searches. Pydoll handles cross-origin frames, isolated execution contexts, and nested frames behind the scenes.

## Quick Start

### Interact with the first iframe on the page

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def interact_with_iframe():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com/page-with-iframe')

        iframe = await tab.find(tag_name='iframe', id='content-frame')

        # These methods execute inside the iframe automatically
        title = await iframe.find(tag_name='h1')
        await title.click()

        form = await iframe.find(id='login-form')
        username = await form.find(name='username')
        await username.type_text('john_doe')

asyncio.run(interact_with_iframe())
```

### Nested iframes

Need to reach a frame inside another frame? Chain your searches:

```python
outer = await tab.find(id='outer-frame')
inner = await outer.find(tag_name='iframe')   # Search inside the outer iframe

submit_button = await inner.find(id='submit')
await submit_button.click()
```

The algorithm is always the same:

1. Find the iframe element.
2. Use that `WebElement` to continue searching.
3. Repeat for deeper levels if required.

There is no need to cache frame targets or create additional `Tab` instances.

### Execute JavaScript in an iframe

```python
iframe = await tab.find(tag_name='iframe')
result = await iframe.execute_script('return document.title', return_by_value=True)
print(result['result']['result']['value'])
```

Pydoll automatically runs the script within the iframe’s isolated execution context (cross-origin and same-origin frames work the same way).

## Why this is better

- **Intuitive:** what you see in the DOM tree is what you code—if you can select the `iframe` element, you can interact with everything inside it.
- **Cross-origin friendly:** Pydoll spins up an isolated world for you; no more manual target resolution.
- **Nested by design:** each search is scoped to the element you call it on, so deep hierarchies stay manageable.
- **No API split:** you do not have to switch between `Tab` and `WebElement` methods—one set of primitives is enough.

!!! tip "Deprecation notice"
    `Tab.get_frame()` now emits a `DeprecationWarning` and will be removed in a future release. Update existing snippets to work directly with iframe elements as shown above.

## Frequently used patterns

### Take a screenshot from inside an iframe

```python
iframe = await tab.find(tag_name='iframe')
chart = await iframe.find(id='sales-chart')
await chart.take_screenshot('chart.png')
```


## Cross-iframe Selectors

Instead of manually finding each iframe and then searching inside it, you can write a **single selector** that crosses iframe boundaries. Pydoll automatically detects `iframe` steps in your XPath or CSS selector, splits them into segments, and walks the iframe chain for you.

### CSS selectors

Use any standard combinator (`>`, space) after an `iframe` compound:

```python
# Single iframe crossing
button = await tab.query('iframe > .submit-btn')

# With attribute selectors on the iframe
button = await tab.query('iframe[src*="checkout"] > #pay-button')

# Nested iframes
element = await tab.query('iframe.outer > iframe.inner > div.content')

# Multiple steps after the iframe
link = await tab.query('iframe > nav > a.home-link')

# Iframe inside another element (not at root)
button = await tab.query('div > iframe > button.submit')
content = await tab.query('.wrapper iframe > div.content')
```

### XPath expressions

Use `/` or `//` after an `iframe` step — Pydoll splits the expression at the iframe node:

```python
# Single iframe crossing
button = await tab.query('//iframe/body/button[@id="submit"]')

# Iframe inside another element (not at root)
div = await tab.query('//div/iframe/div')
item = await tab.query('//div[@class="wrapper"]/iframe/body/div')

# With predicates on the iframe
heading = await tab.query('//iframe[contains(@src, "cloudflare")]//h1')

# Nested iframes
element = await tab.query('//iframe[@id="outer"]//iframe[@id="inner"]//div')
```

### How it works

When Pydoll encounters a selector like `iframe[src*="checkout"] > form > button`:

1. **Parses** the selector into segments: `iframe[src*="checkout"]` and `form > button`
2. **Finds** the iframe element using the first segment
3. **Searches inside** the iframe using the second segment
4. For nested iframes, repeats the process at each boundary

This is equivalent to the manual approach but in a single call:

```python
# Manual (still works)
iframe = await tab.find(tag_name='iframe', src='*checkout*')
button = await iframe.query('form > button')

# Automatic (same result, one line)
button = await tab.query('iframe[src*="checkout"] > form > button')
```

### When splitting does NOT happen

Selectors are only split when `iframe` appears as a **tag name**. These selectors pass through unchanged:

- `.iframe > body` — class selector, not a tag
- `#iframe > body` — ID selector
- `div.iframe > body` — tag is `div`, not `iframe`
- `[data-type="iframe"] > body` — attribute selector
- `iframe` or `//iframe` — no content after iframe (nothing to search inside)

### find_all support

The last segment respects `find_all=True`, returning all matching elements inside the final iframe:

```python
# Get all links inside an iframe
links = await tab.query('iframe > a', find_all=True)
```

## Best practices

- **Use the iframe element as scope:** call `find`, `query`, or other helpers on the iframe itself.
- **Avoid `tab.find` for inner content:** it only sees the top-level document.
- **Remember partial results:** if you need the same iframe repeatedly, store the `WebElement` reference; Pydoll keeps the underlying context cached.
- **Keep existing element workflows:** everything that works for a normal element (scrolling, screenshot, scripts, waiting) works for an iframe element too.

## Further reading

- **[Element Finding](../element-finding.md)** – covers scoped searches and chaining.
- **[Screenshots & PDFs](screenshots-and-pdfs.md)** – details about capturing visual output.
- **[Event System](../advanced/event-system.md)** – reactively monitor page activity, including frames.

Once you adapt to the new model, iframes become just another part of the DOM tree. Focus on building your automation logic—Pydoll takes care of the frame plumbing for you.


================================================
FILE: docs/en/features/automation/keyboard-control.md
================================================
# Keyboard Control

The Keyboard API provides complete control over keyboard input at the page level, enabling you to simulate realistic typing, execute shortcuts, and control complex key sequences. Unlike element-level keyboard methods, the Keyboard API operates globally on the page, giving you the flexibility to interact with any focused element or trigger page-level keyboard actions.

!!! info "Centralized Keyboard Interface"
    All keyboard operations are accessible via `tab.keyboard`, providing a clean, unified API for all keyboard interactions.

!!! warning "Important CDP Limitation: Browser UI Shortcuts Don't Work"
    **Known Issue**: Events injected via Chrome DevTools Protocol are marked as "untrusted" and do **not** trigger browser UI actions or create user gestures.
    
    **What DOESN'T work:**

    - Browser shortcuts (Ctrl+T, Ctrl+W, Ctrl+N)
    - DevTools shortcuts (F12, Ctrl+Shift+I)
    - Browser navigation (Ctrl+Shift+T to reopen tabs)
    - Any shortcut that modifies browser UI or windows
    
    **What WORKS perfectly:**

    - Page-level shortcuts (Ctrl+A, Ctrl+C, Ctrl+V, Ctrl+F)
    - Text selection and manipulation
    - Form navigation (Tab, Enter, Arrow keys)
    - Input field interactions
    - Custom application shortcuts (in web apps)
    
    **Technical reason**: CDP events don't create "user gestures" required by browser security. See [chromium issue #615341](https://bugs.chromium.org/p/chromium/issues/detail?id=615341) and [CDP documentation](https://chromedevtools.github.io/devtools-protocol/tot/Input/#method-dispatchKeyEvent).
    
    For browser-level automation, use CDP browser commands directly (like `tab.close()`, `browser.new_tab()`) instead of keyboard shortcuts.

## Quick Start

The Keyboard API provides four primary methods (`press()`, `hotkey()`, `down()`, and `up()`):

```python
from pydoll.browser.chromium import Chrome
from pydoll.constants import Key

async with Chrome() as browser:
    tab = await browser.start()
    await tab.go_to('https://example.com')

    # Press and release a key
    await tab.keyboard.press(Key.ENTER)
    
    # Execute a hotkey combination
    await tab.keyboard.hotkey(Key.CONTROL, Key.S)  # Ctrl+S
    
    # Manual control
    await tab.keyboard.down(Key.SHIFT)
    await tab.keyboard.press(Key.ARROWRIGHT)
    await tab.keyboard.up(Key.SHIFT)
```

## Core Methods

### Press: Complete Key Action

The `press()` method executes a full key press cycle (down → wait → up):

```python
from pydoll.constants import Key

# Basic key press
await tab.keyboard.press(Key.ENTER)
await tab.keyboard.press(Key.TAB)
await tab.keyboard.press(Key.ESCAPE)

# Press with modifiers
await tab.keyboard.press(Key.S, modifiers=2)  # Ctrl+S (manual modifier)

# Custom hold duration
await tab.keyboard.press(Key.SPACE, interval=0.5)  # Hold for 500ms
```

**Parameters:**

- `key`: Key to press (from `Key` enum)
- `modifiers` (optional): Modifier flags (Alt=1, Ctrl=2, Meta=4, Shift=8)
- `interval` (optional): Duration to hold key in seconds (default: 0.1)

### Down: Press Key Without Releasing

The `down()` method presses a key without releasing it, useful for holding modifiers or creating key sequences:

```python
from pydoll.constants import Key

# Hold Shift while pressing other keys
await tab.keyboard.down(Key.SHIFT)
await tab.keyboard.press(Key.ARROWRIGHT)  # Select text
await tab.keyboard.press(Key.ARROWRIGHT)  # Continue selecting
await tab.keyboard.up(Key.SHIFT)

# Press with modifier flags
await tab.keyboard.down(Key.A, modifiers=2)  # Ctrl+A (select all)
```

**Parameters:**

- `key`: Key to press down
- `modifiers` (optional): Modifier flags to apply

### Up: Release a Key

The `up()` method releases a previously pressed key:

```python
from pydoll.constants import Key

# Manual key sequence
await tab.keyboard.down(Key.CONTROL)
await tab.keyboard.down(Key.SHIFT)
await tab.keyboard.press(Key.T)  # Ctrl+Shift+T
await tab.keyboard.up(Key.SHIFT)
await tab.keyboard.up(Key.CONTROL)
```

**Parameters:**

- `key`: Key to release

!!! tip "When to Use Each Method"

    - **`press()`**: Single key actions (Enter, Tab, letters)
    - **`hotkey()`**: Keyboard shortcuts (Ctrl+C, Ctrl+Shift+T)
    - **`down()`/`up()`**: Complex sequences, holding modifiers, custom timing

## Hotkeys: Keyboard Shortcuts Made Easy

The `hotkey()` method automatically detects modifier keys and executes shortcuts correctly:

### Basic Hotkeys

```python
from pydoll.constants import Key

# Common shortcuts
await tab.keyboard.hotkey(Key.CONTROL, Key.C)  # Copy
await tab.keyboard.hotkey(Key.CONTROL, Key.V)  # Paste
await tab.keyboard.hotkey(Key.CONTROL, Key.X)  # Cut
await tab.keyboard.hotkey(Key.CONTROL, Key.Z)  # Undo
await tab.keyboard.hotkey(Key.CONTROL, Key.Y)  # Redo
await tab.keyboard.hotkey(Key.CONTROL, Key.A)  # Select all
await tab.keyboard.hotkey(Key.CONTROL, Key.S)  # Save

```

### Three-Key Combinations

```python
from pydoll.constants import Key

# Text editing shortcuts (these work!)
await tab.keyboard.hotkey(Key.CONTROL, Key.SHIFT, Key.ARROWLEFT)  # Select word left
await tab.keyboard.hotkey(Key.CONTROL, Key.SHIFT, Key.ARROWRIGHT)  # Select word right
await tab.keyboard.hotkey(Key.CONTROL, Key.SHIFT, Key.HOME)  # Select to start of document
await tab.keyboard.hotkey(Key.CONTROL, Key.SHIFT, Key.END)  # Select to end of document

# Application-specific shortcuts (if supported by the web app)
await tab.keyboard.hotkey(Key.CONTROL, Key.SHIFT, Key.Z)  # Redo in many apps
await tab.keyboard.hotkey(Key.CONTROL, Key.SHIFT, Key.S)  # Save As (if app supports it)
```

### Platform-Specific Shortcuts

```python
import sys
from pydoll.constants import Key

# Use Meta (Command) on macOS, Control on Windows/Linux
modifier = Key.META if sys.platform == 'darwin' else Key.CONTROL

await tab.keyboard.hotkey(modifier, Key.C)  # Copy (platform-aware)
await tab.keyboard.hotkey(modifier, Key.V)  # Paste (platform-aware)
```

### How Hotkeys Work

The `hotkey()` method intelligently handles modifier keys:

1. **Detects modifiers**: Automatically identifies Ctrl, Shift, Alt, Meta
2. **Calculates flags**: Combines modifiers using bitwise OR (Ctrl=2, Shift=8 → 10)
3. **Applies correctly**: Presses non-modifier keys with modifier flags applied
4. **Clean release**: Releases keys in reverse order

```python
from pydoll.constants import Key

# Behind the scenes for hotkey(Key.CONTROL, Key.SHIFT, Key.T):
# 1. Detect: modifiers=[CONTROL, SHIFT], keys=[T]
# 2. Calculate: modifier_value = 2 | 8 = 10
# 3. Execute: press T with modifiers=10
# 4. Release: release T
```

!!! tip "Modifier Values"
    When using `modifiers` parameter manually:

    - Alt = 1
    - Ctrl = 2
    - Meta/Command = 4
    - Shift = 8
    
    Combine them: Ctrl+Shift = 2 + 8 = 10

## Available Keys

The `Key` enum provides comprehensive keyboard coverage:

### Letter Keys (A-Z)

```python
from pydoll.constants import Key

# All letters A through Z
await tab.keyboard.press(Key.A)
await tab.keyboard.press(Key.Z)
```

### Number Keys

```python
from pydoll.constants import Key

# Top row numbers (0-9)
await tab.keyboard.press(Key.DIGIT0)
await tab.keyboard.press(Key.DIGIT9)

# Numpad numbers
await tab.keyboard.press(Key.NUMPAD0)
await tab.keyboard.press(Key.NUMPAD9)
```

### Function Keys

```python
from pydoll.constants import Key

# F1 through F12
await tab.keyboard.press(Key.F1)
await tab.keyboard.press(Key.F12)
```

### Navigation Keys

```python
from pydoll.constants import Key

await tab.keyboard.press(Key.ARROWUP)
await tab.keyboard.press(Key.ARROWDOWN)
await tab.keyboard.press(Key.ARROWLEFT)
await tab.keyboard.press(Key.ARROWRIGHT)
await tab.keyboard.press(Key.HOME)
await tab.keyboard.press(Key.END)
await tab.keyboard.press(Key.PAGEUP)
await tab.keyboard.press(Key.PAGEDOWN)
```

### Modifier Keys

```python
from pydoll.constants import Key

await tab.keyboard.press(Key.CONTROL)
await tab.keyboard.press(Key.SHIFT)
await tab.keyboard.press(Key.ALT)
await tab.keyboard.press(Key.META)  # Command on macOS, Windows key on Windows
```

### Special Keys

```python
from pydoll.constants import Key

await tab.keyboard.press(Key.ENTER)
await tab.keyboard.press(Key.TAB)
await tab.keyboard.press(Key.SPACE)
await tab.keyboard.press(Key.BACKSPACE)
await tab.keyboard.press(Key.DELETE)
await tab.keyboard.press(Key.ESCAPE)
await tab.keyboard.press(Key.INSERT)
```

## Practical Examples

### Form Navigation

```python
from pydoll.browser.chromium import Chrome
from pydoll.constants import Key

async def fill_form_with_keyboard():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com/form')
        
        # Focus first field and type
        first_field = await tab.find(id='name')
        await first_field.click()
        await first_field.insert_text('John Doe')
        
        # Navigate to next field with Tab
        await tab.keyboard.press(Key.TAB)
        await tab.keyboard.press(Key.TAB)  # Skip a field
        
        # Type in current focused field
        second_field = await tab.find(id='email')
        await second_field.insert_text('john@example.com')
        
        # Submit with Enter
        await tab.keyboard.press(Key.ENTER)
```

### Text Selection and Manipulation

```python
from pydoll.constants import Key

async def select_and_replace_text():
    # Select all text
    await tab.keyboard.hotkey(Key.CONTROL, Key.A)
    
    # Copy selection
    await tab.keyboard.hotkey(Key.CONTROL, Key.C)
    
    # Move to end
    await tab.keyboard.press(Key.END)
    
    # Select word by word
    await tab.keyboard.down(Key.CONTROL)
    await tab.keyboard.down(Key.SHIFT)
    await tab.keyboard.press(Key.ARROWLEFT)
    await tab.keyboard.press(Key.ARROWLEFT)
    await tab.keyboard.up(Key.SHIFT)
    await tab.keyboard.up(Key.CONTROL)
    
    # Delete selection
    await tab.keyboard.press(Key.DELETE)
```

### Dropdown and Select Navigation

```python
from pydoll.constants import Key

async def navigate_dropdown():
    # Open dropdown
    select = await tab.find(tag_name='select')
    await select.click()
    
    # Navigate options with arrow keys
    await tab.keyboard.press(Key.ARROWDOWN)
    await tab.keyboard.press(Key.ARROWDOWN)
    
    # Select with Enter
    await tab.keyboard.press(Key.ENTER)
    
    # Or cancel with Escape
    await tab.keyboard.press(Key.ESCAPE)
```

### Complex Key Sequences

```python
from pydoll.constants import Key
import asyncio

async def complex_editing():
    # Select line
    await tab.keyboard.press(Key.HOME)  # Go to start
    await tab.keyboard.down(Key.SHIFT)
    await tab.keyboard.press(Key.END)  # Select to end
    await tab.keyboard.up(Key.SHIFT)
    
    # Cut
    await tab.keyboard.hotkey(Key.CONTROL, Key.X)
    
    # Move down and paste
    await tab.keyboard.press(Key.ARROWDOWN)
    await tab.keyboard.hotkey(Key.CONTROL, Key.V)
    
    # Undo if needed
    await tab.keyboard.hotkey(Key.CONTROL, Key.Z)
```

## Best Practices

### 1. Add Delays for Reliability

```python
from pydoll.constants import Key
import asyncio

# Good: Wait for UI to update
await tab.keyboard.hotkey(Key.CONTROL, Key.F)  # Open find
await asyncio.sleep(0.2)  # Wait for dialog
await tab.keyboard.press(Key.ESCAPE)  # Close it

# Bad: No delay, it might not work
await tab.keyboard.hotkey(Key.CONTROL, Key.F)
await tab.keyboard.press(Key.ESCAPE)  # Might be too fast
```

### 2. Focus Elements Before Typing

```python
from pydoll.constants import Key

# Good: Ensure element is focused
input_field = await tab.find(id='search')
await input_field.click()  # Focus it
await input_field.insert_text('query')

# Bad: Keyboard input goes to wrong element
await tab.keyboard.press(Key.A)  # Where does this go?
```

### 3. Use Platform-Aware Shortcuts

```python
import sys
from pydoll.constants import Key

# Good: Platform-aware
cmd_key = Key.META if sys.platform == 'darwin' else Key.CONTROL
await tab.keyboard.hotkey(cmd_key, Key.C)

# Bad: Hardcoded (won't work on macOS)
await tab.keyboard.hotkey(Key.CONTROL, Key.C)
```

### 4. Clean Up Long Sequences

```python
from pydoll.constants import Key

# Good: Ensure modifiers are released
try:
    await tab.keyboard.down(Key.SHIFT)
    await tab.keyboard.press(Key.ARROWRIGHT)
    # ... more operations
finally:
    await tab.keyboard.up(Key.SHIFT)  # Always release

# Bad: Modifier stays pressed on error
await tab.keyboard.down(Key.SHIFT)
await tab.keyboard.press(Key.ARROWRIGHT)
# Error here leaves Shift pressed!
```

## Key Reference Tables

### Common Page-Level Shortcuts (These Work!)

| Action | Windows/Linux | macOS | Notes |
|--------|--------------|-------|-------|
| Copy | Ctrl+C | Cmd+C | Works |
| Paste | Ctrl+V | Cmd+V | Works |
| Cut | Ctrl+X | Cmd+X | Works |
| Undo | Ctrl+Z | Cmd+Z | Works |
| Redo | Ctrl+Y | Cmd+Shift+Z | Works |
| Select All | Ctrl+A | Cmd+A | Works |
| Find | Ctrl+F | Cmd+F | Only if web app implements it |
| Save | Ctrl+S | Cmd+S | Only if web app implements it |
| Refresh | F5 or Ctrl+R | Cmd+R | Use `await tab.refresh()` instead |

### Browser Shortcuts (These DON'T Work via CDP)

| Action | Shortcut | Use Instead |
|--------|----------|-------------|
| New Tab | Ctrl+T | `await browser.new_tab()` |
| Close Tab | Ctrl+W | `await tab.close()` |
| Reopen Tab | Ctrl+Shift+T | Track tabs manually |
| DevTools | F12, Ctrl+Shift+I | Already available via CDP! |
| Address Bar | Ctrl+L | `await tab.go_to(url)` |

### All Available Keys

| Category | Keys |
|----------|------|
| **Letters** | `Key.A` through `Key.Z` (26 keys) |
| **Numbers** | `Key.DIGIT0` through `Key.DIGIT9` (10 keys) |
| **Numpad** | `Key.NUMPAD0` through `Key.NUMPAD9`, `NUMPADMULTIPLY`, `NUMPADADD`, `NUMPADSUBTRACT`, `NUMPADDECIMAL`, `NUMPADDIVIDE` |
| **Function** | `Key.F1` through `Key.F12` (12 keys) |
| **Navigation** | `ARROWUP`, `ARROWDOWN`, `ARROWLEFT`, `ARROWRIGHT`, `HOME`, `END`, `PAGEUP`, `PAGEDOWN` |
| **Modifiers** | `CONTROL`, `SHIFT`, `ALT`, `META` |
| **Special** | `ENTER`, `TAB`, `SPACE`, `BACKSPACE`, `DELETE`, `ESCAPE`, `INSERT` |
| **Locks** | `CAPSLOCK`, `NUMLOCK`, `SCROLLLOCK` |
| **Symbols** | `SEMICOLON`, `EQUALSIGN`, `COMMA`, `MINUS`, `PERIOD`, `SLASH`, `GRAVEACCENT`, `BRACKETLEFT`, `BACKSLASH`, `BRACKETRIGHT`, `QUOTE` |

### Modifier Flag Values

| Modifier | Value | Binary | Usage |
|----------|-------|--------|-------|
| Alt | 1 | 0001 | `modifiers=1` |
| Ctrl | 2 | 0010 | `modifiers=2` |
| Meta | 4 | 0100 | `modifiers=4` |
| Shift | 8 | 1000 | `modifiers=8` |
| Ctrl+Shift | 10 | 1010 | `modifiers=10` |
| Ctrl+Alt | 3 | 0011 | `modifiers=3` |
| Ctrl+Shift+Alt | 11 | 1011 | `modifiers=11` |

## Migration from WebElement Methods

Previous keyboard methods on `WebElement` are deprecated. Here's how to migrate:

### Old vs New

```python
from pydoll.constants import Key

# Old (deprecated)
element = await tab.find(id='input')
await element.key_down(Key.A, modifiers=2)
await element.key_up(Key.A)
await element.press_keyboard_key(Key.ENTER)

# New (recommended)
await tab.keyboard.down(Key.A, modifiers=2)
await tab.keyboard.up(Key.A)
await tab.keyboard.press(Key.ENTER)
```

!!! warning "Deprecation Notice"
    The following `WebElement` methods are deprecated:

    - `key_down()` → Use `tab.keyboard.down()`
    - `key_up()` → Use `tab.keyboard.up()`
    - `press_keyboard_key()` → Use `tab.keyboard.press()`
    
    These methods still work for backward compatibility but will show deprecation warnings.

### Why Migrate?

- **Centralized**: All keyboard operations in one place
- **Cleaner API**: Consistent interface for all keyboard actions
- **More powerful**: Hotkey support, smart modifier detection
- **Better typed**: Full IDE autocomplete support

## Learn More

For additional automation capabilities:

- **[Human Interactions](human-interactions.md)**: Realistic clicking, scrolling, and mouse movement
- **[Form Handling](form-handling.md)**: Complete form automation workflows
- **[File Operations](file-operations.md)**: File upload automation

The Keyboard API eliminates the complexity of keyboard automation, providing clean, reliable methods for everything from simple key presses to complex shortcuts and sequences.


================================================
FILE: docs/en/features/automation/mouse-control.md
================================================
# Mouse Control

The Mouse API provides complete control over mouse input at the page level, enabling you to simulate realistic cursor movement, clicks, double-clicks, and drag operations. When `humanize=True` is passed, mouse operations use humanized simulation: paths follow natural Bezier curves with Fitts's Law timing, minimum-jerk velocity profiles, physiological tremor, and overshoot correction, making automation virtually indistinguishable from human behavior.

!!! info "Centralized Mouse Interface"
    All mouse operations are accessible via `tab.mouse`, providing a clean, unified API for all mouse interactions.

## Quick Start

```python
from pydoll.browser.chromium import Chrome
from pydoll.protocol.input.types import MouseButton

async with Chrome() as browser:
    tab = await browser.start()
    await tab.go_to('https://example.com')

    # Move cursor to position
    await tab.mouse.move(500, 300)

    # Click at position
    await tab.mouse.click(500, 300)

    # Right-click
    await tab.mouse.click(500, 300, button=MouseButton.RIGHT)

    # Double-click
    await tab.mouse.double_click(500, 300)

    # Drag from one position to another
    await tab.mouse.drag(100, 200, 500, 400)
```

## Core Methods

### move: Move Cursor

Move the mouse cursor to a specific position on the page:

```python
# Default move (single CDP event, no simulation)
await tab.mouse.move(500, 300)

# Humanized move (curved path with natural timing)
await tab.mouse.move(500, 300, humanize=True)
```

**Parameters:**

- `x`: Target X coordinate (CSS pixels)
- `y`: Target Y coordinate (CSS pixels)
- `humanize` (keyword-only): Simulate human-like curved movement (default: `False`)

### click: Click at Position

Move to position and perform a mouse click:

```python
from pydoll.protocol.input.types import MouseButton

# Left click (default, instant)
await tab.mouse.click(500, 300)

# Right click
await tab.mouse.click(500, 300, button=MouseButton.RIGHT)

# Double click via click_count
await tab.mouse.click(500, 300, click_count=2)

# Humanized click with natural movement
await tab.mouse.click(500, 300, humanize=True)
```

**Parameters:**

- `x`: Target X coordinate
- `y`: Target Y coordinate
- `button` (keyword-only): Mouse button, one of `LEFT`, `RIGHT`, `MIDDLE` (default: `LEFT`)
- `click_count` (keyword-only): Number of clicks (default: `1`)
- `humanize` (keyword-only): Simulate human-like behavior (default: `False`)

### double_click: Double-Click at Position

Convenience method equivalent to `click(x, y, click_count=2)`:

```python
await tab.mouse.double_click(500, 300)
await tab.mouse.double_click(500, 300, humanize=True)
```

### down / up: Low-Level Button Control

Press or release mouse buttons independently:

```python
# Press left button at current position
await tab.mouse.down()

# Release left button
await tab.mouse.up()

# Right button
await tab.mouse.down(button=MouseButton.RIGHT)
await tab.mouse.up(button=MouseButton.RIGHT)
```

These are primitives that operate at the current cursor position and have no `humanize` parameter.

### drag: Drag and Drop

Move from start to end while holding the mouse button:

```python
# Default drag (instant)
await tab.mouse.drag(100, 200, 500, 400)

# Humanized drag with natural movement
await tab.mouse.drag(100, 200, 500, 400, humanize=True)
```

**Parameters:**

- `start_x`, `start_y`: Start coordinates
- `end_x`, `end_y`: End coordinates
- `humanize` (keyword-only): Simulate human-like drag (default: `False`)

## Enabling Humanization

All mouse methods default to `humanize=False`. To enable humanized simulation with natural Bezier curve paths and realistic timing, pass `humanize=True`:

```python
# Humanized move, natural curved path with Fitts's Law timing
await tab.mouse.move(500, 300, humanize=True)

# Humanized click: curved movement + pre-click pause + press + release
await tab.mouse.click(500, 300, humanize=True)

# Humanized drag, natural curves and pauses
await tab.mouse.drag(100, 200, 500, 400, humanize=True)
```

This is recommended when detection evasion is important, for example when interacting with sites that employ bot detection.

## Humanized Mode

When `humanize=True` is passed, the mouse module applies multiple layers of realism:

### Bezier Curve Paths

Mouse follows a natural curved trajectory instead of a straight line. Control points are randomly offset perpendicular to the start→end line, with asymmetric placement (more curvature early in the movement, like a real ballistic reach).

### Fitts's Law Timing

Movement duration follows Fitts's Law: `MT = a + b × log₂(D/W + 1)`. Longer distances take proportionally more time, matching human motor control behavior.

### Minimum-Jerk Velocity Profile

The cursor follows a bell-shaped speed profile, starting slow, accelerating to peak velocity in the middle, then decelerating at the end. This matches the smoothest possible human movement trajectory.

### Physiological Tremor

Small Gaussian noise (σ ≈ 1px) is added to each frame, simulating hand tremor. The tremor amplitude scales inversely with velocity, with more tremor when the cursor is slow or hovering and less during fast ballistic movements.

### Overshoot and Correction

On fast, long-distance movements, the cursor has a ~70% chance of overshooting the target by 3–12% of the distance, after which it makes a small corrective sub-movement back to the target. This matches real human motor control data.

### Pre-Click Pause

Humanized clicks include a pre-click pause (50–200ms) that simulates the natural settle time before pressing the button.

## Automatic Humanized Element Clicks

When you use `element.click(humanize=True)`, the Mouse API is used to produce a realistic Bezier curve movement from the current cursor position to the element center before clicking, making element clicks indistinguishable from human behavior.

```python
# Default click: raw CDP press/release
button = await tab.find(id='submit')
await button.click()

# With offset from center
await button.click(x_offset=10, y_offset=5)

# Humanized click: Bezier curve movement + click
await button.click(humanize=True)
```

Position tracking is maintained across element clicks. Clicking element A, then element B, produces a natural curved path from A's position to B.

## Custom Timing Configuration

All humanization parameters are configurable via `MouseTimingConfig`:

```python
from pydoll.interactions.mouse import MouseTimingConfig

config = MouseTimingConfig(
    fitts_a=0.070,              # Fitts's Law intercept (seconds)
    fitts_b=0.150,              # Fitts's Law slope (seconds/bit)
    frame_interval=0.012,       # Base interval between mouseMoved events
    curvature_min=0.10,         # Min path curvature as fraction of distance
    curvature_max=0.30,         # Max path curvature
    tremor_amplitude=1.0,       # Tremor sigma in pixels
    overshoot_probability=0.70, # Chance of overshoot on fast moves
    min_duration=0.08,          # Minimum movement duration
    max_duration=2.5,           # Maximum movement duration
)

# Apply to the tab's mouse instance
tab.mouse.timing = config
```

See the `MouseTimingConfig` dataclass for all available parameters.

## Position Tracking

The Mouse API tracks the cursor position across operations:

```python
# Initial position is (0, 0)
await tab.mouse.move(100, 200)
# Position is now (100, 200)

await tab.mouse.click(300, 400)
# Position is now (300, 400)

# Low-level methods use the tracked position
await tab.mouse.down()   # Presses at (300, 400)
await tab.mouse.up()     # Releases at (300, 400)
```

!!! note "Position State"
    The mouse position is tracked internally. `WebElement.click()` automatically uses `tab.mouse` when available, so position tracking is maintained across element clicks.

## Debug Mode

Enable debug mode to visualize mouse movement on the page. When active, colored dots are drawn on a transparent overlay canvas:

- **Blue dots**: cursor path during movement
- **Red dots**: click positions

```python
# Enable at runtime via property
tab.mouse.debug = True

# Now all movements draw colored dots
await tab.mouse.click(500, 300)

# Disable when done
tab.mouse.debug = False
```

This is useful for tuning timing parameters and verifying that paths look natural.

## Practical Examples

### Click a Button with Realistic Movement

```python
async def click_button_naturally(tab):
    # Pass humanize=True so element.click() moves the cursor along a natural path via tab.mouse
    button = await tab.find(id='submit')
    await button.click(humanize=True)
```

### Drag a Slider

```python
async def drag_slider(tab):
    slider = await tab.find(css_selector='.slider-handle')
    bounds = await slider.get_bounds_using_js()

    start_x = bounds['x'] + bounds['width'] / 2
    start_y = bounds['y'] + bounds['height'] / 2
    end_x = start_x + 200  # Drag 200px to the right

    await tab.mouse.drag(start_x, start_y, end_x, start_y)
```

### Hover Over Elements

```python
async def hover_menu(tab):
    menu = await tab.find(css_selector='.dropdown-trigger')
    bounds = await menu.get_bounds_using_js()

    await tab.mouse.move(
        bounds['x'] + bounds['width'] / 2,
        bounds['y'] + bounds['height'] / 2,
    )
    # Menu should now be visible via CSS :hover
```

## Learn More

- **[Human Interactions](human-interactions.md)**: Overview of all humanized interactions
- **[Keyboard Control](keyboard-control.md)**: Realistic keyboard simulation


================================================
FILE: docs/en/features/automation/screenshots-and-pdfs.md
================================================
# Screenshots and PDFs

Pydoll provides powerful screenshot and PDF generation capabilities through direct Chrome DevTools Protocol commands. Capture full pages, specific elements, or generate PDFs with fine-grained control.

## Screenshots

### Basic Page Screenshot

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def take_page_screenshot():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com')
        
        # Save screenshot to file
        await tab.take_screenshot('page.png', quality=100)

asyncio.run(take_page_screenshot())
```

### Supported Formats

Pydoll supports three image formats based on file extension:

```python
# PNG format (lossless, larger file size)
await tab.take_screenshot('screenshot.png', quality=100)

# JPEG format (lossy, smaller file size)
await tab.take_screenshot('screenshot.jpeg', quality=85)

# WebP format (modern, efficient)
await tab.take_screenshot('screenshot.webp', quality=90)
```

!!! info "Format Detection"
    The image format is automatically determined by the file extension. Using an unsupported extension raises `InvalidFileExtension`.
    
    Both `.jpg` and `.jpeg` are supported for JPEG format (`.jpg` is automatically normalized to `.jpeg` internally to match CDP requirements).

### Screenshot Parameters

| Parameter | Type | Default | Description |
|-----------|------|---------|-------------|
| `path` | `Optional[str]` | `None` | File path to save screenshot. Required if `as_base64=False`. |
| `quality` | `int` | `100` | Image quality (0-100). Higher values mean better quality and larger files. |
| `beyond_viewport` | `bool` | `False` | Capture entire scrollable page, not just visible area. |
| `as_base64` | `bool` | `False` | Return base64-encoded string instead of saving to file. |

### Full Page Screenshot

Capture content beyond the visible viewport:

```python
async def full_page_screenshot():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com/long-page')
        
        # Capture entire page including content below the fold
        await tab.take_screenshot(
            'full-page.png',
            beyond_viewport=True,
            quality=90
        )
```

!!! warning "Performance Note"
    Using `beyond_viewport=True` on very long pages can consume significant memory and take longer to process.

### Base64 Screenshot

Get screenshot as base64 string for embedding or sending via API:

```python
async def base64_screenshot():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com')
        
        # Get screenshot as base64 string
        screenshot_base64 = await tab.take_screenshot(
            as_base64=True
        )
        
        # Use in HTML img tag
        html = f'<img src="data:image/png;base64,{screenshot_base64}" />'
        
        # Or send via API
        import aiohttp
        async with aiohttp.ClientSession() as session:
            await session.post(
                'https://api.example.com/upload',
                json={'image': screenshot_base64}
            )
```

### Element Screenshot

Capture specific elements instead of the entire page:

```python
async def element_screenshot():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com')
        
        # Screenshot a specific element (PNG)
        header = await tab.find(tag_name='header')
        await header.take_screenshot('header.png', quality=100)
        
        # Screenshot a form (JPEG)
        form = await tab.find(id='login-form')
        await form.take_screenshot('login-form.jpeg', quality=85)
        
        # Screenshot a chart or graph (WebP)
        chart = await tab.find(class_name='data-visualization')
        await chart.take_screenshot('chart.webp', quality=90)
```

!!! info "Format Detection"
    The image format is automatically detected from the file extension (`.png`, `.jpeg`/`.jpg`, or `.webp`). Using an unsupported extension raises `InvalidFileExtension`.

!!! tip "Automatic Scrolling"
    When capturing element screenshots, Pydoll automatically scrolls the element into view before taking the screenshot.

### Element vs Page Screenshots

| Feature | `tab.take_screenshot()` | `element.take_screenshot()` |
|---------|------------------------|----------------------------|
| **Scope** | Entire viewport or page | Specific element only |
| **Format Support** | PNG, JPEG, WebP | PNG, JPEG, WebP |
| **Beyond Viewport** | ✅ Supported | ❌ Not applicable |
| **Base64 Output** | ✅ Supported | ✅ Supported |
| **Auto-Scroll** | ❌ Not applicable | ✅ Yes |
| **Use Case** | Full page captures | Component isolation, testing |


## PDF Generation

### Basic PDF Export

Convert pages to PDF with print-quality output:

```python
import asyncio
from pathlib import Path
from pydoll.browser.chromium import Chrome

async def generate_pdf():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com/document')
        
        # Generate PDF with Path
        await tab.print_to_pdf(Path('document.pdf'))
        
        # Or with string
        await tab.print_to_pdf('document.pdf')

asyncio.run(generate_pdf())
```

### PDF Parameters

| Parameter | Type | Default | Description |
|-----------|------|---------|-------------|
| `path` | `Optional[str \| Path]` | `None` | File path to save PDF. Required if `as_base64=False`. |
| `landscape` | `bool` | `False` | Use landscape orientation (vs portrait). |
| `display_header_footer` | `bool` | `False` | Include browser-generated header/footer with title, URL, page numbers. |
| `print_background` | `bool` | `True` | Include background graphics and colors. |
| `scale` | `float` | `1.0` | Page scale factor (0.1-2.0). Useful for zoom/shrink effects. |
| `as_base64` | `bool` | `False` | Return base64-encoded string instead of saving to file. |

!!! tip "Path vs String"
    While `Path` objects from `pathlib` are recommended as best practice for better path handling and cross-platform compatibility, you can also use plain strings if preferred.

### Advanced PDF Options

```python
import asyncio
from pathlib import Path
from pydoll.browser.chromium import Chrome

async def advanced_pdf():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com/report')
        
        # Landscape PDF with headers/footers
        await tab.print_to_pdf(
            Path('report-landscape.pdf'),
            landscape=True,
            display_header_footer=True,
            print_background=True,
            scale=0.9
        )
        
        # Portrait PDF without backgrounds (ink-friendly)
        await tab.print_to_pdf(
            Path('report-ink-friendly.pdf'),
            landscape=False,
            print_background=False,
            scale=1.0
        )

asyncio.run(advanced_pdf())
```

### PDF Scale Factor

Control the zoom level of PDF output:

```python
import asyncio
from pathlib import Path
from pydoll.browser.chromium import Chrome

async def scaled_pdfs():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com/content')
        
        # Shrink content to fit more on each page
        await tab.print_to_pdf(Path('compact.pdf'), scale=0.7)
        
        # Normal scale
        await tab.print_to_pdf(Path('normal.pdf'), scale=1.0)
        
        # Enlarge content (fewer pages)
        await tab.print_to_pdf(Path('large.pdf'), scale=1.5)

asyncio.run(scaled_pdfs())
```

!!! warning "Scale Limits"
    The `scale` parameter accepts values between `0.1` and `2.0`. Values outside this range may produce unexpected results.

### Base64 PDF

Generate PDF as base64 string for API transmission:

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def base64_pdf():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com/invoice')
        
        # Get PDF as base64 (no path needed)
        pdf_base64 = await tab.print_to_pdf(as_base64=True)
        
        # Send via API
        import aiohttp
        async with aiohttp.ClientSession() as session:
            await session.post(
                'https://api.example.com/invoices',
                json={'pdf': pdf_base64}
            )

asyncio.run(base64_pdf())
```


!!! info "CDP Reference"
    For complete CDP documentation on these commands, see:
    
    - [Page.captureScreenshot](https://chromedevtools.github.io/devtools-protocol/tot/Page/#method-captureScreenshot)
    - [Page.printToPDF](https://chromedevtools.github.io/devtools-protocol/tot/Page/#method-printToPDF)

### Error Handling

```python
from pydoll.exceptions import (
    InvalidFileExtension,
    MissingScreenshotPath,
    TopLevelTargetRequired
)

async def safe_screenshot():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com')
        
        try:
            # Missing path and as_base64=False
            await tab.take_screenshot()
        except MissingScreenshotPath:
            print("Error: Must provide path or set as_base64=True")
        
        try:
            # Invalid extension
            await tab.take_screenshot('image.bmp')
        except InvalidFileExtension as e:
            print(f"Error: {e}")
        
        # IFrame screenshot limitation
        iframe_element = await tab.find(tag_name='iframe')

        # This still won't work: top-level screenshots ignore iframe content
        # await tab.take_screenshot('frame.png')

        # Screenshot an element inside the iframe WebElement
        content = await iframe_element.find(id='content')
        await content.take_screenshot('iframe-content.png')
```

## Page Bundle Export

Save an entire page with all its assets (CSS, JS, images, fonts) as a `.zip` archive for offline viewing.

### Basic Usage

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def save_page():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com')

        # Save page with assets as separate files
        await tab.save_bundle('page.zip')

asyncio.run(save_page())
```

The resulting zip contains an `index.html` with all URLs rewritten to reference local files under an `assets/` directory.

### Inline Mode

Embed everything directly into a single `index.html` using data URIs, `<style>`, and `<script>` tags:

```python
# Single self-contained HTML file inside the zip
await tab.save_bundle('page-inline.zip', inline_assets=True)
```

### Parameters

| Parameter | Type | Default | Description |
|-----------|------|---------|-------------|
| `path` | `str \| Path` | *(required)* | Destination path. Must end with `.zip`. |
| `inline_assets` | `bool` | `False` | Embed all assets inline instead of saving as separate files. |

!!! info "What Gets Bundled"
    The bundle includes resources of type: Document, Stylesheet, Script, Image, Font, and Media. Resources that failed to load, were canceled, or use `data:` URIs are automatically skipped.

## Learn More

For additional context on how screenshots and PDFs integrate with Pydoll's architecture:

- **[Deep Dive: CDP](../../deep-dive/cdp.md)**: Understanding Chrome DevTools Protocol commands
- **[API Reference: Tab](../../api/browser/tab.md#take_screenshot)**: Complete method signatures and parameters
- **[API Reference: WebElement](../../api/elements/web_element.md#take_screenshot)**: Element-specific screenshot capabilities

Screenshots and PDFs are essential tools for automation, testing, and documentation. Pydoll's direct CDP integration provides professional-grade output with fine-grained control.


================================================
FILE: docs/en/features/browser-management/contexts.md
================================================
# Browser Contexts

Browser Contexts are Pydoll's solution for creating completely isolated browsing environments within a single browser process. Think of them as separate "incognito windows" but with full programmatic control: each context maintains its own cookies, storage, cache, and authentication state.

## Quick Start

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def basic_context_example():
    async with Chrome() as browser:
        # Start browser with initial tab in default context
        initial_tab = await browser.start()
        await initial_tab.go_to('https://example.com')
        
        # Create isolated context
        context_id = await browser.create_browser_context()
        
        # New tab in isolated context
        isolated_tab = await browser.new_tab('https://example.com', browser_context_id=context_id)
        
        # Both tabs are completely isolated - different cookies, storage, etc.
        await initial_tab.execute_script("localStorage.setItem('user', 'Alice')")
        await isolated_tab.execute_script("localStorage.setItem('user', 'Bob')")
        
        # Verify isolation
        user_default = await initial_tab.execute_script("return localStorage.getItem('user')")
        user_isolated = await isolated_tab.execute_script("return localStorage.getItem('user')")
        
        print(f"Default context: {user_default}")  # Alice
        print(f"Isolated context: {user_isolated}")  # Bob

asyncio.run(basic_context_example())
```

## What Are Browser Contexts?

A browser context is an isolated browsing environment within a single browser process. Each context maintains completely separate:

| Component | Description | Isolation Level |
|-----------|-------------|-----------------|
| **Cookies** | HTTP cookies and session data | ✓ Fully isolated |
| **Local Storage** | `localStorage` and `sessionStorage` | ✓ Fully isolated |
| **IndexedDB** | Client-side database | ✓ Fully isolated |
| **Cache** | HTTP cache and resources | ✓ Fully isolated |
| **Permissions** | Geolocation, notifications, camera, etc. | ✓ Fully isolated |
| **Authentication** | Login sessions and auth tokens | ✓ Fully isolated |
| **Service Workers** | Background scripts | ✓ Fully isolated |

```mermaid
graph LR
    Browser[Browser Process] --> Default[Default Context]
    Browser --> Context1[Context 1]
    Browser --> Context2[Context 2]
    
    Default --> T1[Tab A]
    Default --> T2[Tab B]
    Context1 --> T3[Tab C]
    Context2 --> T4[Tab D]
```

## Why Use Browser Contexts?

### 1. Multi-Account Testing

Test different user accounts simultaneously without interference:

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def perform_login(tab, email, password):
    """
    Helper function to navigate to the login page
    and submit account credentials.
    """
    print(f"Attempting login with: {email}...")
    await tab.go_to('https://app.example.com/login')

    # Find elements
    email_field = await tab.find(id='email')
    password_field = await tab.find(id='password')
    login_btn = await tab.find(id='login-btn')

    # Fill credentials and click
    await email_field.type_text(email)
    await password_field.type_text(password)
    await login_btn.click()

    # Wait for login to process
    await asyncio.sleep(2)
    print(f"Login successful for {email}.")


async def multi_account_test():
    """
    Log several accounts in side by side, each in its own browser
    context, then verify every session and tear the contexts down.
    """
    accounts = [
        {"email": "user1@example.com", "password": "pass1"},
        {"email": "user2@example.com", "password": "pass2"},
        {"email": "admin@example.com", "password": "admin_pass"}
    ]

    # One record per logged-in account: its email, tab and context ID.
    user_sessions = []

    async with Chrome() as browser:
        for position, account in enumerate(accounts):
            if position == 0:
                # The first account reuses the tab the browser starts with.
                # It lives in the default context, recorded here as None.
                context_id = None
                account_tab = await browser.start()
            else:
                # Every other account gets a fresh, isolated context.
                context_id = await browser.create_browser_context()
                account_tab = await browser.new_tab(browser_context_id=context_id)

            await perform_login(account_tab, account['email'], account['password'])
            user_sessions.append({
                "email": account['email'],
                "tab": account_tab,
                "context_id": context_id
            })

        print("\n--- Verifying all active sessions ---")
        for session in user_sessions:
            tab, email = session["tab"], session["email"]
            await tab.go_to('https://app.example.com/dashboard')
            username = await tab.find(class_name='username')
            username_text = await username.text
            print(f"[Account: {email}] -> Logged in as: {username_text}")
            await asyncio.sleep(0.5)

        print("\n--- Cleaning up contexts ---")
        for session in user_sessions:
            if session["context_id"] is None:
                # Default context: not ours to delete. It goes away when
                # 'async with Chrome() as browser' exits.
                continue
            print(f"Closing context for: {session['email']}")
            await session["tab"].close()
            await browser.delete_browser_context(session["context_id"])

asyncio.run(multi_account_test())
```

### 2. Geo-Location Testing with Context-Specific Proxies

Each context can have its own proxy configuration:

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def geo_location_testing():
    """Print the public IP seen without a proxy and through two per-context proxies."""
    ip_echo_url = 'https://api.ipify.org'
    read_body_script = 'return document.body.textContent'

    async with Chrome() as browser:
        # Baseline: the initial tab lives in the default context (no proxy)
        direct_tab = await browser.start()
        await direct_tab.go_to(ip_echo_url)
        await asyncio.sleep(2)
        default_ip = await direct_tab.execute_script(read_body_script)
        print(f"Default IP (no proxy): {default_ip}")

        # Context routed through the US proxy
        us_context = await browser.create_browser_context(
            proxy_server='http://us-proxy.example.com:8080'
        )
        us_tab = await browser.new_tab(ip_echo_url, browser_context_id=us_context)
        await asyncio.sleep(2)
        us_ip = await us_tab.execute_script(read_body_script)
        print(f"US IP: {us_ip}")

        # Context routed through the EU proxy
        eu_context = await browser.create_browser_context(
            proxy_server='http://eu-proxy.example.com:8080'
        )
        eu_tab = await browser.new_tab(ip_echo_url, browser_context_id=eu_context)
        await asyncio.sleep(2)
        eu_ip = await eu_tab.execute_script(read_body_script)
        print(f"EU IP: {eu_ip}")

        # Tear down only what was created here: tabs first, then contexts.
        # The initial tab is left alone.
        for proxied_tab in (us_tab, eu_tab):
            await proxied_tab.close()
        for proxied_context in (us_context, eu_context):
            await browser.delete_browser_context(proxied_context)

asyncio.run(geo_location_testing())
```

!!! tip "Proxy Authentication"
    Pydoll handles proxy authentication automatically for contexts. Just include credentials in the URL:
    ```python
    context_id = await browser.create_browser_context(
        proxy_server='http://username:password@proxy.example.com:8080'
    )
    ```
    The credentials are sanitized from CDP commands and only used when the browser challenges for auth.

### 3. A/B Testing

Compare different user experiences in parallel:

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def ab_testing():
    """Run a control and a treatment variant side by side in separate contexts."""
    home_url = 'https://example.com'
    feature_url = 'https://example.com/feature'

    async with Chrome() as browser:
        # Control group: the initial tab, in the default context
        control_tab = await browser.start()
        await control_tab.go_to(home_url)
        await control_tab.execute_script("localStorage.setItem('experiment', 'control')")

        # Treatment group: its own isolated context
        treatment_context = await browser.create_browser_context()
        treatment_tab = await browser.new_tab(home_url, browser_context_id=treatment_context)
        await treatment_tab.execute_script("localStorage.setItem('experiment', 'treatment')")

        # Send both groups to the page under test
        await control_tab.go_to(feature_url)
        await treatment_tab.go_to(feature_url)

        # Read the outcome each group sees
        result_a = await control_tab.find(class_name='experiment-result')
        result_b = await treatment_tab.find(class_name='experiment-result')

        print(f"Control group result: {await result_a.text}")
        print(f"Treatment group result: {await result_b.text}")

        # Only the treatment context was created here, so only it is removed
        await treatment_tab.close()
        await browser.delete_browser_context(treatment_context)

asyncio.run(ab_testing())
```

### 4. Parallel Web Scraping

Scrape multiple sites with different configurations:

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def parallel_scraping():
    """Scrape up to five titles from several sites concurrently, one context per site."""
    websites = [
        {'url': 'https://news.ycombinator.com', 'selector': '.storylink'},
        {'url': 'https://reddit.com/r/python', 'selector': '.title'},
        {'url': 'https://github.com/trending', 'selector': '.h3'},
    ]

    async with Chrome() as browser:
        initial_tab = await browser.start()

        # contexts[i] and tabs[i] serve websites[i]. Slot 0 is the default
        # context (None) together with the browser's initial tab.
        contexts = [None]
        for _ in websites[1:]:
            contexts.append(await browser.create_browser_context())

        tabs = [initial_tab]
        for ctx in contexts[1:]:
            tabs.append(await browser.new_tab(browser_context_id=ctx))

        async def scrape_site(tab, site, context_id):
            """Load one site in `tab` and return its URL with up to five titles."""
            try:
                await tab.go_to(site['url'])
                await asyncio.sleep(3)

                # Collect the text of the first five elements matching the selector
                elements = await tab.query(site['selector'], find_all=True)
                titles = []
                for elem in elements[:5]:
                    titles.append(await elem.text)

                return {'url': site['url'], 'titles': titles}
            finally:
                # The default context (None) and its initial tab are left alone
                if context_id is not None:
                    await tab.close()
                    await browser.delete_browser_context(context_id)

        # Launch every scrape at once and wait for all of them
        jobs = [
            scrape_site(tab, site, ctx) for tab, site, ctx in zip(tabs, websites, contexts)
        ]
        results = await asyncio.gather(*jobs)

        # Report what each site returned
        for result in results:
            print(f"\n{result['url']}:")
            for i, title in enumerate(result['titles'], 1):
                print(f"  {i}. {title}")

asyncio.run(parallel_scraping())
```

## Understanding Context Performance

### Contexts Are Lightweight

!!! info "Performance Characteristics"
    Creating a browser context is **significantly faster and lighter** than launching a new browser process:
    
    - **Context creation**: ~50-100ms, minimal memory overhead
    - **New browser process**: ~2-5 seconds, 50-150 MB base memory
    
    For 10 isolated environments:

    - **10 contexts in 1 browser**: ~500ms startup, ~500 MB total
    - **10 separate browsers**: ~30 seconds startup, ~1-1.5 GB total

```python
import asyncio
import time
from pydoll.browser.chromium import Chrome

async def benchmark_contexts_vs_browsers():
    """
    Time how long it takes to create 10 browser contexts.

    The clock starts only after the browser is running, so the reported
    figure covers context creation alone and not browser startup.
    """
    async with Chrome() as browser:
        # Launch first (initial tab not used) so startup is not measured
        await browser.start()

        # perf_counter is a monotonic clock intended for measuring intervals
        start = time.perf_counter()
        contexts = [await browser.create_browser_context() for _ in range(10)]
        elapsed = time.perf_counter() - start

        print(f"10 contexts created in: {elapsed:.2f}s")

        # Cleanup
        for context_id in contexts:
            await browser.delete_browser_context(context_id)

asyncio.run(benchmark_contexts_vs_browsers())
```

### Headless vs Headed: The Window Behavior

!!! warning "Important: Context Windows in Headed Mode"
    When running in **headed mode** (visible browser UI), there's an important behavior to understand:
    
    **The first tab created in a new context will open a new OS window.**
    
    - This happens because the context needs a "host window" to render its first page
    - Subsequent tabs in that context can open as tabs within that window
    - This is a CDP/Chromium limitation, not a Pydoll design choice
    
    **In headless mode**, this doesn't matter—no windows are created, everything runs in the background.

```python
import asyncio
from pydoll.browser.chromium import Chrome
from pydoll.browser.options import ChromiumOptions

async def demonstrate_window_behavior():
    """Open tabs in the default and a custom context with a visible browser UI."""
    # Headed mode, so the windows can be watched
    visible_options = ChromiumOptions()
    visible_options.headless = False

    async with Chrome(options=visible_options) as browser:
        # The initial tab sits in the default context's window
        default_tab = await browser.start()
        await default_tab.go_to('https://example.com')

        # First tab of a new context: expected to appear in a NEW window
        context = await browser.create_browser_context()
        first_context_tab = await browser.new_tab(
            'https://github.com', browser_context_id=context
        )

        # Second tab of the same context: expected to join that window as a tab
        second_context_tab = await browser.new_tab(
            'https://google.com', browser_context_id=context
        )

        # Leave time to observe the windows
        await asyncio.sleep(10)

        for context_tab in (first_context_tab, second_context_tab):
            await context_tab.close()
        await browser.delete_browser_context(context)

# Headless mode - no windows, contexts are invisible but still isolated
async def headless_contexts():
    """Create four extra contexts in a headless browser, one tab each, then remove them."""
    options = ChromiumOptions()
    options.headless = True  # Nothing is shown on screen

    async with Chrome(options=options) as browser:
        # The initial tab belongs to the default context
        default_tab = await browser.start()
        await default_tab.go_to('https://example.com/page0')

        # Four more contexts, each paired with the single tab opened in it
        contexts = []
        for i in range(1, 5):
            new_context = await browser.create_browser_context()
            new_context_tab = await browser.new_tab(
                f'https://example.com/page{i}', browser_context_id=new_context
            )
            contexts.append((new_context, new_context_tab))

        print(f"Created {len(contexts) + 1} isolated contexts (1 default + {len(contexts)} custom, invisible)")

        # Close each tab before deleting the context that owns it
        for owned_context, owned_tab in contexts:
            await owned_tab.close()
            await browser.delete_browser_context(owned_context)

asyncio.run(headless_contexts())
```

!!! tip "Best Practice: Use Headless for Contexts"
    For maximum efficiency with multiple contexts:
    
    - **Development/Debugging**: Use headed mode to see what's happening
    - **Production/CI/CD**: Use headless mode for faster, lighter execution
    - **Multiple contexts**: Strongly prefer headless to avoid window management complexity

## Context Management

### Creating Contexts

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def create_context_example():
    """Create a plain context, a proxied context and an authenticated-proxy context."""
    async with Chrome() as browser:
        await browser.start()

        # 1. No arguments: a plain isolated context
        context_id = await browser.create_browser_context()
        print(f"Created context: {context_id}")

        # 2. Traffic goes through a proxy, except for the bypass list
        proxy_settings = {
            'proxy_server': 'http://proxy.example.com:8080',
            'proxy_bypass_list': 'localhost,127.0.0.1',
        }
        proxied_context = await browser.create_browser_context(**proxy_settings)
        print(f"Created proxied context: {proxied_context}")

        # 3. Proxy credentials embedded in the proxy URL
        authenticated_proxy = 'http://user:pass@proxy.example.com:8080'
        auth_context = await browser.create_browser_context(
            proxy_server=authenticated_proxy
        )
        print(f"Created auth context: {auth_context}")

asyncio.run(create_context_example())
```

### Listing Contexts

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def list_contexts():
    """Print the browser's context list before and after creating two contexts."""
    async with Chrome() as browser:
        await browser.start()

        # Snapshot before anything is created.
        # NOTE(review): whether the default context appears in this list
        # depends on what the browser reports; confirm before relying on it.
        contexts = await browser.get_browser_contexts()
        print(f"Initial contexts: {len(contexts)}")

        # Add two contexts of our own
        created = []
        for _ in range(2):
            created.append(await browser.create_browser_context())

        # Snapshot again: the list should have grown by the two new contexts
        contexts = await browser.get_browser_contexts()
        print(f"After creating 2 new contexts: {len(contexts)}")

        for i, context_id in enumerate(contexts):
            print(f"  Context {i+1}: {context_id}")

        # Remove only the contexts created above
        for created_context in created:
            await browser.delete_browser_context(created_context)

asyncio.run(list_contexts())
```

### Deleting Contexts

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def delete_context_example():
    """Open two tabs in a new context, then delete the context without closing them first."""
    async with Chrome() as browser:
        await browser.start()

        # A new context holding two tabs
        context_id = await browser.create_browser_context()
        for url in ('https://example.com', 'https://github.com'):
            await browser.new_tab(url, browser_context_id=context_id)

        print(f"Created context {context_id} with 2 tabs")

        # The tabs are deliberately left open: deleting the context is
        # expected to close them along with it
        await browser.delete_browser_context(context_id)
        print("Context deleted (all tabs closed automatically)")

asyncio.run(delete_context_example())
```

!!! warning "Deleting Contexts Closes All Tabs"
    When you delete a browser context, **all tabs belonging to that context are automatically closed**. This is an efficient way to clean up multiple tabs at once, but make sure you've saved any important data first.

## Default Context

Every browser starts with a **default context** that contains the initial tab:

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def default_context_example():
    """Show that localStorage written in the default context is not seen in a custom one."""
    read_type = "return localStorage.getItem('type')"

    async with Chrome() as browser:
        # Starting the browser yields the initial tab (default context);
        # this example does not use it further
        await browser.start()

        # No browser_context_id given, so this tab uses the default context
        default_tab = await browser.new_tab('https://example.com')

        # A tab in a freshly created custom context
        custom_context = await browser.create_browser_context()
        custom_tab = await browser.new_tab('https://github.com', browser_context_id=custom_context)

        # Write a different marker under the same key in each context
        await default_tab.execute_script("localStorage.setItem('type', 'default')")
        await custom_tab.execute_script("localStorage.setItem('type', 'custom')")

        # Read the markers back: each tab should see only its own value
        default_type = await default_tab.execute_script(read_type)
        custom_type = await custom_tab.execute_script(read_type)

        print(f"Default context: {default_type}")  # 'default'
        print(f"Custom context: {custom_type}")    # 'custom'

        # Only the custom context is deleted here
        await browser.delete_browser_context(custom_context)

asyncio.run(default_context_example())
```

!!! info "You Cannot Delete the Default Context"
    The default browser context is permanent and cannot be deleted. It exists for the entire browser session. Only custom contexts created with `create_browser_context()` can be deleted.

## Advanced Patterns

### Context Pool for Reusable Isolation

```python
import asyncio
from pydoll.browser.chromium import Chrome

class ContextPool:
    """
    Fixed-size pool of browser contexts that callers borrow and return.

    `acquire()` waits until a context is free instead of failing when the
    pool is exhausted, so more concurrent jobs than contexts can share it.
    """

    def __init__(self, browser, size=5):
        self.browser = browser
        self.size = size
        self.contexts = []   # every context ID owned by the pool
        self.in_use = set()  # context IDs currently checked out
        # Queue of idle context IDs. Built in initialize() so that it is
        # created while the event loop that will use it is running.
        self._idle = None

    async def initialize(self):
        """Create the pool's contexts and mark them all as idle."""
        if self._idle is None:
            self._idle = asyncio.Queue()
        for _ in range(self.size):
            context_id = await self.browser.create_browser_context()
            self.contexts.append(context_id)
            self._idle.put_nowait(context_id)
        print(f"Context pool initialized with {self.size} contexts")

    async def acquire(self):
        """
        Borrow a context, waiting until one is released if all are busy.

        Raises:
            RuntimeError: if the pool owns no contexts at all (it was never
                initialized, or was already cleaned up). Waiting would
                never finish in that case.
        """
        if not self.contexts or self._idle is None:
            raise RuntimeError("No available contexts in pool")
        context_id = await self._idle.get()
        self.in_use.add(context_id)
        return context_id

    def release(self, context_id):
        """Return a borrowed context to the pool; unknown IDs are ignored."""
        # Only hand back IDs that are really checked out. A double release
        # would otherwise queue the same context twice.
        if context_id in self.in_use:
            self.in_use.remove(context_id)
            self._idle.put_nowait(context_id)

    async def cleanup(self):
        """Delete every context owned by the pool and reset its state."""
        for context_id in self.contexts:
            await self.browser.delete_browser_context(context_id)
        # Forget the deleted IDs so they cannot be handed out again
        self.contexts.clear()
        self.in_use.clear()
        self._idle = None

async def use_context_pool():
    """Fetch the titles of ten pages using a pool of three browser contexts."""
    async with Chrome() as browser:
        await browser.start()

        # Create pool
        pool = ContextPool(browser, size=3)
        await pool.initialize()

        async def scrape_with_pool(url):
            """Open `url` in a pooled context and return the page title."""
            context_id = await pool.acquire()
            try:
                tab = await browser.new_tab(url, browser_context_id=context_id)
                try:
                    await asyncio.sleep(2)
                    return await tab.execute_script('return document.title')
                finally:
                    # Close the tab even if the script fails: the context
                    # is reused, so a leaked tab would pile up in it
                    await tab.close()
            finally:
                # Always hand the context back, whatever happened above
                pool.release(context_id)

        # Scrape multiple URLs using the pool
        urls = [f'https://example.com/page{i}' for i in range(10)]
        results = await asyncio.gather(*[scrape_with_pool(url) for url in urls])

        # gather() returns results in the same order as the URLs
        for url, title in zip(urls, results):
            print(f"{url}: {title}")

        # Cleanup
        await pool.cleanup()

asyncio.run(use_context_pool())
```

### Per-Context Configuration Manager

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def context_config_manager():
    """Create one browser context per named profile and load a test page in each."""
    # Profiles to emulate: an optional proxy plus a user-agent string
    configs = {
        'us_user': {
            'proxy': 'http://us-proxy.example.com:8080',
            'user_agent': 'Mozilla/5.0 (Windows NT 10.0; Win64; x64)'
        },
        'eu_user': {
            'proxy': 'http://eu-proxy.example.com:8080',
            'user_agent': 'Mozilla/5.0 (X11; Linux x86_64)'
        },
        'mobile_user': {
            'proxy': None,
            'user_agent': 'Mozilla/5.0 (iPhone; CPU iPhone OS 14_0 like Mac OS X)'
        }
    }

    async with Chrome() as browser:
        await browser.start()

        # Profile name -> the context and tab created for it
        contexts = {}

        for name, config in configs.items():
            # Pass proxy_server only when the profile defines a proxy
            context_options = {}
            if config['proxy']:
                context_options['proxy_server'] = config['proxy']
            context_id = await browser.create_browser_context(**context_options)

            tab = await browser.new_tab(browser_context_id=context_id)
            # Note: the profile's user_agent is NOT applied here. It would
            # be set via CDP or options; this example is simplified.

            contexts[name] = {'context_id': context_id, 'tab': tab}

        # Load the same page once per profile
        for name, data in contexts.items():
            await data['tab'].go_to('https://httpbin.org/headers')
            await asyncio.sleep(2)
            print(f"\n{name} configuration active")

        # Close each tab, then delete the context that owned it
        for data in contexts.values():
            await data['tab'].close()
            await browser.delete_browser_context(data['context_id'])

asyncio.run(context_config_manager())
```

## Best Practices

1. **Use headless mode for multiple contexts** to avoid window management complexity
2. **Always delete contexts when done** to prevent memory leaks
3. **Group related operations in the same context** for better organization
4. **Prefer contexts over multiple browser processes** for better performance
5. **Use context pools** for scenarios requiring many short-lived isolated environments
6. **Close tabs before deleting contexts** for a tidier, more explicit teardown (though not strictly required)

## See Also

- **[Multi-Tab Management](tabs.md)** - Managing multiple tabs within contexts
- **[Deep Dive: Browser Domain](../../deep-dive/browser-domain.md)** - Architectural details on contexts
- **[Network: HTTP Requests](../network/http-requests.md)** - Browser-context requests inherit context state
- **[Core Concepts](../core-concepts.md)** - Understanding Pydoll's architecture

Browser Contexts are one of Pydoll's most powerful features for creating sophisticated automation workflows. By understanding how they work—especially the window behavior in headed mode and their lightweight nature—you can build efficient, scalable automation that handles complex multi-environment scenarios with ease.


================================================
FILE: docs/en/features/browser-management/cookies-sessions.md
================================================
# Cookies & Sessions

Managing cookies and sessions effectively is crucial for realistic browser automation. Websites use cookies to track authentication, preferences, and user behavior, and they expect browsers to behave accordingly.

## Why Cookies Matter for Automation

Cookies are more than just stored data; they're a fingerprint of browser activity:

- **Authentication**: Session cookies maintain login state across requests
- **Tracking Prevention**: Anti-bot systems analyze cookie patterns
- **Realistic Behavior**: A browser without cookies looks suspicious
- **Session Persistence**: Reusing cookies can save time on repeated logins

!!! warning "The Cookie Paradox"
    - **Too clean**: A browser with no cookies or history appears bot-like
    - **Too stale**: Using the same session for weeks triggers security alerts
    - **Sweet spot**: Fresh cookies with occasional rotation and realistic activity patterns

## Quick Start

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def basic_cookie_management():
    """Set one cookie, count the stored cookies, then delete them all."""
    # A cookie is described with a plain dict
    session_cookie = {
        'name': 'session_id',
        'value': 'abc123xyz',
        'domain': 'example.com',
        'path': '/',
        'secure': True,
        'httpOnly': True
    }

    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com')

        # set_cookies takes a list, even for a single cookie
        await tab.set_cookies([session_cookie])

        # Read back everything currently stored
        all_cookies = await browser.get_cookies()
        print(f"Total cookies: {len(all_cookies)}")

        # Remove every cookie again
        await tab.delete_all_cookies()

asyncio.run(basic_cookie_management())
```

## Understanding Cookie Types

!!! info "TypedDict: Use Regular Dicts in Practice"
    Throughout this documentation, you'll see references to `CookieParam` and `Cookie`. These are **TypedDict** types: they're just regular Python dicts with type hints for IDE autocomplete and type checking.
    
    **In practice, you use regular dicts:**
    ```python
    # This is what you actually write:
    cookie = {'name': 'session', 'value': 'abc123', 'domain': 'example.com'}
    
    # The type annotation is just for your IDE:
    from pydoll.protocol.network.types import CookieParam
    cookie: CookieParam = {'name': 'session', 'value': 'abc123'}
    ```
    
    All examples below use plain dicts for simplicity.

### Cookie Structure

The `Cookie` type (retrieved from browser) contains full cookie information:

```python
{
    "name": str,           # Cookie name
    "value": str,          # Cookie value
    "domain": str,         # Domain where cookie is valid
    "path": str,           # Path where cookie is valid
    "expires": float,      # Unix timestamp (-1 = session cookie)
    "size": int,           # Size in bytes
    "httpOnly": bool,      # Accessible only via HTTP (not JavaScript)
    "secure": bool,        # Sent only over HTTPS
    "session": bool,       # True if expires when browser closes
    "sameSite": str,       # "Strict", "Lax", or "None"
    "priority": str,       # "Low", "Medium", or "High"
    "sourceScheme": str,   # "Unset", "NonSecure", or "Secure"
    "sourcePort": int,     # Port where cookie was set
}
```

### CookieParam Structure

When **setting** cookies, use a dict (only `name` and `value` are required):

```python
# Simple cookie with just required fields
cookie = {
    'name': 'user_token',
    'value': 'token_value'
}

# Full cookie with all optional fields
cookie = {
    'name': 'user_token',       # Required
    'value': 'token_value',     # Required
    'domain': 'example.com',    # Optional: defaults to current page domain
    'path': '/',                # Optional: defaults to /
    'secure': True,             # Optional: HTTPS only
    'httpOnly': True,           # Optional: no JS access
    'sameSite': 'Lax',          # Optional: 'Strict', 'Lax', or 'None'
    'expires': 1735689600,      # Optional: Unix timestamp
    'priority': 'High',         # Optional: 'Low', 'Medium', or 'High'
}
```

!!! info "Optional Fields Default Behavior"
    When you omit optional fields:
    
    - `domain`: Uses the domain of the current page
    - `path`: Defaults to `/`
    - `secure`: Defaults to `False`
    - `httpOnly`: Defaults to `False`
    - `sameSite`: Browser's default (usually `Lax`)
    - `expires`: Session cookie (deleted when browser closes)

## Cookie Management Operations

### Setting Cookies

#### Set Multiple Cookies at Once

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def set_multiple_cookies():
    """Set three example cookies for example.com in a single call."""
    # Imported locally so the function stays self-contained
    import time

    # Compute the expiry relative to "now". A fixed timestamp eventually
    # falls into the past, and an already-expired cookie is not stored.
    thirty_days = 30 * 24 * 60 * 60
    expires_at = int(time.time()) + thirty_days

    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com')

        cookies = [
            {
                'name': 'session_id',
                'value': 'xyz789',
                'domain': 'example.com',
                'secure': True,
                'httpOnly': True,
                'sameSite': 'Strict'
            },
            {
                'name': 'preferences',
                'value': 'dark_mode=true',
                'domain': 'example.com',
                'path': '/settings'
            },
            {
                'name': 'analytics',
                'value': 'tracking_id_12345',
                'domain': 'example.com',
                'expires': expires_at  # Unix timestamp: 30 days from now
            }
        ]

        await tab.set_cookies(cookies)
        print(f"Set {len(cookies)} cookies")

asyncio.run(set_multiple_cookies())
```

#### Set Cookies in Specific Context

```python
# Set cookies in a specific browser context
context_id = await browser.create_browser_context()
await browser.set_cookies(cookies, browser_context_id=context_id)
```

!!! tip "Tab vs Browser Methods for Setting Cookies"
    - `tab.set_cookies(cookies)`: Sets cookies in the tab's browser context (convenient shortcut)
    - `browser.set_cookies(cookies, browser_context_id=...)`: Sets cookies with explicit context control
    
    Both methods add cookies to the **entire context**, not just the current page. The cookies will be available to all tabs in that context.

### Retrieving Cookies

#### Get All Cookies (Context-Wide)

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def get_cookies_example():
    """Load a page, then list the cookies stored in the tab's context."""
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://github.com')

        # Give the page time to set its cookies
        await asyncio.sleep(2)

        # Read through the tab: a shortcut for the tab's own context.
        # Alternative with explicit context control, equivalent here
        # because the tab is in the default context:
        #     cookies = await browser.get_cookies()
        cookies = await tab.get_cookies()

        print(f"Found {len(cookies)} cookies:")
        for cookie in cookies:
            # Values are cut to 20 characters to keep the listing short
            print(f"  - {cookie['name']}: {cookie['value'][:20]}...")
            print(f"    Domain: {cookie['domain']}, Secure: {cookie['secure']}")

asyncio.run(get_cookies_example())
```

!!! tip "Tab vs Browser Methods"
    - `tab.get_cookies()`: Returns cookies from the tab's browser context (convenient shortcut)
    - `browser.get_cookies()`: Returns cookies from the default context (or specify `browser_context_id`)
    
    Both methods return **all cookies** from the context, not just cookies for the current page domain.

!!! warning "Incognito Mode Limitation"
    `browser.get_cookies()` does **not work** with native incognito mode (`--incognito` flag). This is a Chrome DevTools Protocol limitation where `Storage.getCookies` cannot access cookies in native incognito mode.
    
    **Workaround:** Use `tab.get_cookies()` instead, which uses `Network.getCookies` and works correctly in incognito mode.

#### Get Cookies from Specific Context

```python
# Get cookies from specific browser context
context_id = await browser.create_browser_context()
cookies = await browser.get_cookies(browser_context_id=context_id)
```

### Deleting Cookies

#### Delete All Cookies

```python
# Delete all cookies from current tab's context
await tab.delete_all_cookies()

# Delete all cookies from specific context
await browser.delete_all_cookies(browser_context_id=context_id)
```

!!! warning "Cookies Are Deleted Immediately"
    When you delete cookies, they're removed from the browser immediately. The website may not detect this until the next request or page reload.

## Practical Use Cases

### 1. Persistent Login Sessions

Reuse authentication cookies across script runs:

```python
import asyncio
import json
from pathlib import Path
from pydoll.browser.chromium import Chrome

COOKIE_FILE = Path('cookies.json')

async def save_cookies_after_login():
    """Sign in through the login form and write the browser's cookies to COOKIE_FILE."""
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com/login')

        # Fill in the credentials (simplified login flow)
        email_field = await tab.find(id='email')
        password_field = await tab.find(id='password')
        await email_field.type_text('user@example.com')
        await password_field.type_text('secret')

        # Submit and wait for the login to go through
        submit_button = await tab.find(id='login')
        await submit_button.click()
        await asyncio.sleep(3)

        # Persist the cookies as indented JSON
        cookies = await browser.get_cookies()
        serialized = json.dumps(cookies, indent=2)
        COOKIE_FILE.write_text(serialized)
        print(f"Saved {len(cookies)} cookies to {COOKIE_FILE}")

async def reuse_saved_cookies():
    """Load saved cookies to skip login."""
    if not COOKIE_FILE.exists():
        print("No saved cookies found. Run save_cookies_after_login() first.")
        return
    
    # Load cookies from file
    saved_cookies = json.loads(COOKIE_FILE.read_text())
    
    # Convert to simplified format (only required fields)
    # Note: get_cookies() returns detailed Cookie objects with read-only fields
    # (size, session, sourceScheme, etc.). set_cookies() expects CookieParam
    # format with only the settable fields.
    cookies_to_set = [
        {
            'name': c['name'],
            'value': c['value'],
            'domain': c['domain'],
            'path': c.get('path', '/'),
            'secure': c.get('secure', False),
            'httpOnly': c.get('httpOnly', False)
        }
        for c in saved_cookies
    ]
    
    async with Chrome() as browser:
        tab = await browser.start()
        
        # Set cookies before navigating
        await tab.set_cookies(cookies_to_set)
        print(f"Loaded {len(cookies_to_set)} cookies from file")
        
        # Navigate - should be logged in already
        await tab.go_to('https://example.com/dashboard')
        await asyncio.sleep(2)
        
        # Verify login
        try:
            username = await tab.find(class_name='username')
            print(f"Logged in as: {await username.text}")
        except Exception:
            print("Login failed - cookies may have expired")

# First run: log in and save cookies
# asyncio.run(save_cookies_after_login())

# Subsequent runs: reuse cookies
asyncio.run(reuse_saved_cookies())
```

!!! note "Cookie Reformatting Required"
    `get_cookies()` returns **detailed `Cookie` objects** with read-only attributes like `size`, `session`, `sourceScheme`, and `sourcePort`. When using `set_cookies()`, you must provide **`CookieParam` format** containing only the settable fields (`name`, `value`, `domain`, `path`, `secure`, `httpOnly`, `sameSite`, `expires`, `priority`).
    
    The reformatting step in the example above is **essential**. Passing raw `Cookie` objects to `set_cookies()` may cause errors or unexpected behavior.

!!! tip "Cookie Expiration"
    Always check if saved cookies have expired. Session cookies (`session=True`) expire when the browser closes, while persistent cookies have an `expires` timestamp you can validate.

### 2. Multi-Account Testing with Isolated Cookies

Each browser context maintains separate cookies:

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def test_multiple_accounts():
    accounts = [
        {'email': 'user1@example.com', 'cookie_value': 'session_user1'},
        {'email': 'user2@example.com', 'cookie_value': 'session_user2'},
    ]
    
    async with Chrome() as browser:
        initial_tab = await browser.start()
        
        # First account in default context
        cookies_user1 = [{
            'name': 'session',
            'value': accounts[0]['cookie_value'],
            'domain': 'example.com',
            'secure': True,
            'httpOnly': True
        }]
        await initial_tab.set_cookies(cookies_user1)
        await initial_tab.go_to('https://example.com/dashboard')
        
        # Second account in isolated context
        context2 = await browser.create_browser_context()
        tab2 = await browser.new_tab(browser_context_id=context2)
        
        cookies_user2 = [{
            'name': 'session',
            'value': accounts[1]['cookie_value'],
            'domain': 'example.com',
            'secure': True,
            'httpOnly': True
        }]
        await browser.set_cookies(cookies_user2, browser_context_id=context2)
        await tab2.go_to('https://example.com/dashboard')
        
        # Both users are logged in simultaneously with different sessions
        print("User 1 and User 2 logged in with isolated cookies")
        
        await asyncio.sleep(5)
        
        # Cleanup
        await tab2.close()
        await browser.delete_browser_context(context2)

asyncio.run(test_multiple_accounts())
```

### 3. Cookie Rotation for Long-Running Scripts

Refresh cookies periodically to avoid detection:

```python
import asyncio
import time
from pydoll.browser.chromium import Chrome

async def scrape_with_cookie_rotation():
    urls = [f'https://example.com/page{i}' for i in range(100)]
    
    async with Chrome() as browser:
        tab = await browser.start()
        
        # Log in initially
        await tab.go_to('https://example.com/login')
        # ... perform login ...
        await asyncio.sleep(2)
        
        last_rotation = time.time()
        rotation_interval = 600  # Rotate every 10 minutes
        
        for url in urls:
            # Check if it's time to rotate cookies
            if time.time() - last_rotation > rotation_interval:
                print("Rotating session...")
                
                # Delete old cookies
                await tab.delete_all_cookies()
                
                # Re-login or load fresh cookies
                await tab.go_to('https://example.com/login')
                # ... perform login again ...
                
                last_rotation = time.time()
            
            # Scrape page
            await tab.go_to(url)
            await asyncio.sleep(2)
            # ... extract data ...

asyncio.run(scrape_with_cookie_rotation())
```

!!! tip "Rotation Frequency"
    The ideal rotation frequency depends on your use case:
    
    - **High-security sites**: Rotate every 5-15 minutes
    - **Normal sites**: Rotate every 30-60 minutes
    - **Low-risk scraping**: Rotate every few hours


## Cookie Attributes Reference

| Attribute | Type | Description | Default |
|-----------|------|-------------|---------|
| `name` | `str` | Cookie name | *Required* |
| `value` | `str` | Cookie value | *Required* |
| `domain` | `str` | Domain where cookie is valid | Current page domain |
| `path` | `str` | Path where cookie is valid | `/` |
| `secure` | `bool` | Send only over HTTPS | `False` |
| `httpOnly` | `bool` | Not accessible via JavaScript | `False` |
| `sameSite` | `CookieSameSite` | CSRF protection: `Strict`, `Lax`, `None` | Browser default (`Lax`) |
| `expires` | `float` | Unix timestamp (0 = session cookie) | `0` (session) |
| `priority` | `CookiePriority` | Cookie priority: `Low`, `Medium`, `High` | `Medium` |

### SameSite Values

```python
# Use string values directly in your cookie dict:

'sameSite': 'Strict'  # Cookie sent only for same-site requests
'sameSite': 'Lax'     # Cookie sent for top-level navigation (default)
'sameSite': 'None'    # Cookie sent for all requests (requires secure=True)

# Or use the enum for IDE autocomplete:
from pydoll.protocol.network.types import CookieSameSite

cookie = {
    'name': 'session',
    'value': 'xyz',
    'sameSite': CookieSameSite.STRICT  # IDE will autocomplete: STRICT, LAX, NONE
}
```

### Priority Values

```python
# Use string values directly:

'priority': 'Low'     # Low priority (deleted first when space is needed)
'priority': 'Medium'  # Medium priority (default)
'priority': 'High'    # High priority (deleted last)

# Or use the enum:
from pydoll.protocol.network.types import CookiePriority

cookie = {
    'name': 'session',
    'value': 'xyz',
    'priority': CookiePriority.HIGH  # IDE will autocomplete: LOW, MEDIUM, HIGH
}
```

## Common Patterns

### Context Manager for Temporary Cookies

```python
from contextlib import asynccontextmanager

@asynccontextmanager
async def temporary_cookies(browser, tab, cookies):
    """Set cookies, execute code, then restore original cookies."""
    # Save current cookies
    original_cookies = await browser.get_cookies()
    
    try:
        # Set temporary cookies
        await tab.delete_all_cookies()
        await tab.set_cookies(cookies)
        yield tab
    finally:
        # Restore original cookies
        await tab.delete_all_cookies()
        cookies_to_restore = [
            {
                'name': c['name'],
                'value': c['value'],
                'domain': c['domain'],
                'path': c.get('path', '/')
            }
            for c in original_cookies
        ]
        await tab.set_cookies(cookies_to_restore)

# Usage
async with temporary_cookies(browser, tab, test_cookies):
    await tab.go_to('https://example.com')
    # ... perform actions with temporary cookies ...
# Original cookies restored automatically
```

!!! tip "Using Public APIs"
    This context manager takes both `browser` and `tab` as parameters so that it relies only on public APIs. Because `tab` doesn't expose its parent `browser` as a public property, passing the browser explicitly is the recommended way to reach browser-level methods such as `browser.get_cookies()`.

### Cookie Fingerprint Comparison

```python
def cookie_fingerprint(cookies):
    """Generate a simple fingerprint of cookie state."""
    return {
        'count': len(cookies),
        'domains': set(c['domain'] for c in cookies),
        'names': sorted(c['name'] for c in cookies),
        'secure_count': sum(1 for c in cookies if c.get('secure')),
        'httponly_count': sum(1 for c in cookies if c.get('httpOnly')),
    }

# Compare cookie states
before = await browser.get_cookies()
await tab.go_to('https://example.com')
after = await browser.get_cookies()

print(f"Before: {cookie_fingerprint(before)}")
print(f"After: {cookie_fingerprint(after)}")
```

## Security Considerations

!!! danger "Never Hardcode Sensitive Cookies"
    Always load authentication cookies from secure storage (environment variables, encrypted files, secrets managers).
    
    ```python
    # ❌ Bad - hardcoded in code
    cookies = [{'name': 'session', 'value': 'abc123secret'}]
    
    # ✅ Good - loaded from environment
    import os
    cookies = [{
        'name': 'session',
        'value': os.getenv('SESSION_COOKIE'),
        'domain': os.getenv('COOKIE_DOMAIN')
    }]
    ```

!!! warning "Cookie Theft Protection"
    When saving cookies to disk:
    
    - Use encrypted storage (e.g., `cryptography` library)
    - Set restrictive file permissions
    - Never commit cookie files to version control
    - Rotate cookies regularly

## Best Practices Summary

1. **Start with realistic cookies** - Don't run automation with a completely clean browser
2. **Rotate sessions periodically** - Avoid using the same cookies for extended periods
3. **Respect cookie security attributes** - Use `secure`, `httpOnly`, `sameSite` appropriately
4. **Save and reuse authentication cookies** - Skip repetitive logins when appropriate
5. **Isolate contexts for multi-account testing** - Each context has independent cookies
6. **Monitor cookie evolution** - Real browsing accumulates cookies naturally
7. **Clean up expired cookies** - Remove invalid cookies before reuse
8. **Use secure storage** - Encrypt saved cookies, never hardcode secrets

## See Also

- **[Browser Contexts](contexts.md)** - Isolated cookie environments
- **[HTTP Requests](../network/http-requests.md)** - Browser-context requests inherit cookies automatically
- **[Human-Like Interactions](../automation/human-interactions.md)** - Combine cookies with realistic behavior
- **[API Reference: Storage Commands](../../api/commands/storage.md)** - Full CDP cookie methods

Effective cookie management is the foundation of realistic browser automation. By balancing freshness with persistence and respecting security attributes, you can build automation that behaves like a real user while remaining efficient and maintainable.


================================================
FILE: docs/en/features/browser-management/tabs.md
================================================
# Multi-Tab Management

Pydoll provides sophisticated multi-tab capabilities that enable complex automation workflows spanning multiple browser tabs simultaneously. Understanding how tabs work in Pydoll is essential for building robust, scalable automation.

## Understanding Tabs in Pydoll

In Pydoll, a `Tab` instance represents a single browser tab (or window) and provides the primary interface for all page automation operations. Each tab maintains its own:

- **Independent execution context**: JavaScript, DOM, and page state
- **Isolated event handlers**: Callbacks registered on one tab don't affect others
- **Separate network monitoring**: Each tab can track its own network activity
- **Unique CDP connection**: Direct WebSocket communication with the browser

```mermaid
graph LR
    Browser[Browser Instance] --> Tab1[Tab 1]
    Browser --> Tab2[Tab 2]
    Browser --> Tab3[...]
    
    Tab1 --> Features1[Independent<br/>Context]
    Tab2 --> Features2[Independent<br/>Context]
```

| Tab Component | Description | Independence |
|---------------|-------------|--------------|
| **Execution Context** | JavaScript runtime, DOM, page state | ✓ Each tab has its own |
| **Event Handlers** | Registered callbacks for CDP events | ✓ Isolated per tab |
| **Network Monitoring** | HTTP requests, responses, timing | ✓ Track separately |
| **CDP Connection** | WebSocket communication channel | ✓ Direct connection |

### What is a Browser Tab?

A browser tab is technically a **CDP target** - an isolated browsing context with its own:

- Document Object Model (DOM)
- JavaScript execution environment
- Network connection pool
- Cookie storage (shared with other tabs in the same context)
- Event loop and rendering engine

Each tab has a unique `target_id` assigned by the browser, which Pydoll uses to route commands and events correctly.

## Tab Instance Management

Pydoll's `Browser` class maintains a registry of Tab instances keyed by each tab's `target_id`. This ensures that every lookup of the same browser tab returns the same `Tab` object, no matter how the reference was obtained. The Browser stores these instances in an internal `_tabs_opened` dictionary.

| Benefit | Description |
|---------|-------------|
| **Resource Efficiency** | One Tab instance per browser tab, no duplicates |
| **Consistent State** | All references share the same event handlers and state |
| **Memory Safety** | Prevents multiple WebSocket connections to the same target |
| **Predictable Behavior** | Changes in one reference affect all references |

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def tab_registry_demonstration():
    async with Chrome() as browser:
        # Start the browser with initial tab
        tab1 = await browser.start()

        # Get the same tab through different methods
        # Note: get_opened_tabs() returns tabs in reversed order (newest first)
        # So the initial tab (oldest) is at the end
        opened_tabs = await browser.get_opened_tabs()
        tab2 = opened_tabs[-1]  # Initial tab is the oldest, so it's last

        # Both references point to the same object
        # because Browser returns the same instance from its registry
        print(f"Same instance? {tab1 is tab2}")  # True
        print(f"Same target ID? {tab1._target_id == tab2._target_id}")  # True

        # Enabling events through one reference is visible through the other
        await tab1.enable_network_events()
        print(f"Network events on tab2? {tab2.network_events_enabled}")  # True

        # Browser maintains the registry internally
        print(f"Tab registered in browser? {tab1._target_id in browser._tabs_opened}")  # True

asyncio.run(tab_registry_demonstration())
```

!!! info "Browser-Managed Registry"
    The Browser class manages a `_tabs_opened` dictionary keyed by `target_id`. When you request a tab (via `new_tab()` or `get_opened_tabs()`), the Browser checks this registry first. If a Tab instance already exists for that `target_id`, it returns the existing instance; otherwise, it creates a new one and stores it in the registry. (IFrames no longer create Tab entries—interact with them as regular elements.)

## Creating and Managing Tabs

### Starting the Browser

When you start the browser, Pydoll automatically creates and returns a Tab instance for the initial browser tab:

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def start_browser():
    async with Chrome() as browser:
        # Initial tab is created automatically
        tab = await browser.start()
        
        print(f"Tab created with target ID: {tab._target_id}")
        await tab.go_to('https://example.com')
        
        title = await tab.execute_script('return document.title')
        print(f"Page title: {title}")

asyncio.run(start_browser())
```

### Creating Additional Tabs Programmatically

Use `browser.new_tab()` to create additional tabs with full control:

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def create_multiple_tabs():
    async with Chrome() as browser:
        # Start with initial tab
        main_tab = await browser.start()
        
        # Create additional tabs with specific URLs
        search_tab = await browser.new_tab('https://google.com')
        docs_tab = await browser.new_tab('https://docs.python.org')
        news_tab = await browser.new_tab('https://news.ycombinator.com')
        
        # Each tab can be controlled independently
        await search_tab.find(name='q')  # Google search box
        await docs_tab.find(id='search-field')  # Python docs search
        await news_tab.find(class_name='storylink', find_all=True)  # HN stories
        
        # Get all opened tabs
        all_tabs = await browser.get_opened_tabs()
        print(f"Total tabs: {len(all_tabs)}")  # 4 (initial + 3 new)
        
        # Close specific tabs when done
        await search_tab.close()
        await docs_tab.close()
        await news_tab.close()

asyncio.run(create_multiple_tabs())
```

!!! tip "URL Parameter Optional"
    You can create tabs without specifying a URL: `await browser.new_tab()`. The tab will open with a blank page (`about:blank`), ready for navigation.

### Handling User-Opened Tabs

When users click links with `target="_blank"` or use "Open in new tab", Pydoll can detect and manage these tabs:

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def handle_user_tabs():
    async with Chrome() as browser:
        main_tab = await browser.start()
        await main_tab.go_to('https://example.com')
        
        # Record initial tab count
        initial_tabs = await browser.get_opened_tabs()
        print(f"Initial tabs: {len(initial_tabs)}")
        
        # Click a link that opens a new tab (target="_blank")
        external_link = await main_tab.find(text='Open in New Tab')
        await external_link.click()
        
        # Wait for new tab to open
        await asyncio.sleep(2)
        
        # Detect new tabs
        current_tabs = await browser.get_opened_tabs()
        print(f"Current tabs: {len(current_tabs)}")
        
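        # Find the newly opened tab by comparing against the initial list.
        # Don't rely on list position: the order of get_opened_tabs() is not
        # creation order, and the Browser reuses one Tab instance per target.
        new_tabs = [t for t in current_tabs if t not in initial_tabs]
        if new_tabs:
            new_tab = new_tabs[0]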
            
            # Work with the new tab
            url = await new_tab.current_url
            print(f"New tab URL: {url}")
            
            await new_tab.go_to('https://different-site.com')
            title = await new_tab.execute_script('return document.title')
            print(f"New tab title: {title}")
            
            # Close it when done
            await new_tab.close()

asyncio.run(handle_user_tabs())
```

### Listing All Open Tabs

Use `browser.get_opened_tabs()` to retrieve all currently open tabs:

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def list_tabs():
    async with Chrome() as browser:
        # Use the initial tab returned by start()
        initial_tab = await browser.start()
        await initial_tab.go_to('https://example.com')
        
        # Open several more tabs
        await browser.new_tab('https://github.com')
        await browser.new_tab('https://stackoverflow.com')
        await browser.new_tab('https://reddit.com')
        
        # Get all tabs
        all_tabs = await browser.get_opened_tabs()
        
        # Inspect each tab
        for i, tab in enumerate(all_tabs, 1):
            url = await tab.current_url
            title = await tab.execute_script('return document.title')
            print(f"Tab {i}: {title} - {url}")

asyncio.run(list_tabs())
```

## Concurrent Tab Operations

Pydoll's async architecture enables powerful concurrent workflows across multiple tabs:

### Parallel Data Collection

Process multiple pages simultaneously for maximum efficiency:

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def scrape_page(tab, url):
    """Scrape a single page within a given tab."""
    await tab.go_to(url)
    title = await tab.execute_script('return document.title')
    articles = await tab.find(class_name='article', find_all=True)
    content = [await article.text for article in articles[:5]]

    return {
        'url': url,
        'title': title,
        'articles_count': len(articles),
        'sample_content': content
    }

async def concurrent_scraping():
    urls = [
        'https://example.com/page1',
        'https://example.com/page2',
        'https://example.com/page3',
        'https://example.com/page4',
    ]

    async with Chrome() as browser:
        # Start browser and open the first tab
        initial_tab = await browser.start()
        # Create one tab per URL
        tabs = [initial_tab] + [await browser.new_tab() for _ in urls[1:]]

        # Run all scrapers concurrently
        results = await asyncio.gather(*[
            scrape_page(tab, url) for tab, url in zip(tabs, urls)
        ])

        # Display results
        for result in results:
            print(f"\n{result['title']}")
            print(f"  URL: {result['url']}")
            print(f"  Articles: {result['articles_count']}")
            if result['sample_content']:
                print(f"  Sample: {result['sample_content'][0][:100]}...")

asyncio.run(concurrent_scraping())
```

!!! tip "Performance Boost"
    Concurrent scraping can reduce total execution time by 5-10x compared to sequential processing, especially for I/O-bound tasks like page loading.

### Coordinated Multi-Tab Workflows

Orchestrate complex workflows that require multiple tabs to interact:

```python
import asyncio
from pydoll.browser.chromium import Chrome
from pydoll.protocol.network.events import NetworkEvent, RequestWillBeSentEvent

async def multi_tab_workflow():
    async with Chrome() as browser:
        # Use the initial tab for login
        login_tab = await browser.start()
        await login_tab.go_to('https://app.example.com/login')
        await asyncio.sleep(2)
        
        username = await login_tab.find(id='username')
        password = await login_tab.find(id='password')
        
        await username.type_text('admin@example.com')
        await password.type_text('secure_password')
        
        login_btn = await login_tab.find(id='login')
        await login_btn.click()
        await asyncio.sleep(3)
        
        # Tab 2: Navigate to data export page
        export_tab = await browser.new_tab('https://app.example.com/export')
        await asyncio.sleep(2)
        
        export_btn = await export_tab.find(text='Export Data')
        await export_btn.click()
        
        # Tab 3: Monitor API calls in a dashboard
        monitor_tab = await browser.new_tab('https://app.example.com/dashboard')
        await monitor_tab.enable_network_events()
        
        # Track API calls
        api_calls = []
        async def track_api(event: RequestWillBeSentEvent):
            url = event['params']['request']['url']
            if '/api/' in url:
                api_calls.append(url)
        
        await monitor_tab.on(NetworkEvent.REQUEST_WILL_BE_SENT, track_api)
        await asyncio.sleep(5)
        
        print(f"Tracked {len(api_calls)} API calls:")
        for call in api_calls[:10]:
            print(f"  - {call}")
        
        # Clean up
        await login_tab.close()
        await export_tab.close()
        await monitor_tab.close()

asyncio.run(multi_tab_workflow())
```

## Tab Lifecycle and Cleanup

### Explicit Tab Closure

Always close tabs when you're done to free browser resources:

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def explicit_cleanup():
    async with Chrome() as browser:
        initial_tab = await browser.start()
        
        # Create tabs for different tasks
        tab1 = await browser.new_tab('https://example.com')
        tab2 = await browser.new_tab('https://example.org')
        
        # Do work with tabs
        await tab1.go_to('https://different-site.com')
        await tab2.take_screenshot('/tmp/screenshot.png')
        
        # Explicitly close tabs
        await tab1.close()
        await tab2.close()
        
        # Verify tabs are closed
        remaining = await browser.get_opened_tabs()
        print(f"Remaining tabs: {len(remaining)}")  # Should be 1 (initial)

asyncio.run(explicit_cleanup())
```

!!! warning "Memory Leaks"
    Failing to close tabs in long-running automation can lead to memory exhaustion. Each tab consumes browser resources (memory, file handles, network connections).

### Using Context Managers for Automatic Cleanup

While Pydoll doesn't provide a built-in tab context manager, you can create your own:

```python
import asyncio
from contextlib import asynccontextmanager
from pydoll.browser.chromium import Chrome

@asynccontextmanager
async def managed_tab(browser, url=None):
    """Context manager for automatic tab cleanup."""
    tab = await browser.new_tab(url)
    try:
        yield tab
    finally:
        await tab.close()

async def auto_cleanup_example():
    async with Chrome() as browser:
        initial_tab = await browser.start()
        
        # Tab automatically closes when exiting the context
        async with managed_tab(browser, 'https://example.com') as tab:
            title = await tab.execute_script('return document.title')
            print(f"Title: {title}")
            
            await tab.take_screenshot('/tmp/page.png')
        # Tab is automatically closed here
        
        tabs = await browser.get_opened_tabs()
        print(f"Tabs after context exit: {len(tabs)}")  # 1 (initial_tab only)

asyncio.run(auto_cleanup_example())
```

### Browser Cleanup

When the browser closes, all tabs are automatically closed:

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def browser_cleanup():
    # Using context manager - automatic cleanup
    async with Chrome() as browser:
        initial_tab = await browser.start()
        
        # Create multiple tabs
        await browser.new_tab('https://example.com')
        await browser.new_tab('https://github.com')
        await browser.new_tab('https://stackoverflow.com')
        
        tabs = await browser.get_opened_tabs()
        print(f"Tabs open: {len(tabs)}")  # 4 (initial + 3 new)
    
    # All tabs automatically closed when browser exits
    print("Browser closed, all tabs cleaned up")

asyncio.run(browser_cleanup())
```

## Tab State Management

### Checking Tab State

Query various aspects of a tab's current state:

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def check_tab_state():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com')
        
        # Check current URL
        url = await tab.current_url
        print(f"Current URL: {url}")
        
        # Check page source
        source = await tab.page_source
        print(f"Page source length: {len(source)} characters")
        
        # Check enabled event domains
        print(f"Page events enabled: {tab.page_events_enabled}")
        print(f"Network events enabled: {tab.network_events_enabled}")
        print(f"DOM events enabled: {tab.dom_events_enabled}")
        
        # Enable events and check again
        await tab.enable_network_events()
        print(f"Network events enabled: {tab.network_events_enabled}")  # True

asyncio.run(check_tab_state())
```

### Tab Identification

Each tab has unique identifiers:

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def tab_identification():
    async with Chrome() as browser:
        tab1 = await browser.start()
        tab2 = await browser.new_tab()
        
        # Target ID - unique identifier assigned by browser
        print(f"Tab 1 target ID: {tab1._target_id}")
        print(f"Tab 2 target ID: {tab2._target_id}")
        
        # Connection details
        print(f"Tab 1 connection port: {tab1._connection_port}")
        print(f"Tab 2 connection port: {tab2._connection_port}")
        
        # Browser context ID (usually None for default context)
        print(f"Tab 1 context ID: {tab1._browser_context_id}")
        print(f"Tab 2 context ID: {tab2._browser_context_id}")

asyncio.run(tab_identification())
```

## Advanced Tab Features

### Bringing Tabs to Front

Make a specific tab visible (bring to foreground):

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def bring_to_front():
    async with Chrome() as browser:
        tab1 = await browser.start()
        tab2 = await browser.new_tab('https://github.com')
        tab3 = await browser.new_tab('https://stackoverflow.com')
        
        # tab3 is currently in front (last created)
        await asyncio.sleep(2)
        
        # Bring tab1 to front
        await tab1.bring_to_front()
        print("Tab 1 brought to front")
        
        await asyncio.sleep(2)
        
        # Bring tab2 to front
        await tab2.bring_to_front()
        print("Tab 2 brought to front")

asyncio.run(bring_to_front())
```

### Tab-Specific Network Monitoring

Each tab can independently monitor its own network activity:

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def tab_network_monitoring():
    async with Chrome() as browser:
        # Use initial tab for monitored navigation
        tab1 = await browser.start()
        await tab1.go_to('https://example.com')
        
        # Create second tab without monitoring
        tab2 = await browser.new_tab('https://github.com')
        
        # Enable network monitoring only on tab1
        await tab1.enable_network_events()
        
        # Navigate both tabs
        await tab1.go_to('https://example.com/page1')
        await tab2.go_to('https://github.com/explore')
        
        await asyncio.sleep(3)
        
        # Get network logs only from tab1
        tab1_logs = await tab1.get_network_logs()
        print(f"Tab 1 network requests: {len(tab1_logs)}")
        
        # tab2 has no network monitoring
        print(f"Tab 2 network events enabled: {tab2.network_events_enabled}")  # False

asyncio.run(tab_network_monitoring())
```

### Tab-Specific Event Handlers

Register different event handlers on different tabs:

```python
import asyncio
from pydoll.browser.chromium import Chrome
from pydoll.protocol.page.events import PageEvent

async def tab_specific_events():
    async with Chrome() as browser:
        # Use initial tab as first tab
        tab1 = await browser.start()
        tab2 = await browser.new_tab()
        
        # Enable page events on both
        await tab1.enable_page_events()
        await tab2.enable_page_events()
        
        # Different handlers for each tab
        async def tab1_handler(event):
            print("Tab 1 loaded!")
        
        async def tab2_handler(event):
            print("Tab 2 loaded!")
        
        await tab1.on(PageEvent.LOAD_EVENT_FIRED, tab1_handler)
        await tab2.on(PageEvent.LOAD_EVENT_FIRED, tab2_handler)
        
        # Navigate both tabs
        await tab1.go_to('https://example.com')
        await tab2.go_to('https://github.com')
        
        await asyncio.sleep(2)

asyncio.run(tab_specific_events())
```

## Performance Considerations

| Scenario | Resource Impact | Recommendation |
|----------|----------------|----------------|
| **1-5 tabs** | Low | Direct management, no special handling |
| **6-20 tabs** | Moderate | Use semaphores to limit concurrency |
| **21-50 tabs** | High | Batch processing, close tabs aggressively |
| **More than 50 tabs** | Very High | Consider sequential processing or multiple browsers |

### Memory Usage

Each tab consumes approximately:

- **Base memory**: 50-100 MB
- **With network events**: +10-20 MB
- **With DOM events**: +20-50 MB
- **Complex page (SPA)**: +100-300 MB

For 20 tabs with network monitoring: ~1.2-2.4 GB of memory (20 × 60-120 MB per tab), before accounting for complex pages.

## Common Patterns

### Sequential Processing with Single Tab

```python
async def sequential_pattern():
    async with Chrome() as browser:
        tab = await browser.start()
        
        for url in urls:
            await tab.go_to(url)
            # Extract data
            await tab.clear_callbacks()  # Clean up events

asyncio.run(sequential_pattern())
```

### Parallel Processing with Multiple Tabs

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def parallel_pattern():
    urls = [
        'https://example.com/page1',
        'https://example.com/page2',
        'https://example.com/page3',
        'https://example.com/page4',
    ]

    async with Chrome() as browser:
        # Start browser and get initial tab
        initial_tab = await browser.start()
        # Create one tab per URL (reusing initial tab for the first)
        tabs = [initial_tab] + [await browser.new_tab() for _ in urls[1:]]

        async def process_page(tab, url):
            """Process a single page within the given tab."""
            try:
                await tab.go_to(url)
                await asyncio.sleep(2)
                title = await tab.evaluate('document.title')
                print(f"[{url}] {title}")
            finally:
                if tab is not initial_tab:
                    await tab.close()

        # Run all tabs concurrently
        await asyncio.gather(*[
            process_page(tab, url) for tab, url in zip(tabs, urls)
        ])

asyncio.run(parallel_pattern())
```

### Worker Pool Pattern

```python
async def worker_pool_pattern():
    async with Chrome() as browser:
        # Use initial tab as first worker
        initial_tab = await browser.start()
        
        # Create additional worker tabs (5 workers total: 1 initial + 4 new)
        workers = [initial_tab] + [await browser.new_tab() for _ in range(4)]
        
        # Distribute work across all workers
        for url in urls:
            worker = workers[urls.index(url) % len(workers)]
            await worker.go_to(url)
            # Process...
        
        # Cleanup all workers (including initial tab)
        for worker in workers:
            await worker.close()

asyncio.run(worker_pool_pattern())
```

!!! tip "Reusing the Initial Tab"
    Always use the tab returned by `browser.start()` instead of letting it sit idle. This saves browser resources and improves performance. In the examples above, the initial tab is reused as the first worker or for the first URL in the batch.

## See Also

- **[Browser Contexts](contexts.md)** - Isolated browser sessions
- **[Cookies & Sessions](cookies-sessions.md)** - Managing cookies across tabs
- **[Event System](../advanced/event-system.md)** - Tab-specific event handling
- **[Concurrent Scraping](../../features.md#concurrent-scraping)** - Real-world examples

Multi-tab management in Pydoll provides the foundation for building scalable, efficient browser automation. By understanding the tab lifecycle, singleton pattern, and best practices, you can create robust automation workflows that handle complex multi-page scenarios with ease.


================================================
FILE: docs/en/features/configuration/browser-options.md
================================================
# Browser Options (ChromiumOptions)

`ChromiumOptions` is your central configuration hub for customizing browser behavior. It controls everything from command-line arguments and binary location to page load states and content preferences.

!!! info "Related Documentation"
    - **[Browser Preferences](browser-preferences.md)** - Deep dive into Chromium's internal preference system
    - **[Browser Management](../browser-management/tabs.md)** - Working with browser instances and tabs
    - **[Contexts](../browser-management/contexts.md)** - Isolated browsing contexts

## Quick Start

```python
import asyncio
from pydoll.browser.chromium import Chrome
from pydoll.browser.options import ChromiumOptions
from pydoll.constants import PageLoadState

async def main():
    # Create and configure options
    options = ChromiumOptions()
    
    # Basic configuration
    options.headless = True
    options.start_timeout = 15
    options.page_load_state = PageLoadState.INTERACTIVE
    
    # Add command-line arguments
    options.add_argument('--disable-gpu')
    options.add_argument('--window-size=1920,1080')
    
    # Helper properties and methods for common settings
    options.block_notifications = True
    options.block_popups = True
    options.set_default_download_directory('/tmp/downloads')
    
    # Use the configured options
    async with Chrome(options=options) as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com')

asyncio.run(main())
```

## Core Properties

### Command-Line Arguments

Chromium supports hundreds of command-line switches that control browser behavior at the deepest level. Use `add_argument()` to pass flags directly to the browser process.

```python
options = ChromiumOptions()

# Add single argument
options.add_argument('--disable-blink-features=AutomationControlled')

# Add argument with value
options.add_argument('--window-size=1920,1080')
options.add_argument('--user-agent=Mozilla/5.0 ...')

# Remove argument if needed
options.remove_argument('--window-size=1920,1080')

# Get all arguments
all_args = options.arguments
```

!!! tip "Argument Format"
    - Arguments starting with `--` are flags: `--headless`, `--disable-gpu`
    - Arguments with `=` have values: `--window-size=1920,1080`
    - Some accept multiple values: `--disable-features=Feature1,Feature2`

**See [Command-Line Arguments Reference](#command-line-arguments-reference) below for comprehensive lists.**

### Binary Location

Specify a custom browser executable instead of using the system default:

```python
options = ChromiumOptions()

# Linux
options.binary_location = '/opt/google/chrome-beta/chrome'

# macOS
options.binary_location = '/Applications/Google Chrome Canary.app/Contents/MacOS/Google Chrome Canary'

# Windows
options.binary_location = r'C:\Program Files\Google\Chrome Beta\Application\chrome.exe'
```

!!! info "When to Set Binary Location"
    - Testing different Chrome versions (Stable, Beta, Canary)
    - Using Chromium instead of Chrome
    - Using portable browser installations
    - Running specific builds for debugging

### Start Timeout

Control how long Pydoll waits for the browser to start and respond:

```python
options = ChromiumOptions()
options.start_timeout = 20  # seconds (default: 10)
```

!!! warning "Timeout Considerations"
    - **Too low**: Browser may not fully initialize, causing startup failures
    - **Too high**: Hangs will block your automation for longer
    - **Recommended**: 10-15s for most cases, 20-30s for slow systems or heavy browser profiles

### Headless Mode

Run the browser without a visible UI:

```python
options = ChromiumOptions()
options.headless = True  # Automatically adds --headless argument

# Or manually
options.add_argument('--headless')
options.add_argument('--headless=new')  # New headless mode (Chrome 109+)
```

| Mode | Argument | Description |
|------|----------|-------------|
| **Headful** | (none) | Visible browser window (default) |
| **Classic Headless** | `--headless` | Legacy headless mode |
| **New Headless** | `--headless=new` | Modern headless (Chrome 109+, better compatibility) |

!!! tip "New Headless Mode"
    The `--headless=new` mode (Chrome 109+) provides better compatibility with modern web features and is harder to detect. Use it for production automation.

### Page Load State

Control when `tab.go_to()` considers a page "loaded":

```python
from pydoll.constants import PageLoadState

options = ChromiumOptions()
options.page_load_state = PageLoadState.INTERACTIVE  # or PageLoadState.COMPLETE
```

| State | When Navigation Completes | Use Case |
|-------|---------------------------|----------|
| `COMPLETE` (default) | `load` event fired, all resources loaded | Wait for images, fonts, scripts |
| `INTERACTIVE` | `DOMContentLoaded` fired, DOM ready | Faster navigation, interact with DOM immediately |

```python
import asyncio
from pydoll.browser.chromium import Chrome
from pydoll.browser.options import ChromiumOptions
from pydoll.constants import PageLoadState

async def compare_load_states():
    # Complete mode - waits for everything
    options_complete = ChromiumOptions()
    options_complete.page_load_state = PageLoadState.COMPLETE
    
    async with Chrome(options=options_complete) as browser:
        tab = await browser.start()
        
        import time
        start = time.time()
        await tab.go_to('https://example.com')
        complete_time = time.time() - start
        print(f"COMPLETE mode: {complete_time:.2f}s")
    
    # Interactive mode - DOM ready is enough
    options_interactive = ChromiumOptions()
    options_interactive.page_load_state = PageLoadState.INTERACTIVE
    
    async with Chrome(options=options_interactive) as browser:
        tab = await browser.start()
        
        start = time.time()
        await tab.go_to('https://example.com')
        interactive_time = time.time() - start
        print(f"INTERACTIVE mode: {interactive_time:.2f}s")

asyncio.run(compare_load_states())
```

!!! tip "When to Use INTERACTIVE"
    Use `INTERACTIVE` when:
    
    - You only need DOM access, not images/fonts
    - Scraping text content and structure
    - Speed is critical
    - The page has many slow-loading resources
    
    Stick with `COMPLETE` (default) when:
    
    - Taking screenshots (need images loaded)
    - Waiting for JavaScript-heavy apps to fully initialize
    - Testing page load performance

## Command-Line Arguments Reference

Chromium supports hundreds of command-line switches. Below are the most useful for automation, organized by category.

!!! info "Full Reference"
    Complete list of all Chromium switches: [Peter Beverloo's Chromium Command Line Switches](https://peter.sh/experiments/chromium-command-line-switches/)

### Performance & Resource Management

Optimize browser performance for faster automation:

```python
options = ChromiumOptions()

# Disable GPU acceleration (headless, Docker, CI/CD)
options.add_argument('--disable-gpu')
options.add_argument('--disable-software-rasterizer')

# Reduce memory usage
options.add_argument('--disable-dev-shm-usage')  # Docker: overcome /dev/shm size limit
options.add_argument('--disable-extensions')
options.add_argument('--disable-background-networking')

# Disable unnecessary features
options.add_argument('--disable-sync')  # Google account sync
options.add_argument('--disable-translate')
options.add_argument('--disable-background-timer-throttling')
options.add_argument('--disable-backgrounding-occluded-windows')
options.add_argument('--disable-renderer-backgrounding')

# Network optimizations
options.add_argument('--disable-features=NetworkPrediction')
options.add_argument('--dns-prefetch-disable')

# Window and rendering
options.add_argument('--window-size=1920,1080')
options.add_argument('--window-position=0,0')
options.add_argument('--force-device-scale-factor=1')
```

| Argument | Effect | When to Use |
|----------|--------|-------------|
| `--disable-gpu` | No GPU acceleration | Headless, Docker, servers without GPU |
| `--disable-dev-shm-usage` | Use `/tmp` instead of `/dev/shm` | Docker containers with small shared memory |
| `--disable-extensions` | Don't load any extensions | Clean, fast browser for automation |
| `--window-size=W,H` | Set initial window dimensions | Screenshots, consistent viewport |
| `--force-device-scale-factor=1` | Disable high-DPI scaling | Consistent rendering across systems |

### Stealth & Fingerprinting

Make your automation harder to detect with these command-line arguments:

| Argument | Purpose | Example |
|----------|---------|---------|
| `--disable-blink-features=AutomationControlled` | Remove `navigator.webdriver` flag | Essential for stealth |
| `--user-agent=...` | Set realistic, common user agent | Match target region/device |
| `--use-gl=swiftshader` | Software WebGL renderer | Avoid unique GPU fingerprints |
| `--force-webrtc-ip-handling-policy=...` | Prevent WebRTC IP leaks | Use `disable_non_proxied_udp` |
| `--lang=en-US` | Set browser language | Match target locale |
| `--accept-lang=en-US,en;q=0.9` | Accept-Language header | Realistic language preferences |
| `--tz=America/New_York` | Set timezone | Match target region |
| `--no-first-run` | Skip first-run wizards | Cleaner automation |
| `--no-default-browser-check` | Skip default browser prompt | Avoid UI interruptions |
| `--disable-reading-from-canvas` | Canvas fingerprinting mitigation | Reduce uniqueness |
| `--disable-features=AudioServiceOutOfProcess` | Audio fingerprinting mitigation | Reduce uniqueness |

!!! warning "Detection Arms Race"
    No single technique guarantees undetectability. Combine multiple strategies:
    
    1. **Command-line arguments** (this table)
    2. **Browser preferences** - [Browser Preferences - Stealth & Fingerprinting](browser-preferences.md#stealth-fingerprinting)
    3. **Human-like interactions** - [Human-Like Interactions](../automation/human-interactions.md)
    4. **Good IP reputation** - Use residential proxies with clean history

### Security & Privacy

Control security features and privacy settings:

```python
options = ChromiumOptions()

# Sandbox (disable for Docker/CI only)
options.add_argument('--no-sandbox')  # SECURITY RISK - use only in controlled environments
options.add_argument('--disable-setuid-sandbox')

# HTTPS/SSL
options.add_argument('--ignore-certificate-errors')  # Ignore SSL errors
options.add_argument('--ignore-ssl-errors')
options.add_argument('--allow-insecure-localhost')

# Privacy
options.add_argument('--disable-features=Translate')
options.add_argument('--disable-sync')
options.add_argument('--incognito')  # Open in incognito mode

# Permissions auto-grant (for testing)
options.add_argument('--use-fake-ui-for-media-stream')  # Auto-grant camera/mic
options.add_argument('--use-fake-device-for-media-stream')  # Use fake devices
```

!!! danger "Sandbox Warnings"
    **`--no-sandbox` is a security risk!** Only use it when:
    
    - Running in Docker containers (sandbox conflicts with container isolation)
    - CI/CD environments with restricted permissions
    - You fully trust the content being loaded
    
    **Never** use `--no-sandbox` when:
    
    - Visiting untrusted websites
    - Running user-submitted code
    - In production environments with external input

| Argument | Effect | Security Impact |
|----------|--------|-----------------|
| `--no-sandbox` | Disable Chrome sandbox | **HIGH RISK** - Allows code execution |
| `--ignore-certificate-errors` | Skip SSL validation | **MEDIUM RISK** - MITM attacks possible |
| `--incognito` | Private browsing mode | Safer - no persistent state |

### Debugging & Development

Tools for debugging automation and development:

```python
options = ChromiumOptions()

# DevTools
options.add_argument('--auto-open-devtools-for-tabs')

# Logging
options.add_argument('--enable-logging')
options.add_argument('--v=1')  # Verbosity level (0-3)
options.add_argument('--log-level=0')  # 0=INFO, 1=WARNING, 2=ERROR

# Crash handling
options.add_argument('--disable-crash-reporter')
options.add_argument('--no-crash-upload')

# Enable experimental features
options.add_argument('--enable-features=NetworkService,NetworkServiceInProcess')
options.add_argument('--enable-experimental-web-platform-features')

# JavaScript debugging
options.add_argument('--js-flags=--expose-gc')  # Expose garbage collector
```

!!! tip "Remote Debugging"
    Pydoll automatically manages the remote debugging port. To access Chrome DevTools:
    
    ```python
    async with Chrome() as browser:
        tab = await browser.start()
        
        # Get the debugging port
        port = browser._connection_port
        print(f"DevTools available at: http://localhost:{port}")
        
        # Open this URL in your browser to access DevTools
    ```
    
    **Do not** use `--remote-debugging-port` argument - it will conflict with Pydoll's internal management!

### Display & Rendering

Control how the browser renders content:

```python
options = ChromiumOptions()

# Viewport and window
options.add_argument('--window-size=1920,1080')
options.add_argument('--window-position=0,0')
options.add_argument('--start-maximized')
options.add_argument('--start-fullscreen')

# High DPI displays
options.add_argument('--force-device-scale-factor=1')
options.add_argument('--high-dpi-support=1')

# Color and rendering
options.add_argument('--force-color-profile=srgb')
options.add_argument('--disable-accelerated-2d-canvas')
options.add_argument('--disable-accelerated-video-decode')

# Font rendering
options.add_argument('--font-render-hinting=none')
options.add_argument('--disable-font-subpixel-positioning')

# Animations
options.add_argument('--disable-animations')
options.add_argument('--wm-window-animations-disabled')
```

| Argument | Effect | Use Case |
|----------|--------|----------|
| `--window-size=W,H` | Set window dimensions | Screenshots, consistent viewport |
| `--start-maximized` | Open maximized window | UI testing, full-screen captures |
| `--force-device-scale-factor=1` | Disable DPI scaling | Consistent rendering across systems |
| `--disable-animations` | No CSS/UI animations | Faster testing, reduce flakiness |

### Proxy Configuration

Configure proxies for all network traffic:

```python
options = ChromiumOptions()

# HTTP/HTTPS proxy
options.add_argument('--proxy-server=http://proxy.example.com:8080')

# Authenticated proxy
options.add_argument('--proxy-server=http://user:pass@proxy.example.com:8080')

# SOCKS proxy
options.add_argument('--proxy-server=socks5://proxy.example.com:1080')

# Bypass proxy for specific hosts
options.add_argument('--proxy-bypass-list=localhost,127.0.0.1,*.local')

# Proxy auto-config (PAC) file
options.add_argument('--proxy-pac-url=http://proxy.example.com/proxy.pac')
```

!!! info "Proxy Authentication"
    For proxies requiring authentication, Pydoll automatically handles auth challenges when using the `--proxy-server` argument with credentials.
    
    See **[Request Interception](../network/interception.md)** for details on the Fetch domain interaction with proxies.

## Helper Methods

`ChromiumOptions` provides convenient properties and methods for common configuration tasks:

### Download Management

```python
options = ChromiumOptions()

# Set download directory
options.set_default_download_directory('/home/user/downloads')

# Prompt for download location
options.prompt_for_download = True  # Ask user where to save
options.prompt_for_download = False  # Download silently (default)

# Allow multiple automatic downloads
options.allow_automatic_downloads = True  # Allow without prompt
options.allow_automatic_downloads = False  # Block or ask (default)
```

### Content Blocking

```python
options = ChromiumOptions()

# Block pop-ups
options.block_popups = True  # Block (default in most cases)
options.block_popups = False  # Allow

# Block notifications
options.block_notifications = True  # Block requests
options.block_notifications = False  # Allow sites to ask
```

### Privacy Controls

```python
options = ChromiumOptions()

# Password manager
options.password_manager_enabled = False  # Disable save password prompts
options.password_manager_enabled = True  # Enable (default)

# WebRTC leak protection (prevents real IP exposure through WebRTC)
options.webrtc_leak_protection = True  # Adds --force-webrtc-ip-handling-policy=disable_non_proxied_udp
options.webrtc_leak_protection = False  # Disable (default)
```

!!! tip "WebRTC Leak Protection"
    WebRTC can leak your real IP address even when using a proxy. Enable `webrtc_leak_protection` to block non-proxied UDP connections, preventing STUN requests from bypassing your proxy. This is **essential** when using proxies for anonymity. See **[Network Fundamentals - WebRTC](../../deep-dive/network/network-fundamentals.md#webrtc-and-ip-leakage)** for details.

### File Handling

```python
options = ChromiumOptions()

# PDF behavior
options.open_pdf_externally = True  # Download PDFs instead of viewing
options.open_pdf_externally = False  # View in browser (default)
```

### Internationalization

```python
options = ChromiumOptions()

# Accept languages (affects the Accept-Language request header)
options.set_accept_languages('en-US,en;q=0.9,pt-BR;q=0.8')
```

## Complete Configuration Examples

### Fast Scraping Configuration

Optimized for speed and resource efficiency:

```python
import asyncio
from pydoll.browser.chromium import Chrome
from pydoll.browser.options import ChromiumOptions
from pydoll.constants import PageLoadState

def create_fast_scraping_options() -> ChromiumOptions:
    """Ultra-fast configuration for web scraping."""
    options = ChromiumOptions()
    
    # Headless for speed
    options.headless = True
    
    # Faster page loads (DOM ready is enough for scraping)
    options.page_load_state = PageLoadState.INTERACTIVE
    
    # Disable unnecessary features
    options.add_argument('--disable-extensions')
    options.add_argument('--disable-gpu')
    options.add_argument('--disable-dev-shm-usage')
    options.add_argument('--disable-background-networking')
    options.add_argument('--disable-sync')
    options.add_argument('--disable-translate')
    
    # Block content that slows down loading
    options.block_notifications = True
    options.block_popups = True
    
    # Disable images for even faster loading (if you don't need them)
    options.add_argument('--blink-settings=imagesEnabled=false')
    
    # Network optimizations
    options.add_argument('--disable-features=NetworkPrediction')
    options.add_argument('--dns-prefetch-disable')
    
    return options

async def fast_scraping_example():
    options = create_fast_scraping_options()
    
    async with Chrome(options=options) as browser:
        tab = await browser.start()
        
        # Blazingly fast navigation and scraping
        urls = ['https://example.com', 'https://example.org', 'https://example.net']
        
        for url in urls:
            await tab.go_to(url)
            title = await tab.execute_script('return document.title')
            print(f"{url}: {title}")

asyncio.run(fast_scraping_example())
```

### Full Stealth Configuration

For maximum undetectability, combine command-line arguments with browser preferences:

```python
import asyncio
from pydoll.browser.chromium import Chrome
from pydoll.browser.options import ChromiumOptions

def create_full_stealth_options() -> ChromiumOptions:
    """Complete stealth configuration combining arguments and preferences."""
    options = ChromiumOptions()
    
    # ===== Command-Line Arguments =====
    
    # Core stealth
    options.add_argument('--disable-blink-features=AutomationControlled')
    options.add_argument('--disable-features=IsolateOrigins,site-per-process')
    
    # User agent (use a recent, common one)
    options.add_argument('--user-agent=Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/130.0.0.0 Safari/537.36')
    
    # Language and locale
    options.add_argument('--lang=en-US')
    options.add_argument('--accept-lang=en-US,en;q=0.9')
    
    # WebGL (software renderer to avoid unique GPU signatures)
    options.add_argument('--use-gl=swiftshader')
    options.add_argument('--disable-features=WebGLDraftExtensions')
    
    # WebRTC IP leak prevention
    options.webrtc_leak_protection = True

    # Permissions and first-run
    options.add_argument('--no-first-run')
    options.add_argument('--no-default-browser-check')
    
    # Window size (common resolution)
    options.add_argument('--window-size=1920,1080')
    
    # ===== Browser Preferences =====
    # For comprehensive browser preferences configuration, see:
    # https://pydoll.tech/docs/features/configuration/browser-preferences/#stealth-fingerprinting
    
    return options

async def stealth_automation_example():
    options = create_full_stealth_options()
    
    async with Chrome(options=options) as browser:
        tab = await browser.start()
        
        # Test on bot detection sites
        await tab.go_to('https://bot.sannysoft.com')
        await asyncio.sleep(5)
        
        # Your automation here...

asyncio.run(stealth_automation_example())
```

!!! warning "User-Agent Consistency is Critical"
    Setting `--user-agent` only changes the **HTTP header**, but detection systems also check `navigator.userAgent`, `navigator.platform`, `navigator.vendor`, and other JavaScript properties. **Inconsistencies between these values are a strong bot indicator.**
    
    For example, if your HTTP User-Agent says "Windows" but `navigator.platform` says "Linux", you'll be flagged immediately.
    
    **Solution**: You must also override JavaScript properties via CDP to maintain consistency. See **[Browser Fingerprinting - User-Agent Consistency](../../deep-dive/fingerprinting/browser-fingerprinting.md#user-agent-consistency)** for detailed explanation and implementation using `Page.addScriptToEvaluateOnNewDocument`.
    
    This is why comprehensive stealth requires command-line arguments, browser preferences configuration, AND CDP-level JavaScript overrides working together.

!!! tip "Complete Stealth Strategy"
    Command-line arguments are only part of the solution. For maximum stealth:
    
    1. **Use the arguments above** (navigator.webdriver, WebGL, WebRTC)
    2. **Configure browser preferences** - See [Browser Preferences - Stealth & Fingerprinting](browser-preferences.md#stealth-fingerprinting)
    3. **Human-like interactions** - See [Human-Like Interactions](../automation/human-interactions.md)
    4. **Good proxy/IP reputation** - Use residential proxies

### Docker/CI Configuration

For containerized environments:

```python
import asyncio
from pydoll.browser.chromium import Chrome
from pydoll.browser.options import ChromiumOptions
from pydoll.constants import PageLoadState

def create_docker_options() -> ChromiumOptions:
    """Configuration for Docker containers and CI/CD."""
    options = ChromiumOptions()
    
    # Required for Docker
    options.headless = True
    options.add_argument('--no-sandbox')  # Sandbox conflicts with container isolation
    options.add_argument('--disable-dev-shm-usage')  # Overcome /dev/shm size limit
    
    # Stability
    options.add_argument('--disable-gpu')
    options.add_argument('--disable-software-rasterizer')
    
    # Memory optimization
    options.add_argument('--disable-extensions')
    options.add_argument('--disable-background-networking')
    
    # Faster page loads for CI
    options.page_load_state = PageLoadState.INTERACTIVE
    
    # Increase timeout for slow CI runners
    options.start_timeout = 20
    
    # Crash handling
    options.add_argument('--disable-crash-reporter')
    
    return options

async def ci_testing_example():
    options = create_docker_options()
    
    async with Chrome(options=options) as browser:
        tab = await browser.start()
        
        # Run your tests...
        await tab.go_to('https://example.com')
        assert await tab.execute_script('return document.title') == 'Example Domain'

asyncio.run(ci_testing_example())
```

## Troubleshooting

### Browser Won't Start

```python
# Increase timeout
options.start_timeout = 30

# Check binary location
options.binary_location = '/path/to/chrome'

# Docker/CI issues
options.add_argument('--no-sandbox')
options.add_argument('--disable-dev-shm-usage')
```

### Slow Performance

```python
# Disable GPU if not needed
options.add_argument('--disable-gpu')

# Disable images
options.add_argument('--blink-settings=imagesEnabled=false')

# Use INTERACTIVE load state
options.page_load_state = PageLoadState.INTERACTIVE

# Disable unnecessary features
options.add_argument('--disable-extensions')
options.add_argument('--disable-background-networking')
```

### Memory Issues in Docker

```python
# Essential for Docker
options.add_argument('--disable-dev-shm-usage')

# Reduce memory footprint
options.add_argument('--disable-extensions')
options.add_argument('--disable-gpu')
options.add_argument('--single-process')  # Last resort (can be unstable)
```

## Further Reading

- **[Browser Preferences](browser-preferences.md)** - Chromium's internal preference system
- **[Stealth Automation](../automation/human-interactions.md)** - Human-like interactions
- **[Contexts](../browser-management/contexts.md)** - Isolated browsing contexts
- **[Network Interception](../network/interception.md)** - Request/response manipulation

!!! tip "Experimentation is Key"
    Browser configuration is highly dependent on your specific use case. Start with the examples here, then adjust based on your needs. Use `browser._connection_port` to access DevTools and inspect what's happening inside the browser.


================================================
FILE: docs/en/features/configuration/browser-preferences.md
================================================
# Custom Browser Preferences

One of Pydoll's most powerful features is direct access to Chromium's internal preference system. Unlike traditional browser automation tools that only expose a limited set of options, Pydoll gives you the same level of control that extensions and enterprise administrators have, allowing you to configure **any** browser setting available in Chromium's source code.

## Why Browser Preferences Matter

Browser preferences control every aspect of how Chromium behaves:

- **Performance**: Disable features you don't need for faster page loads
- **Privacy**: Control what data the browser collects and sends
- **Automation**: Remove user prompts and confirmations that break workflows
- **Stealth**: Create realistic browser fingerprints to avoid detection
- **Enterprise**: Apply policies typically only available through Group Policy

!!! info "The Power of Direct Access"
    Most automation tools only expose 10-20 common settings. Pydoll gives you access to **hundreds** of preferences, from download behavior to search suggestions, from network prediction to plugin management. If Chromium can do it, you can configure it.

## Quick Start

```python
import asyncio
from pydoll.browser.chromium import Chrome
from pydoll.browser.options import ChromiumOptions

async def preferences_example():
    options = ChromiumOptions()
    
    # Set preferences using a dict
    options.browser_preferences = {
        'download': {
            'default_directory': '/tmp/downloads',
            'prompt_for_download': False
        },
        'profile': {
            'default_content_setting_values': {
                'notifications': 2  # Block notifications
            }
        }
    }
    
    async with Chrome(options=options) as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com')
        
        # Downloads go to /tmp/downloads automatically
        # No notification prompts will appear

asyncio.run(preferences_example())
```

## Understanding Browser Preferences

### What Are Preferences?

Chromium stores all user-configurable settings in a JSON file called `Preferences`, located in the browser's user data directory. This file contains **everything** from your homepage URL to whether images load automatically.

**Typical location:**

- **Linux**: `~/.config/google-chrome/Default/Preferences`
- **macOS**: `~/Library/Application Support/Google/Chrome/Default/Preferences`
- **Windows**: `%LOCALAPPDATA%\Google\Chrome\User Data\Default\Preferences`

### Preferences File Structure

The Preferences file is a nested JSON object:

```json
{
  "download": {
    "default_directory": "/home/user/Downloads",
    "prompt_for_download": true
  },
  "profile": {
    "default_content_setting_values": {
      "notifications": 1,
      "popups": 0
    },
    "password_manager_enabled": true
  },
  "search": {
    "suggest_enabled": true
  },
  "net": {
    "network_prediction_options": 1
  }
}
```

Each dot-separated preference name in Chromium's source maps to a nested JSON path:

- `download.default_directory` → `{'download': {'default_directory': ...}}`
- `profile.password_manager_enabled` → `{'profile': {'password_manager_enabled': ...}}`

### How Chromium Uses Preferences

When Chromium starts:

1. **Reads** the Preferences file from disk
2. **Applies** these settings to configure browser behavior
3. **Updates** the file when users change settings via UI
4. **Falls back** to defaults if preferences are missing

Pydoll hooks in just before step 1: it writes your custom settings into the Preferences file before the browser starts, so Chromium reads them on launch and they are applied from the very first page load.

## How It Works in Pydoll

### Setting Preferences

Use the `browser_preferences` property to set any preference:

```python
from pydoll.browser.options import ChromiumOptions

options = ChromiumOptions()

# Direct assignment - merges with existing preferences
options.browser_preferences = {
    'download': {'default_directory': '/tmp'},
    'intl': {'accept_languages': 'pt-BR,en-US'}
}

# Multiple assignments are merged, not replaced
options.browser_preferences = {
    'profile': {'password_manager_enabled': False}
}

# Both sets of preferences are now active
```

!!! warning "Preferences Are Merged, Not Replaced"
    When you set `browser_preferences` multiple times, the new preferences are **merged** with existing ones. Only the specific keys you set are updated; everything else is preserved.
    
    ```python
    options.browser_preferences = {'download': {'prompt_for_download': False}}
    options.browser_preferences = {'profile': {'password_manager_enabled': False}}
    
    # Result: BOTH preferences are set
    # {'download': {'prompt_for_download': False}, 'profile': {'password_manager_enabled': False}}
    ```

### Nested Path Syntax

Preferences use nested dictionaries that mirror Chromium's dot-notation:

```python
# Chromium source code constant:
# const char kDownloadDefaultDirectory[] = "download.default_directory";

# Translates to Python dict:
options.browser_preferences = {
    'download': {
        'default_directory': '/path/to/downloads'
    }
}
```

The deeper the nesting, the more specific the preference:

```python
# Top-level: profile
# Second-level: default_content_setting_values  
# Third-level: notifications

options.browser_preferences = {
    'profile': {
        'default_content_setting_values': {
            'notifications': 2,  # Block
            'geolocation': 2,    # Block
            'media_stream': 2    # Block
        }
    }
}
```

## Practical Use Cases

### 1. Performance Optimization

Disable resource-intensive features for faster automation:

```python
import asyncio
from pydoll.browser.chromium import Chrome
from pydoll.browser.options import ChromiumOptions

async def performance_optimized_browser():
    options = ChromiumOptions()
    options.browser_preferences = {
        # Disable network prediction and prefetching
        'net': {
            'network_prediction_options': 2  # 2 = Never predict
        },
        # Disable image loading
        'profile': {
            'default_content_setting_values': {
                'images': 2  # 2 = Block, 1 = Allow
            }
        },
        # Disable plugins
        'webkit': {
            'webprefs': {
                'plugins_enabled': False
            }
        },
        # Disable spell check
        'browser': {
            'enable_spellchecking': False
        }
    }
    
    async with Chrome(options=options) as browser:
        tab = await browser.start()
        
        # Pages load 3-5x faster without images and unnecessary features
        await tab.go_to('https://example.com')
        print("Fast loading complete!")

asyncio.run(performance_optimized_browser())
```

!!! tip "Performance Impact"
    Disabling images alone can reduce page load time by 50-70% for image-heavy sites. Combine with disabling prefetch, spell check, and plugins for maximum speed.

### 2. Privacy & Anti-Tracking

Create a privacy-focused browser configuration:

```python
import asyncio
from pydoll.browser.chromium import Chrome
from pydoll.browser.options import ChromiumOptions

async def privacy_focused_browser():
    options = ChromiumOptions()
    options.browser_preferences = {
        # Enable Do Not Track
        'enable_do_not_track': True,
        
        # Disable referrers
        'enable_referrers': False,
        
        # Disable Safe Browsing (sends URLs to Google)
        'safebrowsing': {
            'enabled': False
        },
        
        # Disable password manager and block third-party cookies.
        # Both settings live under 'profile', so they must share a single entry:
        # repeating a key in a dict literal silently discards the earlier value.
        'profile': {
            'password_manager_enabled': False,
            'block_third_party_cookies': True,
            'cookie_controls_mode': 1
        },
        
        # Disable autofill
        'autofill': {
            'enabled': False,
            'profile_enabled': False
        },
        
        # Disable search suggestions (sends queries to search engine)
        'search': {
            'suggest_enabled': False
        },
        
        # Disable telemetry and metrics
        'user_experience_metrics': {
            'reporting_enabled': False
        }
    }
    
    async with Chrome(options=options) as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com')
        print("Privacy-focused browser ready!")

asyncio.run(privacy_focused_browser())
```

### 3. Silent Downloads

Automate file downloads without user interaction:

```python
import asyncio
from pathlib import Path
from pydoll.browser.chromium import Chrome
from pydoll.browser.options import ChromiumOptions

async def silent_download_automation():
    download_dir = Path.home() / 'automation_downloads'
    download_dir.mkdir(exist_ok=True)
    
    options = ChromiumOptions()
    options.browser_preferences = {
        'download': {
            'default_directory': str(download_dir),
            'prompt_for_download': False,
            'directory_upgrade': True
        },
        'profile': {
            'default_content_setting_values': {
                'automatic_downloads': 1  # 1 = Allow, 2 = Block
            }
        },
        # Always download PDFs instead of opening in viewer
        'plugins': {
            'always_open_pdf_externally': True
        }
    }
    
    async with Chrome(options=options) as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com/downloads')
        
        # Click download links - files save automatically
        download_link = await tab.find(text='Download Report')
        await download_link.click()
        
        await asyncio.sleep(3)
        print(f"File downloaded to: {download_dir}")

asyncio.run(silent_download_automation())
```

### 4. Block Intrusive UI Elements

Remove popups, notifications, and prompts that break automation:

```python
import asyncio
from pydoll.browser.chromium import Chrome
from pydoll.browser.options import ChromiumOptions

async def clean_ui_browser():
    options = ChromiumOptions()
    options.browser_preferences = {
        'profile': {
            'default_content_setting_values': {
                'notifications': 2,      # Block notifications
                'popups': 0,             # Block popups
                'geolocation': 2,        # Block location requests
                'media_stream': 2,       # Block camera/mic access
                'media_stream_mic': 2,   # Block microphone
                'media_stream_camera': 2 # Block camera
            }
        },
        # Disable translation prompts
        'translate': {
            'enabled': False
        },
        # Disable save password prompt
        'credentials_enable_service': False,
        
        # Open DevTools in a separate (undocked) window so it never covers the page
        'devtools': {
            'preferences': {
                'currentDockState': '"undocked"'
            }
        }
    }
    
    async with Chrome(options=options) as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com')
        # No popups, no prompts, clean automation!

asyncio.run(clean_ui_browser())
```

### 5. Internationalization & Localization

Configure language and locale preferences:

```python
import asyncio
from pydoll.browser.chromium import Chrome
from pydoll.browser.options import ChromiumOptions

async def localized_browser():
    options = ChromiumOptions()
    options.browser_preferences = {
        # Accept languages (priority order)
        'intl': {
            'accept_languages': 'pt-BR,pt,en-US,en'
        },
        
        # Spellcheck languages
        'spellcheck': {
            'dictionaries': ['pt-BR', 'en-US']
        },
        
        # Translate settings
        'translate': {
            'enabled': True
        },
        'translate_blocked_languages': ['en'],  # Don't offer to translate English
        
        # Default character encoding
        'default_charset': 'UTF-8'
    }
    
    async with Chrome(options=options) as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com')
        # Browser configured for Brazilian Portuguese

asyncio.run(localized_browser())
```

## Helper Methods

For common scenarios, Pydoll provides convenience methods:

```python
from pydoll.browser.options import ChromiumOptions

options = ChromiumOptions()

# Download management
options.set_default_download_directory('/tmp/downloads')
options.prompt_for_download = False
options.allow_automatic_downloads = True
options.open_pdf_externally = True

# Content blocking
options.block_notifications = True
options.block_popups = True

# Privacy
options.password_manager_enabled = False

# Internationalization
options.set_accept_languages('pt-BR,en-US,en')
```

These methods are shortcuts that set the correct nested preferences for you:

```python
# This helper:
options.set_default_download_directory('/tmp')

# Is equivalent to:
options.browser_preferences = {
    'download': {
        'default_directory': '/tmp'
    }
}
```

!!! tip "Combine Helpers with Direct Preferences"
    Use helpers for common settings and `browser_preferences` for advanced configuration:
    
    ```python
    # Start with helpers
    options.block_notifications = True
    options.prompt_for_download = False
    
    # Add advanced preferences
    options.browser_preferences = {
        'net': {'network_prediction_options': 2},
        'webkit': {'webprefs': {'plugins_enabled': False}}
    }
    ```

## Finding Preferences in Chromium Source

### Source Code Reference

Chromium defines all preference constants in `pref_names.cc`:

**Official source**: [chromium/src/+/main/chrome/common/pref_names.cc](https://chromium.googlesource.com/chromium/src/+/main/chrome/common/pref_names.cc)

### Reading the Source

Preference constants use dot-notation that maps directly to nested dicts:

```cpp
// From Chromium source (pref_names.cc):
const char kDownloadDefaultDirectory[] = "download.default_directory";
const char kPromptForDownload[] = "download.prompt_for_download";
const char kSafeBrowsingEnabled[] = "safebrowsing.enabled";
const char kBlockThirdPartyCookies[] = "profile.block_third_party_cookies";
```

**Converts to Python:**

```python
options.browser_preferences = {
    'download': {
        'default_directory': '/path/to/dir',
        'prompt_for_download': False
    },
    'safebrowsing': {
        'enabled': False
    },
    'profile': {
        'block_third_party_cookies': True
    }
}
```

### Discovery Process

1. **Search the source**: Go to [pref_names.cc](https://chromium.googlesource.com/chromium/src/+/main/chrome/common/pref_names.cc)
2. **Find your preference**: Search for keywords (e.g., "download", "password", "notification")
3. **Note the constant name**: e.g., `kDownloadDefaultDirectory[] = "download.default_directory"`
4. **Convert to dict**: Split by dots and create nested structure

**Example - Finding notification preferences:**

```cpp
// Search for "notification" in pref_names.cc:
const char kPushMessagingAppIdentifierMap[] = 
    "gcm.push_messaging_application_id_map";
const char kDefaultNotificationsSetting[] = 
    "profile.default_content_setting_values.notifications";
```

```python
# Becomes:
options.browser_preferences = {
    'profile': {
        'default_content_setting_values': {
            'notifications': 2  # 2 = block, 1 = allow, 0 = ask
        }
    }
}
```

### Common Preference Patterns

| Category | Example Constant | Python Dict Path |
|----------|-----------------|------------------|
| Downloads | `download.default_directory` | `{'download': {'default_directory': ...}}` |
| Content Settings | `profile.default_content_setting_values.X` | `{'profile': {'default_content_setting_values': {'X': ...}}}` |
| Network | `net.network_prediction_options` | `{'net': {'network_prediction_options': ...}}` |
| Privacy | `safebrowsing.enabled` | `{'safebrowsing': {'enabled': ...}}` |
| Session | `session.restore_on_startup` | `{'session': {'restore_on_startup': ...}}` |

!!! warning "Undocumented Preferences"
    Not all preferences are documented. Some are:
    
    - **Experimental**: May change or be removed in future Chromium versions
    - **Internal**: Used by Chromium's internal systems
    - **Platform-specific**: Only work on certain operating systems
    
    Test thoroughly before relying on undocumented preferences.

## Useful Preferences Reference

Here's a curated list of interesting and useful preferences from Chromium's `pref_names.cc`:

### Content & Media Settings

```python
options.browser_preferences = {
    'profile': {
        'default_content_setting_values': {
            # Content control (0=Chromium's default for that type, 1=allow, 2=block)
            'cookies': 1,                    # Allow cookies
            'images': 1,                     # Allow images (2 to block)
            'javascript': 1,                 # Allow JavaScript (2 to block)
            'plugins': 2,                    # Block plugins (Flash, etc.)
            'popups': 0,                     # Default behavior (popups are blocked by default)
            'geolocation': 2,                # Block location requests
            'notifications': 2,              # Block notifications
            'media_stream': 2,               # Block camera/microphone
            'media_stream_mic': 2,           # Block microphone only
            'media_stream_camera': 2,        # Block camera only
            'automatic_downloads': 1,        # Allow automatic downloads
            'midi_sysex': 2,                 # Block MIDI access
            'clipboard': 1,                  # Allow clipboard access
            'sensors': 2,                    # Block motion sensors
            'usb_guard': 2,                  # Block USB device access
            'serial_guard': 2,               # Block serial port access
            'bluetooth_guard': 2,            # Block Bluetooth
            'file_system_write_guard': 2,    # Block file system writes
        }
    }
}
```

### Network & Performance

```python
options.browser_preferences = {
    'net': {
        # Network prediction: 0=always, 1=wifi only, 2=never
        'network_prediction_options': 2,
        
        # Quick check for server reachability
        'quick_check_enabled': False
    },
    
    # DNS prefetching
    'dns_prefetching': {
        'enabled': False  # Disable to reduce network traffic
    },
    
    # Preconnect to search results
    'search': {
        'suggest_enabled': False,           # Disable search suggestions
        'instant_enabled': False            # Disable instant results
    },
    
    # Alternate error pages
    'alternate_error_pages': {
        'enabled': False  # Don't suggest alternatives for 404s
    }
}
```

### Download Preferences

```python
options.browser_preferences = {
    'download': {
        'default_directory': '/path/to/downloads',
        'prompt_for_download': False,
        'directory_upgrade': True,
        'extensions_to_open': '',           # File types to auto-open
    },
    
    # PDF handling is a `plugins.*` preference, not a `download.*` one
    'plugins': {
        'always_open_pdf_externally': True  # Don't use internal PDF viewer
    },
    
    'download_bubble': {
        'partial_view_enabled': True        # Show download progress bubble
    },
    
    'safebrowsing': {
        'enabled': False  # Disable Safe Browsing download warnings
    }
}
```

### Privacy & Security

```python
options.browser_preferences = {
    # Do Not Track
    'enable_do_not_track': True,
    
    # Referrers
    'enable_referrers': False,
    
    # Safe Browsing
    'safebrowsing': {
        'enabled': False,                   # Disable Safe Browsing
        'enhanced': False                   # Disable enhanced protection
    },
    
    # Privacy Sandbox (Google's cookie replacement)
    'privacy_sandbox': {
        'apis_enabled': False,
        'topics_enabled': False,
        'fledge_enabled': False
    },
    
    # Third-party cookies
    'profile': {
        'block_third_party_cookies': True,
        'cookie_controls_mode': 1,          # 0=off, 1=block third-party, 2=block in incognito only
        
        # Content settings
        'default_content_setting_values': {
            'cookies': 1,
            'third_party_cookie_blocking_enabled': True
        }
    },
    
    # WebRTC (can leak real IP)
    'webrtc': {
        'ip_handling_policy': 'default_public_interface_only',
        'multiple_routes_enabled': False,
        'nonproxied_udp_enabled': False
    }
}
```

### Autofill & Passwords

```python
options.browser_preferences = {
    'autofill': {
        'enabled': False,                   # Disable form autofill
        'profile_enabled': False,           # Disable address autofill
        'credit_card_enabled': False,       # Disable credit card autofill
        'credit_card_fido_auth_enabled': False
    },
    
    'profile': {
        'password_manager_enabled': False,
        'password_manager_leak_detection': False
    },
    
    'credentials_enable_service': False,
    'credentials_enable_autosignin': False
}
```

### Browser Behavior & UI

```python
import time

options.browser_preferences = {
    # Homepage and startup
    'homepage': 'https://www.google.com',
    'homepage_is_newtabpage': False,
    'newtab_page_location_override': 'https://www.google.com',
    
    'session': {
        'restore_on_startup': 1,            # 0=new tab, 1=restore, 4=specific URLs, 5=new tab page
        'startup_urls': ['https://www.google.com'],
        'session_data_status': 3            # Session data status (internal)
    },
    
    # Welcome page and window
    'browser': {
        'has_seen_welcome_page': True,      # Skip welcome screen
        'window_placement': {
            'bottom': 1032,                 # Window bottom position
            'left': 2247,                   # Window left position
            'right': 3192,                  # Window right position
            'top': 31,                      # Window top position
            'maximized': False,             # Window is maximized
            'work_area_bottom': 1080,       # Screen work area bottom
            'work_area_left': 1920,         # Screen work area left
            'work_area_right': 3840,        # Screen work area right
            'work_area_top': 0              # Screen work area top
        }
    },
    
    # Extensions
    'extensions': {
        'ui': {
            'developer_mode': False
        },
        'alerts': {
            'initialized': True
        },
        'theme': {
            'system_theme': 2               # 0=default, 1=light, 2=dark
        },
        'last_chrome_version': '130.0.6723.91'  # Must match your version
    },
    
    # Translate
    'translate': {
        'enabled': False                    # Disable translation prompts
    },
    'translate_blocked_languages': ['en'],  # Never translate English
    'translate_site_blacklist': [],         # Legacy (use blocklist_with_time)
    
    # Bookmarks
    'bookmark_bar': {
        'show_on_all_tabs': False
    },
    
    # Tabs
    'tabs': {
        'new_tab_position': 0               # 0=right, 1=after current
    },
    'pinned_tabs': [],                      # List of pinned tab URLs
    
    # New Tab Page (timestamps in Chrome format)
    'NewTabPage': {
        'PrevNavigationTime': str(int(time.time() * 1000000) + 11644473600000000)  # Chrome timestamp
    },
    'ntp': {
        'num_personal_suggestions': 6       # Number of suggestions (0-10)
    },
    
    # Toolbar customization
    'toolbar': {
        'pinned_chrome_labs_migration_complete': True
    }
}
```

!!! info "Chrome Timestamp Format"
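    Chrome stores timestamps as microseconds since January 1, 1601 UTC. This is the same epoch as Windows FILETIME, but counted in microseconds rather than FILETIME's 100-nanosecond ticks.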
    
    Convert Python timestamp:
    ```python
    import time
    chrome_time = int(time.time() * 1000000) + 11644473600000000
    ```

### Spelling & Language

```python
options.browser_preferences = {
    'browser': {
        'enable_spellchecking': False       # Disable spell check
    },
    
    'spellcheck': {
        'dictionaries': ['en-US', 'pt-BR'], # Spell check languages
        'dictionary': '',                   # Legacy preference (keep empty)
        'use_spelling_service': False       # Don't send to Google
    },
    
    'intl': {
        'accept_languages': 'pt-BR,pt,en-US,en',
        'selected_languages': 'pt-BR,pt,en-US,en'  # Explicitly selected
    },
    
    # Translation behavior and history
    'translate': {
        'enabled': True
    },
    'translate_accepted_count': {
        'pt-BR': 0,
        'es': 5                             # Accepted 5 Spanish translations
    },
    'translate_denied_count_for_language': {
        'en': 10                            # Never translate English
    },
    'translate_ignored_count_for_language': {
        'en': 1
    },
    'translate_site_blocklist_with_time': {},  # Sites never to translate
    
    # Accessibility caption language
    'accessibility': {
        'captions': {
            'live_caption_language': 'pt-BR'
        }
    },
    
    # Language model counters (usage statistics)
    'language_model_counters': {
        'en': 2,                            # English word count
        'pt': 10                            # Portuguese word count
    }
}
```

!!! info "Language Model Counters"
    These counters track language usage statistics for Chrome's machine learning models:
    
    - Used for predicting user language preferences
    - Affects search suggestions and autocomplete
    - Higher counts indicate more frequent use
    - Realistic values: 0-1000 for occasional use, 1000+ for heavy use

### Accessibility

```python
options.browser_preferences = {
    'accessibility': {
        'image_labels_enabled': False       # Don't get image labels from Google
    },
    
    # Font settings
    'webkit': {
        'webprefs': {
            'default_font_size': 16,
            'default_fixed_font_size': 13,
            'minimum_font_size': 0,
            'minimum_logical_font_size': 6,
            'fonts': {
                'standard': {
                    'Zyyy': 'Arial'
                },
                'serif': {
                    'Zyyy': 'Times New Roman'
                }
            }
        }
    }
}
```

### Media & Audio

```python
options.browser_preferences = {
    # Audio
    'audio': {
        'mute_enabled': False               # Start with audio on/off
    },
    
    # Autoplay
    'media': {
        'autoplay_policy': 0,               # 0=allow, 1=user gesture, 2=document user activation
        'video_fullscreen_orientation_lock': False
    },
    
    # WebGL
    'webkit': {
        'webprefs': {
            'webgl_enabled': True,          # Enable/disable WebGL
            'webgl2_enabled': True
        }
    }
}
```

### Printing

```python
options.browser_preferences = {
    'printing': {
        'print_preview_sticky_settings': {
            'appState': '{\"version\":2,\"recentDestinations\":[{\"id\":\"Save as PDF\",\"origin\":\"local\"}],\"marginsType\":3,\"customMargins\":{\"marginTop\":63,\"marginRight\":192,\"marginBottom\":240,\"marginLeft\":260}}'
        }
    },
    
    'savefile': {
        'default_directory': '/tmp'         # Default save location for PDFs
    }
}
```

!!! tip "Printing appState Format"
    The `appState` is a JSON-encoded string. For easier manipulation:
    
    ```python
    import json
    
    app_state = {
        'version': 2,
        'recentDestinations': [{
            'id': 'Save as PDF',
            'origin': 'local'
        }],
        'marginsType': 3,                   # 0=default, 1=no margins, 2=minimum, 3=custom
        'customMargins': {
            'marginTop': 63,
            'marginRight': 192,
            'marginBottom': 240,
            'marginLeft': 260
        },
        'isHeaderFooterEnabled': False,
        'scaling': '100',
        'scalingType': 3,                   # 0=default, 1=fit to page, 2=fit to paper, 3=custom
        'isColorEnabled': True,
        'isDuplexEnabled': False,
        'isCssBackgroundEnabled': True,
        'dpi': {
            'horizontal_dpi': 300,
            'vertical_dpi': 300,
            'is_default': True
        },
        'mediaSize': {
            'name': 'ISO_A4',
            'width_microns': 210000,
            'height_microns': 297000,
            'custom_display_name': 'A4',
            'is_default': True
        }
    }
    
    # Convert to string for appState
    options.browser_preferences = {
        'printing': {
            'print_preview_sticky_settings': {
                'appState': json.dumps(app_state)
            }
        }
    }
    ```

### WebRTC & Peer-to-Peer

```python
options.browser_preferences = {
    'webrtc': {
        # IP handling policy
        'ip_handling_policy': 'default_public_interface_only',
        
        # UDP transport options
        'udp_port_range': '10000-10100',    # Restrict UDP port range
        
        # Disable peer-to-peer
        'multiple_routes_enabled': False,
        'nonproxied_udp_enabled': False,
        
        # Text log collection
        'text_log_collection_allowed': False
    }
}
```

### Site Isolation & Security

```python
options.browser_preferences = {
    # Site isolation
    'site_isolation': {
        'isolate_origins': '',              # Comma-separated origins to isolate
        'site_per_process': True            # Full site isolation
    },
    
    # Mixed content
    'mixed_content': {
        'auto_upgrade_enabled': True        # Upgrade HTTP to HTTPS
    },
    
    # SSL/TLS
    'ssl': {
        'rev_checking': {
            'enabled': True                 # Check certificate revocation
        }
    }
}
```

### Installation & Country Metadata

```python
import uuid
from pydoll.browser.options import ChromiumOptions

options = ChromiumOptions()
options.browser_preferences = {
    # Country ID at install (affects default settings and locale)
    'countryid_at_install': 16978,          # Varies by country (e.g., 16978 for Brazil)
    
    # Default apps installation state
    'default_apps_install_state': 3,        # 0=not installed, 1=installed, 3=migrated
    
    # Enterprise profile GUID (for managed browsers)
    'enterprise_profile_guid': str(uuid.uuid4()),
    
    # Default search provider
    'default_search_provider': {
        'guid': ''                          # Empty for default (Google)
    }
}
```

!!! info "Country ID Values"
    `countryid_at_install` is a numeric code representing the country where Chrome was first installed. It packs the two-letter country code into an integer as `(ord(first_letter) << 8) | ord(second_letter)`:
    
    - **16978**: Brazil (BR)
    - **21843**: United States (US)
    - **18242**: Great Britain (GB)
    - **17477**: Germany (DE)
    - **19024**: Japan (JP)
    - And many others...
    
    This affects default language, currency, and regional settings. For realistic fingerprinting, match this to your target region.

### Experimental Features

```python
options.browser_preferences = {
    # Chrome Labs experiments
    'browser': {
        'labs': {
            'enabled': False
        }
    },
    
    # Preloading
    'preload': {
        'enabled': False                    # Disable page preloading
    },
    
    # Smooth scrolling
    'smooth_scrolling': {
        'enabled': True
    },
    
    # Hardware acceleration
    'hardware_acceleration_mode': {
        'enabled': True                     # Set to False to disable (may help headless performance)
    }
}
```

### DevTools & Developer Options

```python
options.browser_preferences = {
    'devtools': {
        'preferences': {
            # DevTools appearance
            'currentDockState': '"right"',              # "bottom", "right", "undocked"
            'uiTheme': '"dark"',                        # "dark", "light", "system"
            
            # Console settings
            'consoleTimestampsEnabled': 'true',
            'preserveConsoleLog': 'true',
            
            # Network panel
            'network.disableCache': 'false',
            'network.color-code-resource-types': 'true',
            'network-panel-split-view-state': '{"vertical":{"size":0}}',
            
            # Source maps
            'cssSourceMapsEnabled': 'true',
            'jsSourceMapsEnabled': 'true',
            
            # Elements panel
            'elements.styles.sidebar.width': '{"vertical":{"size":0,"showMode":"OnlyMain"}}',
            
            # Inspector versioning
            'inspectorVersion': '37',
            
            # Selected panel
            'panel-selected-tab': '"network"',          # Last opened panel
            
            # Request info expanded categories
            'request-info-general-category-expanded': 'true',
            'request-info-request-headers-category-expanded': 'true',
            'request-info-response-headers-category-expanded': 'true'
        },
        'synced_preferences_sync_disabled': {
            'adorner-settings': '[{"adorner":"grid","isEnabled":true},{"adorner":"flex","isEnabled":true}]',
            'syncedInspectorVersion': '37'
        }
    },
    
    # GCM (Google Cloud Messaging)
    'gcm': {
        'product_category_for_subtypes': 'com.chrome.linux'  # com.chrome.windows, com.chrome.macos
    }
}
```

!!! tip "DevTools Preferences Format"
    DevTools preferences use a unique format where every value is stored as a **JSON-encoded string** (e.g., `'true'` not `True`, `'"dark"'` not `'dark'`). This is because DevTools serializes each setting to JSON text before storing it.
    
    For complex objects, encode the object once with `json.dumps` and pass the resulting string:
    ```python
    import json
    
    # Create the object
    split_view = {'vertical': {'size': 0}}
    
    # JSON-encode it so DevTools can parse it back into an object
    devtools_value = json.dumps(split_view, separators=(',', ':'))
    # Result: '{"vertical":{"size":0}}'
    ```

### Sync & Sign-In Control

```python
import time
from pydoll.browser.options import ChromiumOptions

options = ChromiumOptions()
options.browser_preferences = {
    'signin': {
        'allowed': True,                        # Allow sign-in to Google
        'cookie_clear_on_exit_migration_notice_complete': True
    },
    
    'sync': {
        'data_type_status_for_sync_to_signin': {
            'bookmarks': False,
            'history': False,
            'passwords': False,
            'preferences': False
        },
        'encryption_bootstrap_token_per_account_migration_done': True,
        'passwords_per_account_pref_migration_done': True,
        'feature_status_for_sync_to_signin': 5
    },
    
    # Google services
    'google': {
        'services': {
            'signin_scoped_device_id': '<your-device-id>'  # Generate unique ID
        }
    },
    
    # GAIA (Google Accounts Infrastructure)
    'gaia_cookie': {
        'changed_time': str(int(time.time())),
        'hash': '',
        'last_list_accounts_data': '[]'
    }
}
```

### Optimization & Performance Tracking

```python
import time
from pydoll.browser.options import ChromiumOptions

options = ChromiumOptions()
options.browser_preferences = {
    # Optimization guide (Google's performance hints)
    'optimization_guide': {
        'hintsfetcher': {
            'hosts_successfully_fetched': {}
        },
        'predictionmodelfetcher': {
            'last_fetch_attempt': str(int(time.time())),
            'last_fetch_success': str(int(time.time()))
        },
        'previously_registered_optimization_types': {}
    },
    
    # History clusters (grouping related browsing)
    'history_clusters': {
        'all_cache': {
            'all_keywords': {},
            'all_timestamp': str(int(time.time()))
        },
        'last_selected_tab': 0,
        'short_cache': {
            'short_keywords': {},
            'short_timestamp': '0'
        }
    },
    
    # Domain diversity metrics
    'domain_diversity': {
        'last_reporting_timestamp': str(int(time.time()))
    },
    
    # Segmentation platform (user behavior analysis)
    'segmentation_platform': {
        'device_switcher_util': {
            'result': {
                'labels': ['NotSynced']
            }
        },
        'last_db_compaction_time': str(int(time.time()))
    },
    
    # Zero suggest (omnibox predictions)
    'zerosuggest': {
        'cachedresults': '',
        'cachedresults_with_url': {}
    }
}
```

!!! info "Performance Tracking Preferences"
    These preferences are typically used by Chrome to track and optimize performance. For automation, you can leave them empty or set realistic values to appear more like a normal browser.

### Session Events & Crash Handling

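Chrome tracks session history for recovery and telemetry. Timestamps in the event log use Chrome's internal time format (microseconds since 1601-01-01 UTC), which is why the example adds `11644473600000000` (the offset between 1601 and the Unix epoch, in microseconds) to the current Unix time: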

```python
import time
from pydoll.browser.options import ChromiumOptions

options = ChromiumOptions()
options.browser_preferences = {
    'sessions': {
        'event_log': [
            {
                'crashed': False,
                'time': str(int(time.time() * 1000000) + 11644473600000000),
                'type': 0                   # 0=session start
            },
            {
                'crashed': False,
                'did_schedule_command': True,
                'first_session_service': True,
                'tab_count': 1,
                'time': str(int(time.time() * 1000000) + 11644473600000000),
                'type': 2,                  # 2=session data saved
                'window_count': 1
            }
        ],
        'session_data_status': 3            # 0=unknown, 1=no data, 2=some data, 3=full data
    },
    
    # Profile exit type (important for fingerprinting)
    'profile': {
        'exit_type': 'Crashed'              # 'Normal', 'Crashed', 'SessionEnded'
    }
}
```

!!! warning "Crashed vs Normal"
    Most real browsers **crash occasionally**. Always showing `'Normal'` exit is suspicious.
    
    **Realistic strategy**: Set `'Crashed'` for ~10-20% of profiles to simulate a normal user experience. Ironically, having occasional "crashes" makes your automation look more human.

!!! tip "Session Event Types"
    - **Type 0**: Session start
    - **Type 1**: Session ended normally
    - **Type 2**: Session data saved (tabs, windows)
    - **Type 3**: Session restored
    
    The `event_log` builds a history of browser sessions over time.

## Stealth & Fingerprinting

Creating a realistic browser fingerprint is crucial for avoiding bot detection systems. This section covers both basic and advanced techniques.

### Quick Stealth Setup

For most use cases, this simple configuration provides good anti-detection:

```python
import asyncio
import time
from pydoll.browser.chromium import Chrome
from pydoll.browser.options import ChromiumOptions

async def quick_stealth():
    options = ChromiumOptions()
    
    # Simulate a 60-day-old browser
    fake_timestamp = int(time.time()) - (60 * 24 * 60 * 60)
    
    options.browser_preferences = {
        # Fake usage history
        'profile': {
            'last_engagement_time': fake_timestamp,
            'exited_cleanly': True,
            'exit_type': 'Normal'
        },
        
        # Realistic homepage
        'homepage': 'https://www.google.com',
        'session': {
            'restore_on_startup': 1,
            'startup_urls': ['https://www.google.com']
        },
        
        # Enable features real users have
        'enable_do_not_track': False,  # Most users don't enable this
        'safebrowsing': {'enabled': True},
        'autofill': {'enabled': True},
        'search': {'suggest_enabled': True},
        'dns_prefetching': {'enabled': True}
    }
    
    async with Chrome(options=options) as browser:
        tab = await browser.start()
        await tab.go_to('https://bot-detection-site.com')
        print("Stealth mode activated!")

asyncio.run(quick_stealth())
```

!!! tip "Key Stealth Principles"
    **Enable, don't disable**: Real users have Safe Browsing, autofill, and search suggestions enabled. Disabling everything looks suspicious.
    
    **Age your profile**: Fresh installs are a red flag. Simulate a browser that's been used for weeks or months.
    
    **Match the majority**: Use default settings that 90% of users have, not privacy-focused configurations.

### Advanced Fingerprinting

For maximum realism, simulate detailed browser usage history:

```python
import time
from pydoll.browser.chromium import Chrome
from pydoll.browser.options import ChromiumOptions

def create_realistic_browser() -> ChromiumOptions:
    """Create a browser with comprehensive fingerprinting resistance."""
    options = ChromiumOptions()
    
    # Timestamps
    current_time = int(time.time())
    install_time = current_time - (90 * 24 * 60 * 60)  # 90 days ago
    last_use = current_time - (3 * 60 * 60)            # 3 hours ago
    
    options.browser_preferences = {
        # Profile metadata (critical for fingerprinting)
        'profile': {
            'created_by_version': '130.0.6723.91',      # Must match your Chrome version
            'creation_time': str(install_time),
            'last_engagement_time': str(last_use),
            'exit_type': 'Crashed',                     # 'Normal', 'Crashed', 'SessionEnded'
            'name': 'Pessoa 1',                         # Realistic profile name
            'avatar_index': 26,                         # 0-26 available avatars
            
            # Realistic content settings
            'default_content_setting_values': {
                'cookies': 1,
                'images': 1,
                'javascript': 1,
                'popups': 0,
                'notifications': 2,
                'geolocation': 0,           # Ask (not block)
                'media_stream': 0           # Ask (realistic)
            },
            
            'password_manager_enabled': False,
            'cookie_controls_mode': 0,
            'content_settings': {
                'pref_version': 1,
                'enable_quiet_permission_ui': {
                    'notifications': False
                },
                'enable_quiet_permission_ui_enabling_method': {
                    'notifications': 1
                }
            },
            
            # Security metadata
            'family_member_role': 'not_in_family',
            'managed_user_id': '',
            'were_old_google_logins_removed': True
        },
        
        # Browser usage metadata
        'browser': {
            'has_seen_welcome_page': True,
            'window_placement': {
                'work_area_bottom': 1080,
                'work_area_left': 0,
                'work_area_right': 1920,
                'work_area_top': 0
            }
        },
        
        # Installation metadata
        'countryid_at_install': 16978,              # Varies by country
        'default_apps_install_state': 3,
        
        # Extensions metadata
        'extensions': {
            'last_chrome_version': '130.0.6723.91',  # Must match your version
            'alerts': {'initialized': True},
            'theme': {'system_theme': 2}
        },
        
        # Session activity (shows regular usage)
        'in_product_help': {
            'session_start_time': str(current_time),
            'session_last_active_time': str(current_time),
            'recent_session_start_times': [
                str(current_time - (24 * 60 * 60)),
                str(current_time - (48 * 60 * 60)),
                str(current_time - (72 * 60 * 60))
            ]
        },
        
        # Session restore
        'session': {
            'restore_on_startup': 1,
            'startup_urls': ['https://www.google.com']
        },
        
        # Homepage
        'homepage': 'https://www.google.com',
        'homepage_is_newtabpage': False,
        
        # Translation history (shows multilingual usage)
        'translate': {'enabled': True},
        'translate_accepted_count': {'es': 2, 'fr': 1},
        'translate_denied_count_for_language': {'en': 1},
        
        # Spell check
        'spellcheck': {
            'dictionaries': ['en-US', 'pt-BR'],
            'dictionary': ''
        },
        
        # Languages
        'intl': {
            'selected_languages': 'en-US,en,pt-BR'
        },
        
        # Sign-in metadata
        'signin': {
            'allowed': True,
            'cookie_clear_on_exit_migration_notice_complete': True
        },
        
        # Safe Browsing (most users have this)
        'safebrowsing': {
            'enabled': True,
            'enhanced': False
        },
        
        # Autofill (common for real users)
        'autofill': {
            'enabled': True,
            'profile_enabled': True
        },
        
        # Search suggestions
        'search': {'suggest_enabled': True},
        
        # DNS prefetch
        'dns_prefetching': {'enabled': True},
        
        # Do NOT Track (usually off)
        'enable_do_not_track': False,
        
        # WebRTC (default settings)
        'webrtc': {
            'ip_handling_policy': 'default',
            'multiple_routes_enabled': True
        },
        
        # Privacy Sandbox (Google's cookie replacement - realistic users have this)
        'privacy_sandbox': {
            'first_party_sets_data_access_allowed_initialized': True,
            'm1': {
                'ad_measurement_enabled': True,
                'fledge_enabled': True,
                'row_notice_acknowledged': True,
                'topics_enabled': True
            }
        },
        
        # Media engagement
        'media': {
            'engagement': {'schema_version': 5}
        },
        
        # Web apps
        'web_apps': {
            'did_migrate_default_chrome_apps': ['app-id'],
            'last_preinstall_synchronize_version': '130'
        }
    }
    
    return options

# Usage
async def advanced_stealth():
    options = create_realistic_browser()
    
    async with Chrome(options=options) as browser:
        tab = await browser.start()
        await tab.go_to('https://advanced-bot-detection.com')
        # Browser appears as a genuine 90-day-old installation
```

!!! warning "Version Consistency is Critical"
    **Always match Chrome versions**: Ensure `profile.created_by_version` and `extensions.last_chrome_version` match your actual Chrome version. Mismatched versions are an instant red flag.
    
    ```python
    # Get your Chrome version programmatically:
    async with Chrome() as browser:
        tab = await browser.start()
        version = await browser.get_version()
        chrome_version = version['product'].split('/')[1]  # e.g., '130.0.6723.91'
        print(f"Use this version: {chrome_version}")
    ```

!!! info "What Fingerprinting Preferences Do"
    **Profile age**: `creation_time` and `last_engagement_time` prove the browser isn't a fresh install.
    
    **Usage history**: `recent_session_start_times` shows regular browsing patterns.
    
    **Translation history**: `translate_accepted_count` indicates a real person using multiple languages.
    
    **Window placement**: Realistic screen dimensions that match actual monitor resolutions.
    
    **Privacy Sandbox**: Google's new tracking system. Disabling it is unusual and suspicious.

## Performance Impact

Understanding the performance implications of browser preferences helps you optimize for your specific use case:

| Preference Category | Expected Impact | Use Case |
|---------------------|----------------|----------|
| Disable images | 50-70% faster loads | Scraping text content |
| Disable prefetch | 10-20% faster loads | Reduce bandwidth usage |
| Disable plugins | 5-10% faster loads | Security and performance |
| Block notifications | Eliminates popups | Clean automation |
| Silent downloads | Eliminates prompts | Automated file downloads |

!!! tip "Speed vs Stealth Trade-off"
    **For speed**: Disable images, prefetch, plugins, and spell check.
    
    **For stealth**: Enable Safe Browsing, autofill, search suggestions, and DNS prefetch (even though they slow things down).
    
    **Balanced approach**: Enable stealth features but disable images and plugins. This gives a 40-50% speedup while maintaining a realistic fingerprint.

## See Also

- **[Deep Dive: Browser Preferences](../../deep-dive/browser-preferences.md)** - Architectural details and internals
- **[Page Load State](page-load-state.md)** - Control when pages are considered loaded
- **[Proxy Configuration](proxy.md)** - Configure network proxies
- **[Cookies & Sessions](../browser-management/cookies-sessions.md)** - Manage browser state
- **[Chromium Source: pref_names.cc](https://chromium.googlesource.com/chromium/src/+/main/chrome/common/pref_names.cc)** - Official preference constants
- **[Chromium Source: pref_names.h](https://github.com/chromium/chromium/blob/main/chrome/common/pref_names.h)** - Header file with definitions

Custom browser preferences give you unprecedented control over browser behavior, enabling sophisticated automation, performance optimization, and privacy configuration that simply isn't possible with traditional automation tools. This level of access transforms Pydoll from a simple automation library into a complete browser control system.


================================================
FILE: docs/en/features/configuration/proxy.md
================================================
# Proxy Configuration

Proxies are essential for professional web automation, enabling you to bypass rate limits, access geo-restricted content, and maintain anonymity. Pydoll provides native proxy support with automatic authentication handling.

!!! info "Related Documentation"
    - **[Browser Options](browser-options.md)** - Command-line proxy arguments
    - **[Request Interception](../network/interception.md)** - How proxy authentication works internally
    - **[Stealth Automation](../automation/human-interactions.md)** - Combine proxies with anti-detection
    - **[Proxy Architecture Deep Dive](../../deep-dive/proxy-architecture.md)** - Network fundamentals, protocols, security, and building your own proxy

## Why Use Proxies?

Proxies provide critical capabilities for automation:

| Benefit | Description | Use Case |
|---------|-------------|----------|
| **IP Rotation** | Distribute requests across multiple IPs | Avoid rate limits, scrape at scale |
| **Geographic Access** | Access region-locked content | Test geo-targeted features, bypass restrictions |
| **Anonymity** | Hide your real IP address | Privacy-focused automation, competitor analysis |
| **Load Distribution** | Spread traffic across multiple endpoints | High-volume scraping, stress testing |
| **Ban Avoidance** | Prevent permanent IP bans | Long-running automation, aggressive scraping |

!!! tip "When to Use Proxies"
    **Always use proxies for:**
    
    - Production web scraping (>100 requests/hour)
    - Accessing geo-restricted content
    - Bypassing rate limits or IP-based blocks
    - Testing from different regions
    - Maintaining anonymity
    
    **You may skip proxies for:**
    
    - Local development and testing
    - Internal/corporate automation
    - Low-volume automation (<50 requests/day)
    - When scraping your own infrastructure

## Proxy Types

Different proxy protocols serve different purposes:

| Type | Port | Authentication | Speed | Security | Use Case |
|------|------|----------------|-------|----------|----------|
| **HTTP** | 80, 8080 | Optional | Fast | Low | Basic web scraping, non-sensitive data |
| **HTTPS** | 443, 8443 | Optional | Fast | Medium | Secure web scraping, encrypted traffic |
| **SOCKS5** | 1080, 1081 | Optional | Medium | High | Full TCP/UDP support, advanced use cases |

### HTTP/HTTPS Proxies

Standard web proxies, ideal for most automation tasks:

```python
import asyncio
from pydoll.browser.chromium import Chrome
from pydoll.browser.options import ChromiumOptions

async def http_proxy_example():
    options = ChromiumOptions()
    
    # HTTP proxy (unencrypted)
    options.add_argument('--proxy-server=http://proxy.example.com:8080')
    
    # Or HTTPS proxy (encrypted)
    # options.add_argument('--proxy-server=https://proxy.example.com:8443')
    
    async with Chrome(options=options) as browser:
        tab = await browser.start()
        
        # All traffic goes through proxy
        await tab.go_to('https://httpbin.org/ip')
        
        # Verify proxy IP
        ip = await tab.execute_script('return document.body.textContent')
        print(f"Current IP: {ip}")

asyncio.run(http_proxy_example())
```

**Pros:**

- Fast and efficient
- Wide support across services
- Easy to configure

**Cons:**

- HTTP: No encryption (traffic visible to proxy)
- Can be detected more easily than SOCKS5

### SOCKS5 Proxies

Advanced proxies with full TCP/UDP support:

```python
import asyncio
from pydoll.browser.chromium import Chrome
from pydoll.browser.options import ChromiumOptions

async def socks5_proxy_example():
    options = ChromiumOptions()
    
    # SOCKS5 proxy
    options.add_argument('--proxy-server=socks5://proxy.example.com:1080')
    
    async with Chrome(options=options) as browser:
        tab = await browser.start()
        await tab.go_to('https://httpbin.org/ip')

asyncio.run(socks5_proxy_example())
```

**Pros:**

- Protocol-agnostic (works with any TCP/UDP traffic)
- Better for advanced use cases (WebSockets, WebRTC)
- More stealthy (harder to detect)

**Cons:**

- Slightly slower than HTTP/HTTPS
- Less common in free/cheap proxy services

!!! info "SOCKS4 vs SOCKS5"
    **SOCKS5** is recommended over SOCKS4 because it:
    
    - Supports authentication (username/password)
    - Handles UDP traffic (for WebRTC, DNS, etc.)
    - Provides better error handling
    
    Use `socks5://` unless you specifically need SOCKS4 (`socks4://`).

## Authenticated Proxies

Pydoll automatically handles proxy authentication without manual intervention.

### How Authentication Works

When you provide credentials in the proxy URL, Pydoll:

1. **Intercepts the authentication challenge** using the Fetch domain
2. **Automatically responds** with credentials
3. **Continues navigation** seamlessly

This happens transparently; you don't need to handle authentication manually!

```python
import asyncio
from pydoll.browser.chromium import Chrome
from pydoll.browser.options import ChromiumOptions

async def authenticated_proxy_example():
    options = ChromiumOptions()
    
    # Proxy with authentication (username:password)
    options.add_argument('--proxy-server=http://user:pass@proxy.example.com:8080')
    
    async with Chrome(options=options) as browser:
        tab = await browser.start()
        
        # Authentication handled automatically!
        await tab.go_to('https://example.com')
        print("Connected through authenticated proxy")

asyncio.run(authenticated_proxy_example())
```

!!! tip "Credential Format"
    Include credentials directly in the proxy URL:

    - HTTP: `http://username:password@host:port`
    - HTTPS: `https://username:password@host:port`
    - SOCKS5: `socks5://username:password@host:port` (note: Chrome ignores SOCKS5 credentials; see the SOCKS5 limitation warning below)

    Pydoll automatically extracts and uses these credentials.

!!! warning "SOCKS5 Authentication Limitation"
    **Chrome does not support SOCKS5 authentication natively** ([Chromium Issue #40323993](https://issues.chromium.org/issues/40323993)). Credentials embedded in `socks5://user:pass@host:port` are silently ignored — Chrome only sends a "no authentication" greeting to the SOCKS5 proxy.

    This means Pydoll's automatic proxy auth (via `Fetch.authRequired`) **does not work for SOCKS5**, because Chrome never issues an HTTP 407 challenge for SOCKS5 connections.

    **Workaround — Local proxy forwarder:**

    Run a local SOCKS5 proxy (no auth) that forwards to the remote authenticated proxy. Pydoll provides a ready-to-use script for this:

    ```python
    import asyncio
    from pydoll.utils import SOCKS5Forwarder
    from pydoll.browser.chromium import Chrome
    from pydoll.browser.options import ChromiumOptions

    async def main():
        forwarder = SOCKS5Forwarder(
            remote_host='proxy.example.com',
            remote_port=1080,
            username='myuser',
            password='mypass',
            local_port=1081,
        )
        async with forwarder:
            options = ChromiumOptions()
            options.add_argument('--proxy-server=socks5://127.0.0.1:1081')

            async with Chrome(options=options) as browser:
                tab = await browser.start()
                await tab.go_to('https://httpbin.org/ip')

    asyncio.run(main())
    ```

    The forwarder handles the username/password handshake with the remote proxy while Chrome connects to localhost without authentication.

    For the full technical explanation of why this happens, see **[SOCKS5 Authentication Deep Dive](../../deep-dive/network/socks-proxies.md#socks5-authentication-and-chrome)**.

### Authentication Implementation Details

Pydoll uses Chrome's **Fetch domain** at the browser level to intercept and handle authentication challenges:

```python
# This is handled internally by Pydoll
# You don't need to write this code!

async def _handle_proxy_auth(event):
    """Pydoll's internal proxy authentication handler."""
    if event['params']['authChallenge']['source'] == 'Proxy':
        await browser.continue_request_with_auth(
            request_id=event['params']['requestId'],
            username='user',
            password='pass'
        )
```

!!! info "Under the Hood"
    For technical details on how Pydoll intercepts and handles proxy authentication, see:
    
    - **[Request Interception](../network/interception.md)** - Fetch domain and request handling
    - **[Event System](../advanced/event-system.md)** - Event-driven authentication

!!! warning "Fetch Domain Conflicts"
    When using **authenticated proxies** + **tab-level request interception**, be aware:
    
    - Pydoll enables Fetch at the **Browser level** for proxy auth
    - If you enable Fetch at the **Tab level**, they share the same domain
    - **Solution**: Call `tab.go_to()` once before enabling tab-level interception
    
    ```python
    async with Chrome(options=options) as browser:
        tab = await browser.start()
        
        # 1. First navigation triggers proxy auth (Browser-level Fetch)
        await tab.go_to('https://example.com')
        
        # 2. Then enable tab-level interception safely
        await tab.enable_fetch_events()
        await tab.on('Fetch.requestPaused', my_interceptor)
        
        # 3. Continue with your automation
        await tab.go_to('https://example.com/page2')
    ```
    
    See [Request Interception - Proxy + Interception](../network/interception.md#private-proxy-request-interception-fetch) for details.

## Proxy Bypass List

Exclude specific domains from using the proxy:

```python
import asyncio
from pydoll.browser.chromium import Chrome
from pydoll.browser.options import ChromiumOptions

async def proxy_bypass_example():
    options = ChromiumOptions()
    
    # Use proxy for most traffic
    options.add_argument('--proxy-server=http://proxy.example.com:8080')
    
    # But bypass proxy for these domains
    options.add_argument('--proxy-bypass-list=localhost,127.0.0.1,*.local,internal.company.com')
    
    async with Chrome(options=options) as browser:
        tab = await browser.start()
        
        # Uses proxy
        await tab.go_to('https://external-site.com')
        
        # Bypasses proxy (direct connection)
        await tab.go_to('http://localhost:8000')
        await tab.go_to('http://internal.company.com')

asyncio.run(proxy_bypass_example())
```

**Bypass list patterns:**

| Pattern | Matches | Example |
|---------|---------|---------|
| `localhost` | Localhost only | `http://localhost` |
| `127.0.0.1` | Loopback IP | `http://127.0.0.1` |
| `*.local` | All `.local` domains | `http://server.local` |
| `internal.company.com` | Specific domain | `http://internal.company.com` |
| `192.168.1.*` | IP range | `http://192.168.1.100` |

!!! tip "When to Use Bypass List"
    Bypass proxy for:
    
    - **Local development servers** (`localhost`, `127.0.0.1`)
    - **Internal company resources** (VPN, intranet)
    - **Testing environments** (`.local`, `.test` domains)
    - **High-bandwidth resources** (when proxy is slow)

## PAC (Proxy Auto-Config)

Use a PAC file for complex proxy routing rules:

```python
import asyncio
from pydoll.browser.chromium import Chrome
from pydoll.browser.options import ChromiumOptions

async def pac_proxy_example():
    options = ChromiumOptions()
    
    # Load PAC file from URL
    options.add_argument('--proxy-pac-url=http://proxy.example.com/proxy.pac')
    
    # Or use local PAC file
    # options.add_argument('--proxy-pac-url=file:///path/to/proxy.pac')
    
    async with Chrome(options=options) as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com')

asyncio.run(pac_proxy_example())
```

**Example PAC file:**

```javascript
function FindProxyForURL(url, host) {
    // Direct connection for local addresses
    if (isInNet(host, "192.168.0.0", "255.255.0.0") ||
        isInNet(host, "127.0.0.0", "255.0.0.0")) {
        return "DIRECT";
    }
    
    // Use specific proxy for certain domains
    if (dnsDomainIs(host, ".example.com")) {
        return "PROXY proxy1.example.com:8080";
    }
    
    // Default proxy for everything else
    return "PROXY proxy2.example.com:8080";
}
```

!!! info "PAC File Use Cases"
    PAC files are useful for:
    
    - **Complex routing rules** (domain-based, IP-based)
    - **Proxy failover** (try multiple proxies)
    - **Load balancing** (distribute across proxy pool)
    - **Enterprise environments** (centralized proxy management)

## Rotating Proxies

Rotate through multiple proxies for better distribution:

```python
import asyncio
from itertools import cycle
from pydoll.browser.chromium import Chrome
from pydoll.browser.options import ChromiumOptions

async def rotating_proxy_example():
    # List of proxies
    proxies = [
        'http://user:pass@proxy1.example.com:8080',
        'http://user:pass@proxy2.example.com:8080',
        'http://user:pass@proxy3.example.com:8080',
    ]
    
    # Cycle through proxies
    proxy_pool = cycle(proxies)
    
    # Scrape multiple URLs with different proxies
    urls = [
        'https://example.com/page1',
        'https://example.com/page2',
        'https://example.com/page3',
    ]
    
    for url in urls:
        # Get next proxy
        proxy = next(proxy_pool)
        
        # Configure options with this proxy
        options = ChromiumOptions()
        options.add_argument(f'--proxy-server={proxy}')
        
        # Use proxy for this browser instance
        async with Chrome(options=options) as browser:
            tab = await browser.start()
            await tab.go_to(url)
            
            title = await tab.execute_script('return document.title')
            print(f"[{proxy.split('@')[1]}] {url}: {title}")

asyncio.run(rotating_proxy_example())
```

!!! tip "Proxy Rotation Strategies"
    **Per-browser rotation** (above):

    - Each browser instance uses a different proxy
    - Best for isolation and avoiding session conflicts
    
    **Per-request rotation**:

    - More complex, requires request interception
    - See [Request Interception](../network/interception.md) for implementation

## Residential vs Datacenter Proxies

Understanding proxy types helps you choose the right service:

| Feature | Residential | Datacenter |
|---------|------------|------------|
| **IP Source** | Real residential ISPs | Data centers |
| **Legitimacy** | High (real users) | Low (known ranges) |
| **Detection Risk** | Very low | High |
| **Speed** | Medium (150-500ms) | Very fast (<50ms) |
| **Cost** | Expensive ($5-15/GB) | Cheap ($0.10-1/GB) |
| **Best For** | Anti-bot sites, e-commerce | APIs, internal tools |

### Residential Proxies

```python
import asyncio
from pydoll.browser.chromium import Chrome
from pydoll.browser.options import ChromiumOptions

async def residential_proxy_example():
    """Use residential proxy for anti-bot sites."""
    options = ChromiumOptions()
    
    # Residential proxy with high trust score
    options.add_argument('--proxy-server=http://user:pass@residential.proxy.com:8080')
    
    # Combine with stealth options
    options.add_argument('--disable-blink-features=AutomationControlled')
    options.add_argument('--user-agent=Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/130.0.0.0 Safari/537.36')
    
    async with Chrome(options=options) as browser:
        tab = await browser.start()
        
        # Access protected site
        await tab.go_to('https://protected-site.com')
        print("Successfully accessed through residential proxy")

asyncio.run(residential_proxy_example())
```

**When to use Residential:**

- Sites with strong anti-bot protection (Cloudflare, DataDome)
- E-commerce scraping (Amazon, eBay, etc.)
- Social media automation
- Financial services
- Any site that actively blocks datacenter IPs

### Datacenter Proxies

```python
import asyncio
from pydoll.browser.chromium import Chrome
from pydoll.browser.options import ChromiumOptions

async def datacenter_proxy_example():
    """Use fast datacenter proxy for APIs and unprotected sites."""
    options = ChromiumOptions()
    
    # Fast datacenter proxy
    options.add_argument('--proxy-server=http://user:pass@datacenter.proxy.com:8080')
    
    async with Chrome(options=options) as browser:
        tab = await browser.start()
        
        # Fast API scraping
        await tab.go_to('https://api.example.com/data')

asyncio.run(datacenter_proxy_example())
```

**When to use Datacenter:**

- Public APIs without rate limits
- Internal/corporate automation
- Sites without anti-bot measures
- High-volume, speed-critical scraping
- Development and testing

!!! warning "Proxy Quality Matters"
    **Bad proxies** cause more problems than they solve:
    
    - Slow response times (timeouts)
    - Connection failures (high error rates)
    - Blacklisted IPs (immediate bans)
    - Leaked real IP (privacy breach)
    
    **Invest in quality proxies** from reputable providers. Free proxies are almost never worth it.

## Testing Your Proxy

Verify proxy configuration before running production automation:

```python
import asyncio
from pydoll.browser.chromium import Chrome
from pydoll.browser.options import ChromiumOptions

async def test_proxy():
    """Test proxy connection and configuration."""
    proxy_url = 'http://user:pass@proxy.example.com:8080'
    
    options = ChromiumOptions()
    options.add_argument(f'--proxy-server={proxy_url}')
    
    try:
        async with Chrome(options=options) as browser:
            tab = await browser.start()
            
            # Test 1: Connection
            print("Testing proxy connection...")
            await tab.go_to('https://httpbin.org/ip', timeout=10)
            
            # Test 2: IP verification
            print("Verifying proxy IP...")
            ip_response = await tab.execute_script('return document.body.textContent')
            print(f"[OK] Proxy IP: {ip_response}")
            
            # Test 3: Geographic location (if available)
            await tab.go_to('https://ipapi.co/json/')
            geo_data = await tab.execute_script('return document.body.textContent')
            print(f"[OK] Geographic data: {geo_data}")
            
            # Test 4: Speed test
            import time
            start = time.time()
            await tab.go_to('https://example.com')
            load_time = time.time() - start
            print(f"[OK] Load time: {load_time:.2f}s")
            
            if load_time > 5:
                print("[WARNING] Slow proxy response time")
            
            print("\n[SUCCESS] All proxy tests passed!")
            
    except asyncio.TimeoutError:
        print("[ERROR] Proxy connection timeout")
    except Exception as e:
        print(f"[ERROR] Proxy test failed: {e}")

asyncio.run(test_proxy())
```

## Further Reading

- **[Proxy Architecture Deep Dive](../../deep-dive/proxy-architecture.md)** - Network fundamentals, TCP/UDP, HTTP/2/3, SOCKS5 internals, security analysis, and building your own proxy server
- **[Browser Options](browser-options.md)** - Command-line arguments and configuration
- **[Request Interception](../network/interception.md)** - How proxy authentication works
- **[Browser Preferences](browser-preferences.md)** - Stealth and fingerprinting
- **[Contexts](../browser-management/contexts.md)** - Using different proxies per context

!!! tip "Start Simple"
    Begin with a simple proxy setup, test thoroughly, then add complexity (rotation, retry logic, monitoring) as needed. Quality proxies are more important than complex rotation strategies.
    
    For those interested in understanding proxies at a deeper level, the **[Proxy Architecture Deep Dive](../../deep-dive/proxy-architecture.md)** provides comprehensive coverage of network protocols, security considerations, and even guides you through building your own proxy server.


================================================
FILE: docs/en/features/core-concepts.md
================================================
# Core Concepts

Understanding what makes Pydoll different starts with its foundational design decisions. These aren't just technical choices; they directly impact how you write automation scripts, what problems you can solve, and how reliable your solutions will be.

## Zero WebDrivers

One of Pydoll's most significant advantages is the complete elimination of WebDriver dependencies. If you've ever fought with "chromedriver version doesn't match Chrome version" errors or dealt with mysterious driver crashes, you'll appreciate this approach.

### How It Works

Traditional browser automation tools like Selenium rely on WebDriver executables that act as intermediaries between your code and the browser. Pydoll takes a different path by connecting directly to browsers through the Chrome DevTools Protocol (CDP).

```mermaid
graph LR
    %% Pydoll Flow
    subgraph P["Pydoll Flow"]
        direction LR
        P1["💻 Your Code"] --> P2["🪄 Pydoll"]
        P2 --> P3["🌐 Browser (via CDP)"]
    end

    %% Traditional Selenium Flow
    subgraph S["Traditional Selenium Flow"]
        direction LR
        S1["💻 Your Code"] --> S2["🔌 WebDriver Client"]
        S2 --> S3["⚙️ WebDriver Executable"]
        S3 --> S4["🌐 Browser"]
    end

```

When you start a browser with Pydoll, here's what happens under the hood:

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def main():
    # This creates a Browser instance
    browser = Chrome()
    
    # start() launches Chrome with --remote-debugging-port
    # and establishes a WebSocket connection to the CDP endpoint
    tab = await browser.start()
    
    # Now you can control the browser through CDP commands
    await tab.go_to('https://example.com')
    
    await browser.stop()

asyncio.run(main())
```

Behind the scenes, `browser.start()` does the following:

1. **Launches the browser process** with `--remote-debugging-port=<port>` flag
2. **Waits for the CDP server** to become available on that port
3. **Establishes a WebSocket connection** to `ws://localhost:<port>/devtools/...`
4. **Returns a Tab instance** ready for automation

!!! info "Want to Know More?"
    For technical details on how the browser process is managed internally, see the [Browser Domain](../deep-dive/browser-domain.md#browser-process-manager) deep dive.

### Benefits You'll Notice

**No Version Management Headaches**
```python
# With Selenium, you might see:
# SessionNotCreatedException: This version of ChromeDriver only supports Chrome version 120

# With Pydoll, you just need Chrome installed:
async with Chrome() as browser:
    tab = await browser.start()  # Works with any Chrome version
```

**Simpler Setup**
```bash
# Selenium setup:
$ pip install selenium
$ brew install chromedriver  # or download, chmod +x, add to PATH...
$ chromedriver --version     # does it match your Chrome?

# Pydoll setup:
$ pip install pydoll-python  # That's it!
```

**More Reliable**

Without WebDriver as a middle layer, there are fewer points of failure. Your code communicates directly with the browser through a well-defined protocol that Chromium developers themselves use and maintain.

### CDP: The Protocol Behind the Magic

The Chrome DevTools Protocol isn't just for Pydoll; it's the same protocol that powers Chrome DevTools when you open the inspector. This means:

- **Battle-tested reliability**: Used by millions of developers daily
- **Rich capabilities**: Everything DevTools can do, Pydoll can do
- **Active development**: Google maintains and evolves CDP continuously

!!! tip "Deep Dive: Understanding CDP"
    For a comprehensive understanding of how CDP works and why it's superior to WebDriver, see our [Chrome DevTools Protocol](../deep-dive/cdp.md) deep dive.

## Async-First Architecture

Pydoll isn't just async-compatible; it's designed from the ground up to leverage Python's `asyncio` framework. This isn't a checkbox feature; it's fundamental to how Pydoll achieves high performance.

!!! info "New to Async Programming?"
    If you're not familiar with Python's `async`/`await` syntax or asyncio concepts, we strongly recommend reading our [Understanding Async/Await](../deep-dive/connection-layer.md#understanding-asyncawait) guide first. It explains the fundamentals with practical examples that will help you understand how Pydoll's async architecture works and why it's so powerful for browser automation.

### Why Async Matters for Browser Automation

Browser automation involves a lot of waiting: pages loading, elements appearing, network requests completing. Traditional synchronous tools block during these waits, leaving your program idle until each operation finishes. Async architecture lets you do useful work while waiting.

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def scrape_page(browser, url):
    """Scrape a single page."""
    tab = await browser.new_tab()
    await tab.go_to(url)
    title = await tab.execute_script('return document.title')
    await tab.close()
    return title

async def main():
    urls = [
        'https://example.com/page1',
        'https://example.com/page2',
        'https://example.com/page3',
    ]
    
    async with Chrome() as browser:
        await browser.start()
        
        # Process all URLs concurrently!
        titles = await asyncio.gather(
            *(scrape_page(browser, url) for url in urls)
        )
        
        print(titles)

asyncio.run(main())
```

In this example, instead of scraping pages one after another (which might take 3 × 2 seconds = 6 seconds), all three pages are scraped concurrently, taking roughly 2 seconds total.

### True Concurrency vs Threading

Unlike threading-based approaches, Pydoll's async architecture runs many operations concurrently on a single event loop, interleaving them while each one waits on the browser, without the complexity of thread management:

```mermaid
sequenceDiagram
    participant Main as Main Task
    participant Tab1 as Tab 1
    participant Tab2 as Tab 2
    participant Tab3 as Tab 3
    
    Main->>Tab1: go_to(url1)
    Main->>Tab2: go_to(url2)
    Main->>Tab3: go_to(url3)
    
    Note over Tab1,Tab3: All tabs navigate concurrently
    
    Tab1-->>Main: Page 1 loaded
    Tab2-->>Main: Page 2 loaded
    Tab3-->>Main: Page 3 loaded
    
    Main->>Main: Process results
```

### Modern Python Patterns

Pydoll embraces modern Python idioms throughout:

**Context Managers**
```python
# Automatic resource cleanup
async with Chrome() as browser:
    tab = await browser.start()
    # ... do work ...
# Browser is automatically stopped when exiting context
```

**Async Context Managers for Operations**
```python
# Wait for and handle downloads
async with tab.expect_download(keep_file_at='/downloads') as dl:
    await (await tab.find(text='Download PDF')).click()
    pdf_data = await dl.read_bytes()
```

!!! tip "Deep Dive"
    Want to understand how async operations work under the hood? Check out the [Connection Layer](../deep-dive/connection-layer.md) deep dive for implementation details.

### Performance Implications

The async-first design delivers measurable performance improvements:

```python
import asyncio
import time
from pydoll.browser.chromium import Chrome

async def benchmark_concurrent():
    """Scrape 10 pages concurrently."""
    async with Chrome() as browser:
        await browser.start()
        
        start = time.time()
        tasks = [
            browser.new_tab(f'https://example.com/page{i}')
            for i in range(10)
        ]
        await asyncio.gather(*tasks)
        elapsed = time.time() - start
        
        print(f"10 pages loaded in {elapsed:.2f}s")
        # Typical result: ~2-3 seconds vs 20+ seconds sequentially

asyncio.run(benchmark_concurrent())
```

## Multi-Browser Support

Pydoll provides a unified API across all Chromium-based browsers. Write your automation once, run it anywhere.

### Supported Browsers

**Google Chrome**: Primary target with full feature support.
```python
from pydoll.browser.chromium import Chrome

async with Chrome() as browser:
    tab = await browser.start()
```

**Microsoft Edge**: Full support including Edge-specific features.
```python
from pydoll.browser.chromium import Edge

async with Edge() as browser:
    tab = await browser.start()
```

**Other Chromium Browsers**: Brave, Vivaldi, Opera, etc.
```python
from pydoll.browser.chromium import Chrome
from pydoll.browser.options import ChromiumOptions

options = ChromiumOptions()
options.binary_location = '/path/to/brave-browser'  # or any Chromium browser

async with Chrome(options=options) as browser:
    tab = await browser.start()
```

The key benefit: all Chromium-based browsers share the same API. Write your automation once, and it works across Chrome, Edge, Brave, or any other Chromium browser without code changes.

### Cross-Browser Testing

Test your automation across multiple browsers without changing code:

```python
import asyncio
from pydoll.browser.chromium import Chrome, Edge

async def test_login(browser_class, browser_name):
    """Test login flow in a specific browser."""
    async with browser_class() as browser:
        tab = await browser.start()
        await tab.go_to('https://app.example.com/login')
        
        await (await tab.find(id='username')).type_text('user@example.com')
        await (await tab.find(id='password')).type_text('password123')
        await (await tab.find(id='login-btn')).click()
        
        # Verify login success
        success = await tab.find(id='dashboard', raise_exc=False)
        print(f"{browser_name} login: {'✓' if success else '✗'}")

async def main():
    # Test in both Chrome and Edge
    await test_login(Chrome, "Chrome")
    await test_login(Edge, "Edge")

asyncio.run(main())
```

## Human-Like Behavior

Automated browsers are often detectable because they behave robotically. Pydoll includes built-in features to make interactions appear more human.

### Natural Typing

Real users don't type at perfectly consistent speeds. Pydoll's `type_text()` method includes randomized delays between keystrokes:

```python
# Type with human-like timing
username_field = await tab.find(id='username')
await username_field.type_text(
    'user@example.com',
    interval=0.1  # Average 100ms between keys, with randomization
)

# Faster typing (still human-like)
await username_field.type_text(
    'user@example.com',
    interval=0.05  # Faster but still varies
)

# Instant (robotic; use only when speed matters more than stealth)
await username_field.type_text(
    'user@example.com',
    interval=0
)
```

The `interval` parameter sets the average delay, but Pydoll adds random variance to make the timing more natural.

### Realistic Clicking

Clicks aren't just "fire and forget". Pydoll automatically dispatches all mouse events that a real user would trigger:

```python
button = await tab.find(id='submit-button')

# Default behavior: clicks center of element
# Automatically fires: mouseover, mouseenter, mousemove, mousedown, mouseup, click
await button.click()

# Click with offset (useful for avoiding detection on larger elements)
await button.click(offset_x=10, offset_y=5)
```

!!! info "Mouse Events"
    Pydoll dispatches the complete sequence of mouse events in the correct order, simulating how real browsers handle user clicks. This makes clicks more realistic compared to simple JavaScript `.click()` calls.

!!! warning "Detection Considerations"
    While human-like behavior helps avoid basic bot detection, sophisticated anti-automation systems use many signals. Combine these features with:
    
    - Realistic browser fingerprints (via browser preferences)
    - Proper proxy configuration
    - Reasonable delays between actions
    - Varied navigation patterns

## Event-Driven Design

Unlike traditional polling-based automation, Pydoll lets you react to browser events as they happen. This is more efficient and enables sophisticated interaction patterns.

### Real-Time Event Monitoring

Subscribe to browser events and execute callbacks when they fire:

```python
import asyncio
from functools import partial
from pydoll.browser.chromium import Chrome
from pydoll.protocol.page.events import PageEvent
from pydoll.protocol.network.events import NetworkEvent

async def main():
    async with Chrome() as browser:
        tab = await browser.start()
        
        # React to page load events
        async def on_page_load(event):
            print(f"Page loaded: {await tab.current_url}")
        
        await tab.enable_page_events()
        await tab.on(PageEvent.LOAD_EVENT_FIRED, on_page_load)
        
        # Monitor network requests
        async def on_request(tab, event):
            url = event['params']['request']['url']
            if '/api/' in url:
                print(f"API call: {url}")
        
        await tab.enable_network_events()
        await tab.on(NetworkEvent.REQUEST_WILL_BE_SENT, partial(on_request, tab))
        
        # Navigate and watch events fire
        await tab.go_to('https://example.com')
        await asyncio.sleep(3)  # Let events process

asyncio.run(main())
```

### Event Categories

Pydoll exposes several CDP event domains that you can subscribe to:

| Domain | Example Events |
|--------|----------------|
| **Page Events** | Load completed, navigation, JavaScript dialogs |
| **Network Events** | Request sent, response received, WebSocket activity |
| **DOM Events** | DOM changes, attribute modifications |
| **Fetch Events** | Request paused, authentication required |
| **Runtime Events** | Console messages, exceptions |

### Practical Event-Driven Patterns

**Capture API Responses**
```python
import json
from functools import partial
from pydoll.protocol.network.events import NetworkEvent

api_data = []

async def capture_api(tab, event):
    url = event['params']['response']['url']
    if '/api/data' in url:
        request_id = event['params']['requestId']
        body = await tab.get_network_response_body(request_id)
        api_data.append(json.loads(body))

await tab.enable_network_events()
await tab.on(NetworkEvent.RESPONSE_RECEIVED, partial(capture_api, tab))

# Navigate and automatically capture API responses
await tab.go_to('https://app.example.com')
await asyncio.sleep(2)

print(f"Captured {len(api_data)} API responses")
```

**Wait for Specific Conditions**
```python
import asyncio
from functools import partial
from pydoll.protocol.network.events import NetworkEvent

async def wait_for_api_call(tab, endpoint):
    """Wait for a specific API endpoint to be called."""
    event_occurred = asyncio.Event()
    
    async def check_endpoint(tab, event):
        url = event['params']['request']['url']
        if endpoint in url:
            event_occurred.set()
    
    await tab.enable_network_events()
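    # Keep the callback registered until a matching request is seen. A
    # temporary callback would be removed after the first request of any
    # kind, so a non-matching first request would leave wait() hanging.
    callback_id = await tab.on(
        NetworkEvent.REQUEST_WILL_BE_SENT,
        partial(check_endpoint, tab),
    )

    await event_occurred.wait()
    await tab.remove_callback(callback_id)  # Clean up once the endpoint was hit
    print(f"API endpoint {endpoint} was called!")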

# Usage
await wait_for_api_call(tab, '/api/users')
```

!!! info "Deep Dive: Event System Details"
    For a comprehensive guide to event handling, callback patterns, and performance considerations, see the [Event System](../deep-dive/event-system.md) deep dive.

### Event Performance

Events are powerful but come with overhead. Best practices:

```python
# ✓ Good: Enable only what you need
await tab.enable_network_events()

# ✗ Avoid: Enabling all events unnecessarily
await tab.enable_page_events()
await tab.enable_network_events()
await tab.enable_dom_events()
await tab.enable_fetch_events()
await tab.enable_runtime_events()

# ✓ Good: Filter early in callbacks
async def handle_request(event):
    url = event['params']['request']['url']
    if '/api/' not in url:
        return  # Skip non-API requests early
    # Process API request...

# ✓ Good: Disable when done
await tab.disable_network_events()
```

## Bringing It All Together

These core concepts work together to create a powerful automation framework:

```python
import asyncio
import json
from functools import partial
from pydoll.browser.chromium import Chrome
from pydoll.protocol.network.events import NetworkEvent
from pydoll.constants import Keys

async def advanced_scraping():
    """Demonstrates multiple core concepts working together."""
    async with Chrome() as browser:  # Async context manager
        tab = await browser.start()
        
        # Event-driven: Capture API data
        api_responses = []
        
        async def capture_data(tab, event):
            url = event['params']['response']['url']
            if '/api/products' in url:
                request_id = event['params']['requestId']
                body = await tab.get_network_response_body(request_id)
                api_responses.append(json.loads(body))
        
        await tab.enable_network_events()
        await tab.on(NetworkEvent.RESPONSE_RECEIVED, partial(capture_data, tab))
        
        # Navigate with zero-webdriver simplicity
        await tab.go_to('https://example.com/products')
        
        # Human-like interaction
        search = await tab.find(id='search')
        await search.type_text('laptop', interval=0.1)  # Natural typing
        await search.press_keyboard_key(Keys.ENTER)
        
        # Wait for API responses (async efficiency)
        await asyncio.sleep(2)
        
        print(f"Captured {len(api_responses)} products from API")
        return api_responses

# Multi-browser support: works with Chrome, Edge, etc.
asyncio.run(advanced_scraping())
```

These foundational concepts inform everything else in Pydoll. As you explore specific features, you'll see these principles in action, working together to create reliable, efficient, and maintainable browser automation.

---

## What's Next?

Now that you understand Pydoll's core design, you're ready to explore specific features:

- **[Element Finding](element-finding.md)** - Learn Pydoll's intuitive element location APIs
- **[Network Features](network/monitoring.md)** - Leverage the event system for network analysis
- **[Browser Management](browser-management/tabs.md)** - Use async patterns for concurrent operations

For deeper technical understanding, explore the [Deep Dive](../deep-dive/index.md) section.


================================================
FILE: docs/en/features/element-finding.md
================================================
# Element Finding

Finding elements on a web page is the foundation of browser automation. Pydoll introduces a revolutionary, intuitive approach that makes element location both more powerful and easier to use than traditional selector-based methods.

## Why Pydoll's Approach is Different

Traditional browser automation tools force you to think in terms of CSS selectors and XPath expressions from the start. Pydoll inverts this: you describe what you're looking for using natural HTML attributes, and Pydoll figures out the optimal selector strategy.

```python
# Traditional approach (other tools)
element = driver.find_element(By.XPATH, "//input[@type='email' and @name='username']")

# Pydoll's approach
element = await tab.find(tag_name="input", type="email", name="username")
```

Both find the same element, but Pydoll's syntax is clearer, more maintainable, and less error-prone.

### Element Finding Methods Overview

Pydoll offers three main approaches to find elements:

| Method | Use When | Example |
|--------|----------|---------|
| **`find()`** | You know HTML attributes | `await tab.find(id="username")` |
| **`query()`** | You have CSS/XPath selector | `await tab.query("div.content")` |
| **Traversal** | You want to explore from a known element | `await element.get_children_elements()` |

```mermaid
flowchart LR
    A[Need Element?] --> B{What do you have?}
    B -->|HTML Attributes| C[find method]
    B -->|CSS/XPath| D[query method]
    B -->|Parent Element| E[Traversal]
    
    C --> F[WebElement]
    D --> F
    E --> G[List of WebElements]
```

!!! info "Deep Dive: How It Works"
    Curious about how Pydoll implements element finding under the hood? Check out the [FindElements Mixin](../deep-dive/find-elements-mixin.md) documentation to learn about the architecture, performance optimizations, and internal selector strategies.

## The find() Method: Natural Element Selection

The `find()` method is your primary tool for locating elements. It accepts common HTML attributes as parameters and automatically builds the most efficient selector.

### Basic Usage

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def basic_finding():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com')
        
        # Find by ID (most common and fastest)
        username = await tab.find(id="username")
        
        # Find by class name
        submit_button = await tab.find(class_name="btn-primary")
        
        # Find by tag name
        first_paragraph = await tab.find(tag_name="p")
        
        # Find by name attribute
        email_field = await tab.find(name="email")
        
        # Find by text content
        login_link = await tab.find(text="Login")

asyncio.run(basic_finding())
```

### Combining Attributes for Precision

The real power of `find()` comes from combining multiple attributes to create precise selectors:

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def precise_finding():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com/form')
        
        # Combine tag name with type
        password_input = await tab.find(tag_name="input", type="password")
        
        # Combine tag, class, and custom attributes
        submit_button = await tab.find(
            tag_name="button",
            class_name="btn",
            type="submit"
        )
        
        # Use data attributes
        product_card = await tab.find(
            tag_name="div",
            data_testid="product-card",
            data_category="electronics"
        )
        
        # Combine multiple conditions
        specific_link = await tab.find(
            tag_name="a",
            class_name="nav-link",
            href="/dashboard"
        )

asyncio.run(precise_finding())
```

!!! info "Combination Logic: AND"
    Combining attributes in `find()` works as an AND operation. The element must match **all** provided attributes.
    
    For more complex scenarios requiring OR logic—like finding an element that may have either an `id` or a different `name`—the correct approach is to chain multiple `find()` calls, as demonstrated in the "Complete Example" section.

!!! tip "Attribute Naming Convention"
    Use underscores for attribute names with hyphens. For example, `data-testid` becomes `data_testid`, and `aria-label` becomes `aria_label`. Pydoll automatically converts them to the correct format.

### How find() Selects the Optimal Strategy

Pydoll automatically chooses the most efficient selector based on the attributes you provide:

| Attributes Provided | Strategy Used | Performance |
|---------------------|---------------|-------------|
| Single: `id` | `By.ID` | ⚡ Fastest |
| Single: `class_name` | `By.CLASS_NAME` | ⚡ Fast |
| Single: `name` | `By.NAME` | ⚡ Fast |
| Single: `tag_name` | `By.TAG_NAME` | ⚡ Fast |
| Single: `text` | `By.XPATH` | ⚡ Fast |
| Multiple attributes | XPath Expression | ✓ Efficient |

```mermaid
flowchart LR
    A[find attributes] --> B{Single or Multiple?}
    B -->|Single| C[Direct Selector]
    B -->|Multiple| D[Build XPath]
    C --> E[Fast Execution]
    D --> E
```

### Finding Multiple Elements

Use `find_all=True` to get a list of all matching elements:

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def find_multiple():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com/products')
        
        # Find all product cards
        products = await tab.find(class_name="product-card", find_all=True)
        print(f"Found {len(products)} products")
        
        # Find all links in navigation
        nav_links = await tab.find(
            tag_name="a",
            class_name="nav-link",
            find_all=True
        )
        
        # Process each element
        for link in nav_links:
            text = await link.text
            href = await link.get_attribute("href")
            print(f"Link: {text} → {href}")

asyncio.run(find_multiple())
```

### Waiting for Dynamic Elements

Modern web applications load content dynamically. Use `timeout` to wait for elements to appear:

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def wait_for_elements():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com/dashboard')
        
        # Wait up to 10 seconds for element to appear
        dynamic_content = await tab.find(
            class_name="dynamic-content",
            timeout=10
        )
        
        # Wait for AJAX-loaded data
        user_profile = await tab.find(
            id="user-profile",
            timeout=15
        )
        
        # Handle elements that might not appear
        optional_banner = await tab.find(
            class_name="promo-banner",
            timeout=3,
            raise_exc=False  # Returns None if not found
        )
        
        if optional_banner:
            await optional_banner.click()
        else:
            print("No promotional banner present")

asyncio.run(wait_for_elements())
```

!!! warning "Timeout Best Practices"
    Use reasonable timeout values. Too short and you'll miss slow-loading elements; too long and you'll waste time waiting for elements that don't exist. Start with 5-10 seconds for most dynamic content.

## The query() Method: Direct Selector Access

For developers who prefer traditional selectors or need more complex selection logic, the `query()` method provides direct access to CSS selectors and XPath expressions.

### CSS Selectors

CSS selectors are fast, widely understood, and perfect for most use cases:

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def css_selector_examples():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com')
        
        # Simple selectors
        main_nav = await tab.query("nav.main-menu")
        first_article = await tab.query("article:first-child")
        
        # Attribute selectors
        submit_button = await tab.query("button[type='submit']")
        required_inputs = await tab.query("input[required]", find_all=True)
        
        # Complex selectors
        nested = await tab.query("div.container > .content .item:nth-child(2)")
        
        # Pseudo-classes
        first_enabled_button = await tab.query("button:not([disabled])")

asyncio.run(css_selector_examples())
```

### XPath Expressions

XPath excels at complex relationships and text matching:

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def xpath_examples():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com/table')
        
        # Text matching
        button = await tab.query("//button[contains(text(), 'Submit')]")
        
        # Navigate to parent
        input_parent = await tab.query("//input[@name='email']/parent::div")
        
        # Find sibling elements
        label_input = await tab.query(
            "//label[text()='Email:']/following-sibling::input"
        )
        
        # Complex table queries
        edit_button = await tab.query(
            "//tr[td[text()='John Doe']]//button[@class='btn-edit']"
        )

asyncio.run(xpath_examples())
```

!!! info "CSS vs XPath: Which to Use?"
    For a comprehensive guide on choosing between CSS selectors and XPath, including syntax references and real-world examples, see the [Selectors Guide](../deep-dive/selectors-guide.md).

## DOM Traversal: Children and Siblings

Sometimes you need to explore the DOM tree from a known starting point. Pydoll provides dedicated methods for traversing element relationships.

### DOM Tree Structure

Understanding the DOM tree structure helps you choose the right traversal method:

```mermaid
graph TB
    Root[Document Root]
    Root --> Container[div id='container']
    
    Container --> Child1[div class='card']
    Container --> Child2[div class='card']
    Container --> Child3[div class='card']
    
    Child1 --> GrandChild1[h2 title]
    Child1 --> GrandChild2[p description]
    Child1 --> GrandChild3[button action]
    
    Child2 --> GrandChild4[h2 title]
    Child2 --> GrandChild5[p description]
    
    Child3 --> GrandChild6[h2 title]
```

### Getting Child Elements

The `get_children_elements()` method retrieves descendants of an element:

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def traverse_children():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com/cards')
        
        # Get container
        container = await tab.find(id="cards-container")
        
        # Get direct children only (max_depth=1)
        direct_children = await container.get_children_elements(max_depth=1)
        print(f"Container has {len(direct_children)} direct children")
        
        # Include grandchildren (max_depth=2)
        descendants = await container.get_children_elements(max_depth=2)
        print(f"Found {len(descendants)} elements up to 2 levels deep")
        
        # Filter by tag name
        links = await container.get_children_elements(
            max_depth=3,
            tag_filter=["a"]
        )
        print(f"Found {len(links)} links in container")
        
        # Combine filters for specific elements
        nav_links = await container.get_children_elements(
            max_depth=2,
            tag_filter=["a", "button"]
        )

asyncio.run(traverse_children())
```

### Getting Sibling Elements

The `get_siblings_elements()` method finds elements at the same level:

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def traverse_siblings():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com/list')
        
        # Find active item
        active_item = await tab.find(class_name="item-active")
        
        # Get all siblings (excluding active_item itself)
        all_siblings = await active_item.get_siblings_elements()
        print(f"Active item has {len(all_siblings)} siblings")
        
        # Filter siblings by tag
        link_siblings = await active_item.get_siblings_elements(
            tag_filter=["a"]
        )
        
        # Process sibling elements
        for sibling in all_siblings:
            text = await sibling.text
            print(f"Sibling: {text}")

asyncio.run(traverse_siblings())
```

!!! tip "Performance Considerations"
    DOM traversal can be expensive for large trees. Prefer shallow `max_depth` values and specific `tag_filter` parameters to minimize the number of nodes processed. For deeply nested structures, consider multiple targeted `find()` calls instead of a single deep traversal.

## Finding Elements Within Elements

Once you have an element, you can search within its scope using the same `find()` and `query()` methods.

!!! warning "Important: Search Depth Behavior"
    When you call `element.find()` or `element.query()`, Pydoll searches through **ALL descendants** (children, grandchildren, great-grandchildren, etc.), not just direct children. This is the standard behavior of `querySelector()` and matches what most developers expect.

### Understanding Search Scope

```mermaid
graph TB
    Container[div id='container']
    
    Container --> Child1[div class='card' ✓]
    Container --> Child2[div class='card' ✓]
    Container --> Child3[div class='other']
    
    Child1 --> GrandChild1[div class='card' ✓]
    Child1 --> GrandChild2[p class='text']
    
    Child3 --> GrandChild3[div class='card' ✓]
    Child3 --> GrandChild4[div class='card' ✓]
```

```python
# This finds ALL 5 elements with class='card' in the tree
# (2 direct children + 3 nested descendants)
cards = await container.find(class_name="card", find_all=True)
print(len(cards))  # Output: 5
```

### Basic Scoped Search

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def scoped_search():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com/products')
        
        # Find a product container
        product_card = await tab.find(class_name="product-card")
        
        # Search within the product card (searches ALL descendants, returns only the first match)
        product_title = await product_card.find(class_name="title")
        product_price = await product_card.find(class_name="price")
        add_button = await product_card.find(tag_name="button", text="Add to Cart")
        
        # Query within scope
        product_image = await product_card.query("img.product-image")
        
        # Find all items within a container (ALL descendants)
        nav_menu = await tab.find(class_name="nav-menu")
        menu_items = await nav_menu.find(tag_name="li", find_all=True)
        
        print(f"Menu has {len(menu_items)} items")

asyncio.run(scoped_search())
```

### Finding Only Direct Children

If you need to find **only direct children** (depth 1), use the CSS child combinator `>` or a relative XPath expression:

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def direct_children_only():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com/cards')
        
        container = await tab.find(id="cards-container")
        
        # Method 1: CSS child combinator (>)
        # Finds ONLY direct children with class='card'
        direct_cards = await container.query("> .card", find_all=True)
        print(f"Direct children: {len(direct_cards)}")
        
        # Method 2: XPath direct child
        direct_divs = await container.query("./div[@class='card']", find_all=True)
        
        # Method 3: Use get_children_elements() with max_depth=1
        # (but this only filters by tag, not by other attributes)
        direct_children = await container.get_children_elements(
            max_depth=1,
            tag_filter=["div"]
        )
        
        # Then filter manually by class
        cards_only = [
            child for child in direct_children
            if 'card' in (await child.get_attribute('class') or '')
        ]

asyncio.run(direct_children_only())
```

### Comparison: find() vs get_children_elements()

| Feature | `find()` / `query()` | `get_children_elements()` |
|---------|---------------------|---------------------------|
| **Search Depth** | ALL descendants | Configurable with `max_depth` |
| **Filter By** | Any HTML attribute | Only tag name |
| **Use Case** | Find specific elements anywhere in subtree | Explore DOM structure, get direct children |
| **Performance** | Optimized for single attribute | Good for broad exploration |
| **Parameter** | `tag_name="a"` (string) | `tag_filter=["a"]` (list) |

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def comparison_example():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com')
        
        container = await tab.find(id="container")
        
        # Scenario 1: I want ALL links anywhere in container
        # Use find() - searches all descendants
        all_links = await container.find(tag_name="a", find_all=True)
        
        # Scenario 2: I want ONLY direct child links
        # Use CSS child combinator
        direct_links = await container.query("> a", find_all=True)
        
        # Scenario 3: I want direct children with specific class
        # Use CSS child combinator
        direct_cards = await container.query("> .card", find_all=True)
        
        # Scenario 4: I want to explore the DOM structure
        # Use get_children_elements()
        direct_children = await container.get_children_elements(max_depth=1)
        
        # Scenario 5: I want all descendants up to depth 2, filtered by tag
        # Use get_children_elements()
        shallow_links = await container.get_children_elements(
            max_depth=2,
            tag_filter=["a"]
        )

asyncio.run(comparison_example())
```

!!! tip "When to Use Each Method"
    - **Use `find()`**: When you know the attributes (class, id, etc.) and want to search the entire subtree
    - **Use `query("> .class")`**: When you need only direct children with specific attributes
    - **Use `get_children_elements()`**: When exploring DOM structure or filtering by tag only

### Common Use Cases

This scoped searching is incredibly useful for working with repeating patterns like:

- Product cards in e-commerce sites
- Table rows with multiple cells
- Form sections with multiple fields
- Navigation menus with nested items

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def practical_example():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com/products')
        
        # Find all product cards on the page
        product_cards = await tab.find(class_name="product-card", find_all=True)
        
        for card in product_cards:
            # Within each card, search all descendants and take the first match for each class
            title = await card.find(class_name="product-title")
            price = await card.find(class_name="product-price")
            
            # Get the button that's anywhere inside this card
            buy_button = await card.find(tag_name="button", text="Buy Now")
            
            title_text = await title.text
            price_text = await price.text
            
            print(f"Product: {title_text}, Price: {price_text}")
            
            # Click buy button
            await buy_button.click()

asyncio.run(practical_example())
```


## Shadow DOM Support

Many modern web applications use [Shadow DOM](https://developer.mozilla.org/en-US/docs/Web/API/Web_components/Using_shadow_DOM) to encapsulate component internals. Pydoll provides seamless access to elements inside shadow trees through the `ShadowRoot` class.

### How Shadow DOM Works

```mermaid
graph TB
    Host["div#my-component (shadow host)"]
    SR["ShadowRoot (open)"]
    Internal1["button.internal-btn"]
    Internal2["input.internal-input"]

    Host --> SR
    SR --> Internal1
    SR --> Internal2
```

Elements inside a shadow root are hidden from regular DOM queries. You need to first access the shadow root, then search within it.

### Accessing Shadow Roots

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def shadow_dom_example():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com/web-components')

        # Find the shadow host element
        shadow_host = await tab.find(id='my-component')

        # Access its shadow root
        shadow_root = await shadow_host.get_shadow_root()

        # Find elements inside the shadow root using query() with CSS selectors
        button = await shadow_root.query('.internal-btn')
        await button.click()

        input_field = await shadow_root.query('input[type="email"]')
        await input_field.type_text('user@example.com')

asyncio.run(shadow_dom_example())
```

!!! warning "Use `query()` with CSS selectors inside shadow roots"
    `find()` and XPath are **not supported** on `ShadowRoot` and will raise `NotImplementedError`. Always use `query()` with CSS selectors to search inside shadow roots.

### query() with CSS Selectors

`ShadowRoot` supports `query()` with CSS selectors for element finding:

```python
# query() with CSS selectors
element = await shadow_root.query('#inner-id')
element = await shadow_root.query('button.primary')

# Complex selectors
element = await shadow_root.query('div.container > .content')

# find_all for multiple elements
items = await shadow_root.query('.item', find_all=True)

# Waiting with timeout
element = await shadow_root.query('#dynamic', timeout=5)
```

### Nested Shadow Roots

Web components can contain other web components with their own shadow roots:

```python
async def nested_shadow():
    outer_host = await tab.find(tag_name='outer-component')
    outer_shadow = await outer_host.get_shadow_root()

    inner_host = await outer_shadow.query('inner-component')
    inner_shadow = await inner_host.get_shadow_root()

    deep_button = await inner_shadow.query('.deep-btn')
    await deep_button.click()
```

### Finding Shadow Roots: find_shadow_roots()

When you need to explore which shadow roots exist on a page (useful for debugging or dynamic pages like Cloudflare challenges), use `find_shadow_roots()`:

```python
# Find all shadow roots in the page
shadow_roots = await tab.find_shadow_roots()

for sr in shadow_roots:
    print(f'Mode: {sr.mode}, Host: {sr.host_element}')
    # Search inside each shadow root
    btn = await sr.query('button', raise_exc=False)
    if btn:
        await btn.click()
```

#### Waiting for Shadow Roots: `timeout`

Shadow hosts are often injected asynchronously (e.g., Cloudflare Turnstile loading inside an OOPIF). Use `timeout` to poll until shadow roots appear:

```python
# Wait up to 10 seconds for shadow roots to appear
shadow_roots = await tab.find_shadow_roots(timeout=10)
```

The `get_shadow_root()` method on elements also supports `timeout`:

```python
# Wait for a shadow root to be attached to an element
host = await tab.find(id='my-component', timeout=5)
shadow = await host.get_shadow_root(timeout=5)
```

#### Deep Traversal: Cross-Origin IFrames (OOPIFs)

By default, `find_shadow_roots()` only traverses the main document's DOM tree (which includes same-origin iframes via `contentDocument` but **not** cross-origin iframes). Pass `deep=True` to also discover shadow roots inside cross-origin iframes (OOPIFs):

```python
# Include shadow roots from cross-origin iframes (e.g., Cloudflare Turnstile)
shadow_roots = await tab.find_shadow_roots(deep=True, timeout=10)

for sr in shadow_roots:
    print(f'Mode: {sr.mode}, Host: {sr.host_element}')
    # Elements found inside these shadow roots automatically route
    # CDP commands through the correct OOPIF session
    btn = await sr.query('input[type="checkbox"]', raise_exc=False)
    if btn:
        await btn.click()
```

!!! tip "When to use `deep=True`"
    Use `deep=True` when automating pages with cross-origin embedded widgets such as Cloudflare Turnstile captchas, third-party payment forms, or social login buttons. These widgets typically use cross-origin iframes with closed shadow roots inside them.

### Shadow Root Properties

```python
shadow_root = await element.get_shadow_root()

# Check the shadow root mode (open, closed, or user-agent)
print(shadow_root.mode)  # ShadowRootType.OPEN

# Access the host element
host = shadow_root.host_element

# Get the shadow root inner HTML
html = await shadow_root.inner_html
```

!!! note "Closed Shadow Roots"
    Closed shadow roots (`mode='closed'`) are accessible via CDP since the protocol bypasses JavaScript restrictions. However, some browser-internal shadow roots (user-agent) may have limited accessibility.

## Working with iFrames

!!! info "Complete IFrame Guide Available"
    This section covers basic iframe interaction for element finding. For a comprehensive guide including nested iframes, CAPTCHA handling, technical deep dives, and troubleshooting, see **[Working with IFrames](automation/iframes.md)**.

iFrames present a special challenge in browser automation because they have separate DOM contexts. Pydoll makes iframe interaction seamless:

```mermaid
flowchart TB
    Main[tab]
    Frame["iframe WebElement"]
    Content["elements inside iframe"]

    Main -->|"query('iframe')"| Frame
    Frame -->|"query('button#submit')"| Content
```

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def iframe_interaction():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com/page-with-iframe')

        iframe = await tab.query("iframe.embedded-content", timeout=10)

        # WebElement helpers run inside the iframe automatically
        iframe_button = await iframe.find(tag_name="button", class_name="submit")
        await iframe_button.click()

        iframe_input = await iframe.find(id="captcha-input")
        await iframe_input.type_text("verification-code")

        # Nested iframe? Keep chaining
        inner_iframe = await iframe.find(tag_name="iframe")
        download_link = await inner_iframe.find(text="Download PDF")
        await download_link.click()

asyncio.run(iframe_interaction())
```

!!! note "Screenshots in iframes"
    `tab.take_screenshot()` only works on the top-level target. Capture iframe content by targeting an element inside the frame and calling `element.take_screenshot()`.

## Error Handling Strategies

Robust automation requires handling cases where elements don't exist or take longer to appear than expected.

### Element Finding Flow with Error Handling

```mermaid
flowchart TB
    Start[Start Finding Element] --> Immediate[Try Immediate Find]
    
    Immediate --> Found1{Element Found?}
    Found1 -->|Yes| Return1[Return WebElement]
    Found1 -->|No & timeout=0| Check1{raise_exc=True?}
    Found1 -->|No & timeout>0| Wait[Start Waiting Loop]
    
    Check1 -->|Yes| Error1[Raise ElementNotFound]
    Check1 -->|No| ReturnNone[Return None]
    
    Wait --> Sleep[Wait 0.5 seconds]
    Sleep --> TryAgain[Try Finding Again]
    TryAgain --> Found2{Element Found?}
    
    Found2 -->|Yes| Return2[Return WebElement]
    Found2 -->|No| TimeCheck{Timeout Exceeded?}
    
    TimeCheck -->|No| Sleep
    TimeCheck -->|Yes| Check2{raise_exc=True?}
    
    Check2 -->|Yes| Error2[Raise WaitElementTimeout]
    Check2 -->|No| ReturnNone2[Return None]
```

### Using raise_exc Parameter

Control whether to raise an exception when elements aren't found:

```python
import asyncio
from pydoll.browser.chromium import Chrome
from pydoll.exceptions import ElementNotFound

async def error_handling():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com')
        
        # Raise exception if not found (default behavior)
        try:
            critical_element = await tab.find(id="must-exist")
        except ElementNotFound:
            print("Critical element missing! Cannot continue.")
            return
        
        # Return None if not found (optional elements)
        optional_banner = await tab.find(
            class_name="promo-banner",
            raise_exc=False
        )
        
        if optional_banner:
            print("Banner found, closing it")
            close_button = await optional_banner.find(class_name="close-btn")
            await close_button.click()
        else:
            print("No banner present, continuing")

asyncio.run(error_handling())
```

## Best Practices

### 1. Prefer Stable Selectors

Use attributes that are unlikely to change:

```python
# Good: Semantic attributes
await tab.find(id="user-profile")  # IDs are usually stable
await tab.find(data_testid="submit-button")  # Test IDs are designed for automation
await tab.find(name="username")  # Form names are stable

# Avoid: Structural dependencies
await tab.query("div > div > div:nth-child(3) > input")  # Brittle, breaks easily
```

### 2. Use the Simplest Selector That Works

Start simple and add complexity only when needed:

```python
# Good: Simple and clear
await tab.find(id="login-form")

# Unnecessary: Over-complicated
await tab.query("//div[@id='content']/descendant::form[@id='login-form']")
```

### 3. Choose the Right Method

- Use `find()` for simple attribute-based searches
- Use `query()` for complex CSS or XPath patterns
- Use traversal methods for exploring from known anchors

```python
# Use find() for straightforward cases
username = await tab.find(id="username")

# Use query() for complex patterns
active_nav_link = await tab.query("nav.menu a.active")

# Use traversal for relationship-based searches
container = await tab.find(id="cards")
child_links = await container.get_children_elements(tag_filter=["a"])
```

### 4. Add Meaningful Timeouts

Don't use zero timeouts for dynamic content, and don't wait forever for optional elements:

```python
# Good: Reasonable timeouts
critical_data = await tab.find(id="data", timeout=10)
optional_popup = await tab.find(class_name="popup", timeout=2, raise_exc=False)

# Bad: No timeout for dynamic content
dynamic_element = await tab.find(class_name="ajax-loaded")  # Raises immediately if the element has not loaded yet

# Bad: Very long timeout for optional element
banner = await tab.find(class_name="ad-banner", timeout=60)  # Wastes time
```

### 5. Handle Errors Gracefully

Plan for elements that might not exist:

```python
# Critical elements: let exceptions bubble up
submit_button = await tab.find(id="submit-btn")

# Optional elements: handle explicitly
cookie_notice = await tab.find(class_name="cookie-notice", raise_exc=False)
if cookie_notice:
    accept_button = await cookie_notice.find(text="Accept")
    await accept_button.click()
```

## Complete Example: Form Automation

Here's a complete example combining multiple element finding techniques:

```python
import asyncio
from pydoll.browser.chromium import Chrome
from pydoll.exceptions import ElementNotFound

async def automate_registration_form():
    async with Chrome() as browser:
        tab = await browser.start()
        
        try:
            # Navigate to registration page
            await tab.go_to('https://example.com/register', timeout=10)
            
            # Handle optional cookie banner
            cookie_banner = await tab.find(
                class_name="cookie-banner",
                timeout=2,
                raise_exc=False
            )
            if cookie_banner:
                accept = await cookie_banner.find(text="Accept")
                await accept.click()
                await asyncio.sleep(1)
            
            # Fill out the registration form
            # Find form fields
            username_field = await tab.find(name="username", timeout=5)
            email_field = await tab.find(name="email")
            password_field = await tab.find(type="password", name="password")
            confirm_password = await tab.find(type="password", name="confirm_password")
            
            # Enter information
            await username_field.type_text("john_doe_2024", interval=0.1)
            await email_field.type_text("john@example.com", interval=0.1)
            await password_field.type_text("SecurePass123!", interval=0.1)
            await confirm_password.type_text("SecurePass123!", interval=0.1)
            
            # Find and check terms checkbox
            # Try multiple strategies
            terms_checkbox = await tab.find(id="terms", raise_exc=False)
            if not terms_checkbox:
                terms_checkbox = await tab.find(name="accept_terms", raise_exc=False)
            if not terms_checkbox:
                terms_checkbox = await tab.query("input[type='checkbox']")
            
            await terms_checkbox.click()
            
            # Find and click submit button
            submit_button = await tab.find(
                tag_name="button",
                type="submit",
                timeout=2
            )
            await submit_button.click()
            
            # Wait for success message with longer timeout (form processing)
            success_message = await tab.find(
                class_name="success-message",
                timeout=15
            )
            
            message_text = await success_message.text
            print(f"Registration successful: {message_text}")
            
            # Verify redirect to dashboard
            await asyncio.sleep(2)
            current_url = await tab.current_url
            
            if "dashboard" in current_url:
                print("Successfully redirected to dashboard")
                
                # Find welcome message
                welcome = await tab.find(class_name="welcome-message", timeout=5)
                welcome_text = await welcome.text
                print(f"Welcome message: {welcome_text}")
            else:
                print(f"Unexpected URL after registration: {current_url}")
                
        except ElementNotFound as e:
            print(f"Element not found: {e}")
            # Take screenshot for debugging
            await tab.take_screenshot("error_screenshot.png")
        except Exception as e:
            print(f"Unexpected error: {e}")
            await tab.take_screenshot("unexpected_error.png")

asyncio.run(automate_registration_form())
```

## Learn More

Want to dive deeper into element finding?

- **[FindElements Mixin Deep Dive](../deep-dive/find-elements-mixin.md)**: Learn about the architecture, internal selector strategies, and performance optimizations
- **[Selectors Guide](../deep-dive/selectors-guide.md)**: Comprehensive guide to CSS selectors and XPath with syntax references and real-world examples
- **[WebElement Domain](../deep-dive/webelement-domain.md)**: Understand what you can do with elements once you've found them

Element finding is the foundation of successful browser automation. Master these techniques, and you'll be able to reliably locate any element on any web page, no matter how complex the structure.


================================================
FILE: docs/en/features/index.md
================================================
# Features Guide

Welcome to Pydoll's comprehensive features documentation! This is where you'll discover everything that makes Pydoll a powerful and flexible browser automation tool. Whether you're just starting out or looking to leverage advanced capabilities, you'll find detailed guides, practical examples, and best practices for each feature.

## What You'll Find Here

This guide is organized into logical sections that reflect your automation journey: from basic concepts to advanced techniques. Each page is designed to be self-contained, so you can jump directly to what interests you or follow along sequentially.

## Core Concepts

Before diving into specific features, it's worth understanding what sets Pydoll apart. These foundational concepts inform how the entire library works.

**[Core Concepts](core-concepts.md)**: Discover the architectural decisions that make Pydoll different: the zero-webdriver approach that eliminates compatibility headaches, the async-first design that enables true concurrent operations, and native support for multiple Chromium-based browsers.

## Element Finding & Interaction

Finding and interacting with page elements is the bread and butter of automation. Pydoll makes this surprisingly intuitive with modern APIs that just make sense.

**[Element Finding](element-finding.md)**: Master Pydoll's element location strategies, from the intuitive `find()` method that uses natural HTML attributes, to the powerful `query()` method for CSS selectors and XPath. You'll also learn about DOM traversal helpers that let you navigate the page structure efficiently.

## Automation Capabilities

These are the features that bring your automation to life: simulating user interactions, keyboard control, handling file operations, working with iframes, and capturing visual content.

**[Human-Like Interactions](automation/human-interactions.md)**: Learn how to create interactions that feel genuinely human: typing with natural timing variations, clicking with realistic mouse movements, and using keyboard shortcuts just like a real user would. This is crucial for avoiding detection in automation-sensitive sites.

**[Keyboard Control](automation/keyboard-control.md)**: Master keyboard interactions with comprehensive support for key combinations, modifiers, and special keys. Essential for forms, shortcuts, and accessibility testing.

**[File Operations](automation/file-operations.md)**: File handling can be tricky in browser automation. Pydoll provides robust solutions for both uploads and downloads, with the `expect_download` context manager offering elegant handling of asynchronous download completion.

**[IFrame Interaction](automation/iframes.md)**: Treat iframes like regular elements—find the iframe and keep searching inside it. No extra targets, no extra tabs.

**[Screenshots & PDF](automation/screenshots-and-pdfs.md)**: Capture visual content from your automation sessions. Whether you need full-page screenshots for visual regression testing, element-specific captures for debugging, or PDF exports for archival, Pydoll has you covered.

## Network Features

Pydoll's network capabilities are where it truly shines, giving you unprecedented visibility and control over HTTP traffic.

**[Network Monitoring](network/monitoring.md)**: Observe and analyze all network activity in your browser session. Extract API responses, track request timing, identify failed requests, and understand exactly what data is being exchanged. Essential for debugging, testing, and data extraction.

**[Request Interception](network/interception.md)**: Go beyond observation to actively modify network behavior. Block unwanted resources, inject custom headers, modify request payloads, or even fulfill requests with mock data. This is powerful for testing, optimization, and privacy control.

**[Browser-Context HTTP Requests](network/http-requests.md)**: Make HTTP requests that execute within the browser's JavaScript context, automatically inheriting session state, cookies, and authentication. This hybrid approach combines the familiarity of Python's `requests` library with browser-context execution benefits.

## Browser Management

Effective browser and tab management is essential for complex automation scenarios, parallel processing, and multi-user testing.

**[Multi-Tab Management](browser-management/tabs.md)**: Work with multiple browser tabs simultaneously, ensuring efficient resource usage while giving you full control over tab lifecycle, detection of user-opened tabs, and concurrent scraping operations.

**[Browser Contexts](browser-management/contexts.md)**: Create completely isolated browsing environments within a single browser process. Each context maintains separate cookies, storage, cache, and permissions: perfect for multi-account testing, A/B testing, or parallel scraping with different configurations.


**[Cookies & Sessions](browser-management/cookies-sessions.md)**: Manage session state at both browser and tab levels. Set cookies programmatically, extract session data, and maintain different sessions across browser contexts for sophisticated testing scenarios.


## Configuration

Customize every aspect of browser behavior to match your automation needs, from low-level Chromium preferences to command-line arguments and page loading strategies.

**[Browser Options](configuration/browser-options.md)**: Configure Chromium's launch parameters, command-line arguments, and page load state control. Fine-tune browser behavior, enable experimental features, and optimize performance for your automation needs.

**[Browser Preferences](configuration/browser-preferences.md)**: Direct access to Chromium's internal preference system gives you control over hundreds of settings. Configure downloads, disable features, optimize performance, or create realistic browser fingerprints for stealth automation.

**[Proxy Configuration](configuration/proxy.md)**: Native proxy support with full authentication capabilities. Essential for web scraping projects requiring IP rotation, geo-targeted testing, or privacy-focused automation.


## Advanced Features

These sophisticated capabilities address complex automation challenges and specialized use cases.

**[Behavioral Captcha Bypass](advanced/behavioral-captcha-bypass.md)**: Pydoll's native behavioral captcha handling is one of its most requested features. Learn how to interact with Cloudflare Turnstile, reCAPTCHA v3, and hCaptcha invisible challenges using two approaches - synchronous context manager for guaranteed completion, and background processing for non-blocking operation.

**[Event System](advanced/event-system.md)**: Build reactive automation that responds to browser events in real-time. Monitor page loads, network activity, DOM changes, and JavaScript execution to create intelligent, adaptive automation scripts.

**[Remote Connections](advanced/remote-connections.md)**: Connect to already-running browsers via WebSocket for hybrid automation scenarios. Perfect for CI/CD pipelines, containerized environments, or integrating Pydoll into existing CDP tooling.


## How to Use This Guide

Each feature page follows a consistent structure:

1. **Overview** - What the feature does and why it matters
2. **Basic Usage** - Get started quickly with simple examples
3. **Advanced Patterns** - Leverage the feature's full potential
4. **Best Practices** - Tips for effective and efficient usage
5. **Common Pitfalls** - Learn from common mistakes

Feel free to explore features in any order based on your needs. Code examples are complete and ready to run - just copy, paste, and adapt to your use case.

Ready to dive deep into Pydoll's capabilities? Pick a feature that interests you and start exploring! 🚀


================================================
FILE: docs/en/features/network/http-requests.md
================================================
# Browser-Context HTTP Requests

Make HTTP requests that automatically inherit your browser's session state, cookies, and authentication. Perfect for hybrid automation combining UI navigation with API efficiency.

!!! tip "Game Changer for Hybrid Automation"
    Ever wished you could make HTTP requests that automatically get all your browser's cookies and authentication? Now you can! The `tab.request` property gives you a beautiful `requests`-like interface that executes HTTP calls **directly in the browser's JavaScript context**.

## Why Use Browser-Context Requests?

Traditional automation often requires you to extract cookies and headers manually to make API calls. Browser-context requests eliminate this hassle:

| Traditional Approach | Browser-Context Requests |
|---------------------|-------------------------|
| Extract cookies manually | Cookies inherited automatically |
| Manage session tokens | Session state preserved |
| Handle CORS separately | CORS policies respected |
| Juggle two HTTP clients | One unified interface |
| Sync authentication state | Always authenticated |

**Perfect for:**

- Scraping authenticated APIs after login via UI
- Hybrid workflows mixing browser interaction and API calls
- Testing authenticated endpoints without token management
- Bypassing complex authentication flows
- Working with single-page applications (SPAs)

## Quick Start

The simplest example: log in via the UI, then make authenticated API calls:

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def hybrid_automation():
    async with Chrome() as browser:
        tab = await browser.start()
        
        # 1. Login normally through the UI
        await tab.go_to('https://example.com/login')
        await (await tab.find(id='username')).type_text('user@example.com')
        await (await tab.find(id='password')).type_text('password123')
        await (await tab.find(id='login-btn')).click()
        
        # Wait for redirect after login
        await asyncio.sleep(2)
        
        # 2. Now make API calls with the authenticated session!
        response = await tab.request.get('https://example.com/api/user/profile')
        user_data = response.json()
        
        print(f"Logged in as: {user_data['name']}")
        print(f"Email: {user_data['email']}")

asyncio.run(hybrid_automation())
```

!!! success "No Cookie Management Required"
    Notice how we didn't extract or pass any cookies? The request automatically inherited the browser's authenticated session!

## Common Use Cases

### 1. Scraping Authenticated APIs

Use the UI to log in, then hammer APIs for data extraction:

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def scrape_user_data():
    async with Chrome() as browser:
        tab = await browser.start()
        
        # Login via UI (handles complex auth flows)
        await tab.go_to('https://app.example.com/login')
        await (await tab.find(id='email')).type_text('user@example.com')
        await (await tab.find(id='password')).type_text('password')
        await (await tab.find(type='submit')).click()
        await asyncio.sleep(2)
        
        # Now extract data via API (much faster than scraping UI)
        all_users = []
        for page in range(1, 6):
            response = await tab.request.get(
                f'https://app.example.com/api/users',
                params={'page': str(page), 'limit': '100'}
            )
            users = response.json()['users']
            all_users.extend(users)
            print(f"Page {page}: fetched {len(users)} users")
        
        print(f"Total users scraped: {len(all_users)}")

asyncio.run(scrape_user_data())
```

### 2. Testing Protected Endpoints

Test API endpoints without managing authentication tokens:

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def test_api_endpoints():
    async with Chrome() as browser:
        tab = await browser.start()
        
        # Authenticate once
        await tab.go_to('https://api.example.com/login')
        # ... perform login ...
        await asyncio.sleep(2)
        
        # Test multiple endpoints
        endpoints = [
            '/api/users/me',
            '/api/settings',
            '/api/notifications',
            '/api/dashboard/stats'
        ]
        
        for endpoint in endpoints:
            response = await tab.request.get(f'https://api.example.com{endpoint}')
            
            if response.ok:
                print(f"Success {endpoint}: {response.status_code}")
            else:
                print(f"Failed {endpoint}: {response.status_code}")
                print(f"   Error: {response.text[:100]}")

asyncio.run(test_api_endpoints())
```

### 3. Submitting Forms via API

Fill forms faster by posting directly to the API:

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def bulk_form_submission():
    async with Chrome() as browser:
        tab = await browser.start()
        
        # Login first
        await tab.go_to('https://crm.example.com/login')
        # ... login logic ...
        await asyncio.sleep(2)
        
        # Submit multiple entries via API (much faster than filling forms)
        contacts = [
            {'name': 'John Doe', 'email': 'john@example.com', 'company': 'Acme Inc'},
            {'name': 'Jane Smith', 'email': 'jane@example.com', 'company': 'Tech Corp'},
            {'name': 'Bob Wilson', 'email': 'bob@example.com', 'company': 'StartupXYZ'},
        ]
        
        for contact in contacts:
            response = await tab.request.post(
                'https://crm.example.com/api/contacts',
                json=contact
            )
            
            if response.ok:
                print(f"Added: {contact['name']}")
            else:
                print(f"Failed: {contact['name']} - {response.status_code}")

asyncio.run(bulk_form_submission())
```

### 4. Downloading Files with Session

Download files that require authentication:

```python
import asyncio
from pathlib import Path
from pydoll.browser.chromium import Chrome

async def download_authenticated_file():
    async with Chrome() as browser:
        tab = await browser.start()
        
        # Authenticate
        await tab.go_to('https://portal.example.com/login')
        # ... login logic ...
        await asyncio.sleep(2)
        
        # Download file that requires authentication
        response = await tab.request.get(
            'https://portal.example.com/api/reports/monthly.pdf'
        )
        
        if response.ok:
            # Save the file
            output_path = Path('/tmp/monthly_report.pdf')
            output_path.write_bytes(response.content)
            print(f"Downloaded: {output_path} ({len(response.content)} bytes)")
        else:
            print(f"Download failed: {response.status_code}")

asyncio.run(download_authenticated_file())
```

### 5. Working with Custom Headers

Add custom headers to your requests:

```python
import asyncio
from pydoll.browser.chromium import Chrome
from pydoll.protocol.fetch.types import HeaderEntry

async def custom_headers_example():
    async with Chrome() as browser:
        tab = await browser.start()
        
        # Login first
        await tab.go_to('https://api.example.com/login')
        # ... login logic ...
        
        # Make request with custom headers
        headers: list[HeaderEntry] = [
            {'name': 'X-API-Version', 'value': '2.0'},
            {'name': 'X-Request-ID', 'value': 'unique-id-123'},
            {'name': 'Accept-Language', 'value': 'pt-BR,pt;q=0.9'},
        ]
        
        response = await tab.request.get(
            'https://api.example.com/data',
            headers=headers
        )
        
        print(f"Status: {response.status_code}")
        print(f"Data: {response.json()}")

asyncio.run(custom_headers_example())
```

### 6. Handling Different Response Types

Access response data in multiple formats:

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def response_formats():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://api.example.com')
        
        # JSON response
        json_response = await tab.request.get('/api/users/1')
        user = json_response.json()
        print(f"JSON: {user}")
        
        # Text response
        text_response = await tab.request.get('/api/status')
        status_text = text_response.text
        print(f"Text: {status_text}")
        
        # Binary response (e.g., image)
        image_response = await tab.request.get('/api/avatar/1')
        image_bytes = image_response.content
        print(f"Binary: {len(image_bytes)} bytes")
        
        # Check response status
        if json_response.ok:
            print("Request successful!")
        
        # Access response URL (useful after redirects)
        print(f"Final URL: {json_response.url}")

asyncio.run(response_formats())
```

## HTTP Methods

All standard HTTP methods are supported:

### GET - Retrieve Data

```python
# Simple GET
response = await tab.request.get('https://api.example.com/users')

# GET with query parameters
response = await tab.request.get(
    'https://api.example.com/search',
    params={'q': 'python', 'limit': '10'}
)
```

### POST - Create Resources

```python
# POST with JSON data
response = await tab.request.post(
    'https://api.example.com/users',
    json={'name': 'John Doe', 'email': 'john@example.com'}
)

# POST with form data
response = await tab.request.post(
    'https://api.example.com/login',
    data={'username': 'john', 'password': 'secret'}
)
```

### PUT - Update Resources

```python
# Update entire resource
response = await tab.request.put(
    'https://api.example.com/users/123',
    json={'name': 'Jane Doe', 'email': 'jane@example.com', 'role': 'admin'}
)
```

### PATCH - Partial Updates

```python
# Update specific fields
response = await tab.request.patch(
    'https://api.example.com/users/123',
    json={'email': 'newemail@example.com'}
)
```

### DELETE - Remove Resources

```python
# Delete a resource
response = await tab.request.delete('https://api.example.com/users/123')
```

### HEAD - Get Headers Only

```python
# Check if resource exists without downloading it
response = await tab.request.head('https://example.com/large-file.zip')
print(f"Content-Length: {response.headers}")
```

### OPTIONS - Check Capabilities

```python
# Check allowed methods
response = await tab.request.options('https://api.example.com/users')
print(f"Allowed methods: {response.headers}")
```

!!! info "How Does This Work?"
    Browser-context requests execute HTTP calls directly in the browser's JavaScript context using the Fetch API, while monitoring CDP network events to capture comprehensive metadata (headers, cookies, timing).
    
    For a detailed explanation of the internal architecture, event monitoring, and implementation details, see [Browser Requests Architecture](../../deep-dive/browser-requests-architecture.md).

## Response Object

The `Response` object provides a familiar interface similar to `requests.Response`:

```python
response = await tab.request.get('https://api.example.com/users')

# Status code
print(response.status_code)  # 200, 404, 500, etc.

# Check if successful (2xx or 3xx)
if response.ok:
    print("Success!")

# Response body
text_data = response.text      # As string
byte_data = response.content   # As bytes
json_data = response.json()    # Parsed JSON

# Headers
for header in response.headers:
    print(f"{header['name']}: {header['value']}")

# Request headers (what was actually sent)
for header in response.request_headers:
    print(f"{header['name']}: {header['value']}")

# Cookies set by the response
for cookie in response.cookies:
    print(f"{cookie['name']} = {cookie['value']}")

# Final URL (after redirects)
print(response.url)

# Raise exception for error status codes
response.raise_for_status()  # Raises HTTPError if 4xx or 5xx
```

!!! note "Redirects and URL Tracking"
    The `response.url` property contains only the **final URL** after all redirects. If you need to track the complete redirect chain (intermediate URLs, status codes, timing), use [Network Monitoring](monitoring.md) to observe all requests in detail.

## Headers and Cookies

### Working with Headers

Headers are represented as `HeaderEntry` objects:

```python
import asyncio
from pydoll.browser.chromium import Chrome
from pydoll.protocol.fetch.types import HeaderEntry

async def header_example():
    async with Chrome() as browser:
        tab = await browser.start()
        
        # Using HeaderEntry type for IDE autocomplete and type checking
        headers: list[HeaderEntry] = [
            {'name': 'Authorization', 'value': 'Bearer token-123'},
            {'name': 'X-Custom-Header', 'value': 'custom-value'},
        ]
        
        response = await tab.request.get(
            'https://api.example.com/protected',
            headers=headers
        )
        
        # Inspect response headers (also HeaderEntry typed dicts)
        for header in response.headers:
            if header['name'] == 'Content-Type':
                print(f"Content-Type: {header['value']}")

asyncio.run(header_example())
```

!!! tip "Type Hints for Headers"
    `HeaderEntry` is a `TypedDict` from `pydoll.protocol.fetch.types`. Using it as a type hint gives you:
    
    - **Autocomplete**: IDE suggests `name` and `value` keys
    - **Type safety**: Catch typos and missing keys before running
    - **Documentation**: Clear structure for headers
    
    While you can pass plain dictionaries, using the type hint improves code quality and IDE support.

!!! tip "Custom Headers Behavior"
    Custom headers are sent **alongside** the browser's automatic headers (like `User-Agent`, `Accept`, `Referer`, etc.). 
    
    If you try to set a standard browser header (e.g., `User-Agent`), the behavior depends on the specific header; some may be overridden, others ignored, and some may cause conflicts. For most use cases, stick to custom headers (e.g., `X-API-Key`, `Authorization`) to avoid unexpected behavior.

### Understanding Cookies

Cookies are automatically managed by the browser:

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def cookie_example():
    async with Chrome() as browser:
        tab = await browser.start()
        
        # First request sets cookies
        login_response = await tab.request.post(
            'https://api.example.com/login',
            json={'username': 'user', 'password': 'pass'}
        )
        
        # Check cookies set by server
        print("Cookies set by server:")
        for cookie in login_response.cookies:
            print(f"  {cookie['name']} = {cookie['value']}")
        
        # Subsequent requests automatically include cookies
        profile_response = await tab.request.get(
            'https://api.example.com/profile'
        )
        # No need to pass cookies - browser handles it!
        
        print(f"Profile data: {profile_response.json()}")

asyncio.run(cookie_example())
```

## Comparison with Traditional Requests

| Feature | `requests` Library | Browser-Context Requests |
|---------|-------------------|-------------------------|
| **Session Management** | Manual cookie handling | Automatic via browser |
| **Authentication** | Extract and pass tokens | Inherited from browser |
| **CORS** | Not applicable | Browser enforces policies |
| **JavaScript** | Cannot execute | Full access to browser context |
| **Cookie Jar** | Separate instance | Browser's native cookie store |
| **Headers** | Manually set | Browser auto-adds standard headers |
| **Use Case** | Server-side scripts | Browser automation |
| **Setup** | External library | Built into Pydoll |

## See Also

- **[Browser Requests Architecture](../../deep-dive/browser-requests-architecture.md)** - Internal implementation and architecture
- **[Network Monitoring](monitoring.md)** - Observe all network traffic
- **[Request Interception](interception.md)** - Modify requests before they're sent
- **[Event System](../advanced/event-system.md)** - React to browser events
- **[Deep Dive: Network Capabilities](../../deep-dive/network-capabilities.md)** - Technical details

Browser-context requests are a game-changer for hybrid automation. Combine the power of UI automation with the speed of direct API calls, all while maintaining perfect session continuity!


================================================
FILE: docs/en/features/network/interception.md
================================================
# Request Interception

Request interception allows you to intercept, modify, block, or mock HTTP requests and responses in real-time. This is essential for testing, performance optimization, content filtering, and simulating various network conditions.

!!! info "Network vs Fetch Domain"
    **Network domain** is for passive monitoring (observing traffic). **Fetch domain** is for active interception (modifying/blocking requests). This guide focuses on interception. For passive monitoring, see [Network Monitoring](monitoring.md).

## Understanding Request Interception

When you enable request interception, Pydoll pauses matching requests before they're sent to the server (or after receiving the response). You then have three options:

1. **Continue**: Let the request proceed (optionally with modifications)
2. **Block**: Fail the request with an error
3. **Mock**: Fulfill the request with a custom response

```mermaid
sequenceDiagram
    participant Browser
    participant Pydoll
    participant Server
    
    Browser->>Pydoll: Request initiated
    Note over Pydoll: Request Paused
    Pydoll->>Pydoll: Callback executed
    
    alt Continue
        Pydoll->>Server: Forward request
        Server-->>Browser: Response
    else Block
        Pydoll-->>Browser: Error response
    else Mock
        Pydoll-->>Browser: Custom response
    end
```

!!! warning "Performance Impact"
    Request interception adds latency to every matching request. Only intercept what you need and disable when done to avoid slowing down page loads.

## Enabling Request Interception

Before intercepting requests, you must enable the Fetch domain:

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def main():
    async with Chrome() as browser:
        tab = await browser.start()
        
        # Enable fetch events (intercepts all requests by default)
        await tab.enable_fetch_events()
        
        await tab.go_to('https://example.com')
        
        # Disable when done
        await tab.disable_fetch_events()

asyncio.run(main())
```

### Selective Interception

You can filter which requests to intercept by resource type:

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def selective_interception():
    async with Chrome() as browser:
        tab = await browser.start()
        
        # Only intercept image requests
        await tab.enable_fetch_events(
            resource_type='Image'  # Or 'Stylesheet', 'Script', etc.
        )
        
        await tab.go_to('https://example.com')
        await tab.disable_fetch_events()

asyncio.run(selective_interception())
```

!!! tip "Resource Types"
    See the [Resource Types Reference](#resource-types-reference) section for a complete list of interceptable resource types.

## Intercepting Requests

Use the `RequestPaused` event to intercept requests:

```python
import asyncio
from pydoll.browser.chromium import Chrome
from pydoll.protocol.fetch.events import FetchEvent, RequestPausedEvent

async def basic_interception():
    async with Chrome() as browser:
        tab = await browser.start()
        
        # Callback with type hint for IDE support
        async def handle_request(event: RequestPausedEvent):
            request_id = event['params']['requestId']
            url = event['params']['request']['url']
            
            print(f"Intercepted: {url}")
            
            # Continue the request without modifications
            await tab.continue_request(request_id)
        
        await tab.enable_fetch_events()
        await tab.on(FetchEvent.REQUEST_PAUSED, handle_request)
        
        await tab.go_to('https://example.com')
        await asyncio.sleep(3)
        
        await tab.disable_fetch_events()

asyncio.run(basic_interception())
```

!!! info "Type Hints for Better IDE Support"
    Use type hints like `RequestPausedEvent` to get autocomplete for event keys. All event types are in `pydoll.protocol.fetch.events`.

!!! note "Production-Ready Waiting"
    The examples in this guide use `asyncio.sleep()` for simplicity. In production code, consider using more explicit waiting strategies like waiting for specific elements or implementing network idle detection. See the [Network Monitoring](monitoring.md) guide for advanced techniques.

## Common Use Cases

### 1. Blocking Resources to Save Bandwidth

Block images, stylesheets, or other resources to speed up page loads:

```python
import asyncio
from pydoll.browser.chromium import Chrome
from pydoll.protocol.fetch.events import FetchEvent, RequestPausedEvent
from pydoll.protocol.network.types import ErrorReason

async def block_images():
    async with Chrome() as browser:
        tab = await browser.start()
        
        blocked_count = 0
        
        async def block_resource(event: RequestPausedEvent):
            nonlocal blocked_count
            request_id = event['params']['requestId']
            resource_type = event['params']['resourceType']
            url = event['params']['request']['url']
            
            # Block images and stylesheets
            if resource_type in ['Image', 'Stylesheet']:
                blocked_count += 1
                print(f"🚫 Blocked {resource_type}: {url[:60]}")
                await tab.fail_request(request_id, ErrorReason.BLOCKED_BY_CLIENT)
            else:
                # Continue other requests
                await tab.continue_request(request_id)
        
        await tab.enable_fetch_events()
        await tab.on(FetchEvent.REQUEST_PAUSED, block_resource)
        
        await tab.go_to('https://example.com')
        await asyncio.sleep(3)
        
        print(f"\n📊 Total blocked: {blocked_count} resources")
        
        await tab.disable_fetch_events()

asyncio.run(block_images())
```

### 2. Modifying Request Headers

Add, modify, or remove headers before requests are sent:

```python
import asyncio
from pydoll.browser.chromium import Chrome
from pydoll.protocol.fetch.events import FetchEvent, RequestPausedEvent
from pydoll.protocol.fetch.types import HeaderEntry

async def modify_headers():
    async with Chrome() as browser:
        tab = await browser.start()
        
        async def add_custom_headers(event: RequestPausedEvent):
            request_id = event['params']['requestId']
            url = event['params']['request']['url']
            
            # Only modify API requests
            if '/api/' in url:
                # Build custom headers (using HeaderEntry type hint for IDE support)
                headers: list[HeaderEntry] = [
                    {'name': 'X-Custom-Header', 'value': 'MyValue'},
                    {'name': 'Authorization', 'value': 'Bearer my-token-123'},
                ]
                
                print(f"✨ Modified headers for: {url}")
                await tab.continue_request(request_id, headers=headers)
            else:
                await tab.continue_request(request_id)
        
        await tab.enable_fetch_events()
        await tab.on(FetchEvent.REQUEST_PAUSED, add_custom_headers)
        
        await tab.go_to('https://your-app.com')
        await asyncio.sleep(3)
        
        await tab.disable_fetch_events()

asyncio.run(modify_headers())
```

!!! tip "Type Hints for Headers"
    `HeaderEntry` is a `TypedDict` from `pydoll.protocol.fetch.types`. Using it as a type hint gives you IDE autocomplete for `name` and `value` keys. You can also use plain dictionaries without the type hint.

!!! tip "Header Management"
    When you provide custom headers, they **replace** all existing headers. Make sure to include necessary headers like `User-Agent`, `Accept`, etc., if needed.

### 3. Mocking API Responses

Replace real API responses with custom mock data:

```python
import asyncio
import json
import base64
from pydoll.browser.chromium import Chrome
from pydoll.protocol.fetch.events import FetchEvent, RequestPausedEvent
from pydoll.protocol.fetch.types import HeaderEntry

async def mock_api_responses():
    async with Chrome() as browser:
        tab = await browser.start()
        
        async def mock_response(event: RequestPausedEvent):
            request_id = event['params']['requestId']
            url = event['params']['request']['url']
            
            # Mock specific API endpoint
            if '/api/users' in url:
                # Create mock response data
                mock_data = {
                    'users': [
                        {'id': 1, 'name': 'Mock User 1'},
                        {'id': 2, 'name': 'Mock User 2'},
                    ],
                    'total': 2
                }
                
                # Convert to JSON and base64-encode
                body_json = json.dumps(mock_data)
                body_base64 = base64.b64encode(body_json.encode()).decode()
                
                # Response headers
                headers: list[HeaderEntry] = [
                    {'name': 'Content-Type', 'value': 'application/json'},
                    {'name': 'Access-Control-Allow-Origin', 'value': '*'},
                ]
                
                print(f"🎭 Mocked response for: {url}")
                await tab.fulfill_request(
                    request_id=request_id,
                    response_code=200,
                    response_headers=headers,
                    body=body_base64,
                    response_phrase='OK'
                )
            else:
                # Continue other requests normally
                await tab.continue_request(request_id)
        
        await tab.enable_fetch_events()
        await tab.on(FetchEvent.REQUEST_PAUSED, mock_response)
        
        await tab.go_to('https://your-app.com')
        await asyncio.sleep(3)
        
        await tab.disable_fetch_events()

asyncio.run(mock_api_responses())
```

!!! warning "Base64 Encoding Required"
    The `body` parameter in `fulfill_request()` must be base64-encoded. Use Python's `base64` module to encode your response data.

### 4. Modifying Request URLs

Redirect requests to different URLs:

```python
import asyncio
from pydoll.browser.chromium import Chrome
from pydoll.protocol.fetch.events import FetchEvent, RequestPausedEvent

async def redirect_requests():
    async with Chrome() as browser:
        tab = await browser.start()
        
        async def redirect_url(event: RequestPausedEvent):
            request_id = event['params']['requestId']
            original_url = event['params']['request']['url']
            
            # Redirect CDN requests to local server
            if 'cdn.example.com' in original_url:
                new_url = original_url.replace(
                    'cdn.example.com',
                    'localhost:8080'
                )
                print(f"🔀 Redirected: {original_url} → {new_url}")
                await tab.continue_request(request_id, url=new_url)
            else:
                await tab.continue_request(request_id)
        
        await tab.enable_fetch_events()
        await tab.on(FetchEvent.REQUEST_PAUSED, redirect_url)
        
        await tab.go_to('https://example.com')
        await asyncio.sleep(3)
        
        await tab.disable_fetch_events()

asyncio.run(redirect_requests())
```

### 5. Modifying Request Body

Modify POST data before sending:

```python
import asyncio
import base64
from pydoll.browser.chromium import Chrome
from pydoll.protocol.fetch.events import FetchEvent, RequestPausedEvent

async def modify_post_data():
    async with Chrome() as browser:
        tab = await browser.start()
        
        async def modify_body(event: RequestPausedEvent):
            request_id = event['params']['requestId']
            method = event['params']['request']['method']
            url = event['params']['request']['url']
            
            # Modify POST requests
            if method == 'POST' and '/api/submit' in url:
                # Create new POST data
                new_data = '{"modified": true, "timestamp": 123456789}'
                post_data_base64 = base64.b64encode(new_data.encode()).decode()
                
                print(f"✏️  Modified POST data for: {url}")
                await tab.continue_request(
                    request_id,
                    post_data=post_data_base64
                )
            else:
                await tab.continue_request(request_id)
        
        await tab.enable_fetch_events()
        await tab.on(FetchEvent.REQUEST_PAUSED, modify_body)
        
        await tab.go_to('https://your-app.com/form')
        await asyncio.sleep(3)
        
        await tab.disable_fetch_events()

asyncio.run(modify_post_data())
```

### 6. Handling Authentication Challenges

Manually respond to HTTP authentication challenges (Basic Auth, Digest Auth, etc.):

```python
import asyncio
from pydoll.browser.chromium import Chrome
from pydoll.protocol.fetch.events import FetchEvent, AuthRequiredEvent
from pydoll.protocol.fetch.types import AuthChallengeResponseType

async def handle_auth():
    async with Chrome() as browser:
        tab = await browser.start()
        
        async def respond_to_auth(event: AuthRequiredEvent):
            request_id = event['params']['requestId']
            auth_challenge = event['params']['authChallenge']
            
            print(f"🔐 Auth challenge from: {auth_challenge['origin']}")
            print(f"   Scheme: {auth_challenge['scheme']}")
            print(f"   Realm: {auth_challenge.get('realm', 'N/A')}")
            
            # Provide credentials for the authentication challenge
            await tab.continue_with_auth(
                request_id=request_id,
                auth_challenge_response=AuthChallengeResponseType.PROVIDE_CREDENTIALS,
                proxy_username='myuser',
                proxy_password='mypassword'
            )
        
        # Enable with auth handling
        await tab.enable_fetch_events(handle_auth=True)
        await tab.on(FetchEvent.AUTH_REQUIRED, respond_to_auth)
        
        await tab.go_to('https://httpbin.org/basic-auth/myuser/mypassword')
        await asyncio.sleep(3)
        
        await tab.disable_fetch_events()

asyncio.run(handle_auth())
```

!!! note "Automatic Proxy Authentication"
    **Pydoll automatically handles proxy authentication** (407 Proxy Authentication Required) when you configure proxy credentials via browser options. This example demonstrates **manual handling** of authentication challenges, which is useful for:
    
    - HTTP Basic/Digest Authentication from servers (401 Unauthorized)
    - Custom authentication flows
    - Dynamic credential selection based on the challenge
    - Testing authentication failure scenarios
    
    For standard proxy usage, simply configure your proxy credentials in browser options - no manual handling needed!

### 7. Simulating Network Errors

Test how your application handles network failures:

```python
import asyncio
from pydoll.browser.chromium import Chrome
from pydoll.protocol.fetch.events import FetchEvent, RequestPausedEvent
from pydoll.protocol.network.types import ErrorReason

async def simulate_errors():
    async with Chrome() as browser:
        tab = await browser.start()
        
        request_count = 0
        
        async def fail_some_requests(event: RequestPausedEvent):
            nonlocal request_count
            request_id = event['params']['requestId']
            url = event['params']['request']['url']
            
            request_count += 1
            
            # Fail every 3rd request
            if request_count % 3 == 0:
                print(f"❌ Simulating timeout for: {url[:60]}")
                await tab.fail_request(request_id, ErrorReason.TIMED_OUT)
            else:
                await tab.continue_request(request_id)
        
        await tab.enable_fetch_events()
        await tab.on(FetchEvent.REQUEST_PAUSED, fail_some_requests)
        
        await tab.go_to('https://example.com')
        await asyncio.sleep(3)
        
        await tab.disable_fetch_events()

asyncio.run(simulate_errors())
```

## Request Stages

You can intercept requests at different stages:

```python
import asyncio
from pydoll.browser.chromium import Chrome
from pydoll.protocol.fetch.types import RequestStage

async def intercept_responses():
    async with Chrome() as browser:
        tab = await browser.start()
        
        # Intercept responses instead of requests
        await tab.enable_fetch_events(request_stage=RequestStage.RESPONSE)
        
        # Now you can modify responses before they reach the page
        await tab.go_to('https://example.com')
        await asyncio.sleep(3)
        
        await tab.disable_fetch_events()

asyncio.run(intercept_responses())
```

| Stage | When Intercepted | Use Cases |
|-------|------------------|-----------|
| `Request` (default) | Before request is sent | Modify headers, block requests, change URL |
| `Response` | After response received | Modify response body, change status codes |

!!! tip "Response Interception"
    When intercepting at the `Request` stage, you can pass `intercept_response=True` to `continue_request()` to also pause that specific request again at the `Response` stage.

## Resource Types Reference

| Resource Type | Description | Common File Extensions |
|---------------|-------------|------------------------|
| `Document` | HTML documents | `.html` |
| `Stylesheet` | CSS files | `.css` |
| `Image` | Image resources | `.jpg`, `.png`, `.gif`, `.webp`, `.svg` |
| `Media` | Audio/video | `.mp4`, `.webm`, `.mp3`, `.ogg` |
| `Font` | Web fonts | `.woff`, `.woff2`, `.ttf`, `.otf` |
| `Script` | JavaScript | `.js` |
| `TextTrack` | Subtitles | `.vtt`, `.srt` |
| `XHR` | XMLHttpRequest | AJAX requests |
| `Fetch` | Fetch API | Modern API calls |
| `EventSource` | Server-Sent Events | Real-time streams |
| `WebSocket` | WebSocket | Bidirectional communication |
| `Manifest` | Web app manifest | PWA configuration |
| `Other` | Other types | Miscellaneous |

## Error Reasons Reference

Use these with `fail_request()` to simulate different network failures:

| Error Reason | Description | Use Case |
|--------------|-------------|----------|
| `FAILED` | Generic failure | General error |
| `ABORTED` | Request aborted | User cancelled |
| `TIMED_OUT` | Request timeout | Network timeout |
| `ACCESS_DENIED` | Access denied | Permission error |
| `CONNECTION_CLOSED` | Connection closed | Server disconnect |
| `CONNECTION_RESET` | Connection reset | Network reset |
| `CONNECTION_REFUSED` | Connection refused | Server unreachable |
| `NAME_NOT_RESOLVED` | DNS failure | Invalid hostname |
| `INTERNET_DISCONNECTED` | No internet | Offline mode |
| `BLOCKED_BY_CLIENT` | Client blocked | Ad blocker simulation |
| `BLOCKED_BY_RESPONSE` | Response blocked | CORS/CSP violation |

## Best Practices

### 1. Always Continue or Fail Requests

```python
# Good: Every paused request is handled
async def handle_request(event: RequestPausedEvent):
    request_id = event['params']['requestId']
    try:
        # Your logic here
        await tab.continue_request(request_id)
    except Exception as e:
        # Fail on error to prevent hanging
        await tab.fail_request(request_id, ErrorReason.FAILED)

# Bad: Request might hang if callback raises exception
async def handle_request(event: RequestPausedEvent):
    request_id = event['params']['requestId']
    # If this raises, request hangs forever
    await tab.continue_request(request_id)
```

### 2. Use Selective Interception

```python
# Good: Only intercept what you need
await tab.enable_fetch_events(resource_type='Image')

# Bad: Intercepts everything, slows down all requests
await tab.enable_fetch_events()
```

### 3. Disable When Done

```python
# Good: Clean up after yourself
await tab.enable_fetch_events()
# ... do work ...
await tab.disable_fetch_events()

# Bad: Leaves interception enabled
await tab.enable_fetch_events()
# ... do work ...
# (never disabled)
```

### 4. Handle Errors Gracefully

```python
# Good: Wrap in try/except
async def safe_handler(event: RequestPausedEvent):
    request_id = event['params']['requestId']
    try:
        # Complex logic that might fail
        modified_url = transform_url(event['params']['request']['url'])
        await tab.continue_request(request_id, url=modified_url)
    except Exception as e:
        print(f"Error handling request: {e}")
        # Continue without modifications on error
        await tab.continue_request(request_id)
```

## Complete Example: Advanced Request Control

Here's a complete example combining multiple interception techniques:

```python
import asyncio
import base64
import json
from pydoll.browser.chromium import Chrome
from pydoll.protocol.fetch.events import FetchEvent, RequestPausedEvent
from pydoll.protocol.fetch.types import HeaderEntry
from pydoll.protocol.network.types import ErrorReason

async def advanced_interception():
    async with Chrome() as browser:
        tab = await browser.start()
        
        stats = {
            'blocked': 0,
            'mocked': 0,
            'modified': 0,
            'continued': 0
        }
        
        async def intelligent_handler(event: RequestPausedEvent):
            request_id = event['params']['requestId']
            url = event['params']['request']['url']
            resource_type = event['params']['resourceType']
            method = event['params']['request']['method']
            
            try:
                # Block ads and trackers
                if any(tracker in url for tracker in ['analytics', 'ads', 'tracking']):
                    stats['blocked'] += 1
                    print(f"🚫 Blocked tracker: {url[:50]}")
                    await tab.fail_request(request_id, ErrorReason.BLOCKED_BY_CLIENT)
                
                # Mock API responses
                elif '/api/config' in url:
                    stats['mocked'] += 1
                    mock_config = {'feature_x': True, 'debug_mode': False}
                    body = base64.b64encode(json.dumps(mock_config).encode()).decode()
                    headers: list[HeaderEntry] = [
                        {'name': 'Content-Type', 'value': 'application/json'},
                    ]
                    print(f"🎭 Mocked config API")
                    await tab.fulfill_request(
                        request_id, 200, headers, body, 'OK'
                    )
                
                # Add auth headers to API requests
                elif '/api/' in url and method == 'GET':
                    stats['modified'] += 1
                    headers: list[HeaderEntry] = [
                        {'name': 'Authorization', 'value': 'Bearer token-123'},
                    ]
                    print(f"✨ Added auth to: {url[:50]}")
                    await tab.continue_request(request_id, headers=headers)
                
                # Continue everything else normally
                else:
                    stats['continued'] += 1
                    await tab.continue_request(request_id)
                    
            except Exception as e:
                print(f"⚠️  Error handling request: {e}")
                # Always continue on error to prevent hanging
                await tab.continue_request(request_id)
        
        # Enable interception
        await tab.enable_fetch_events()
        await tab.on(FetchEvent.REQUEST_PAUSED, intelligent_handler)
        
        # Navigate
        await tab.go_to('https://example.com')
        await asyncio.sleep(5)
        
        # Print stats
        print(f"\n📊 Interception Statistics:")
        print(f"   Blocked: {stats['blocked']}")
        print(f"   Mocked: {stats['mocked']}")
        print(f"   Modified: {stats['modified']}")
        print(f"   Continued: {stats['continued']}")
        print(f"   Total: {sum(stats.values())}")
        
        # Cleanup
        await tab.disable_fetch_events()

asyncio.run(advanced_interception())
```

## See Also

- **[Network Monitoring](monitoring.md)** - Passive network traffic observation
- **[CDP Fetch Domain](../../deep-dive/network-capabilities.md#fetch-domain)** - Deep dive into the Fetch domain
- **[Event System](../advanced/event-system.md)** - Understanding Pydoll's event architecture

Request interception is a powerful tool for testing, optimization, and mocking. Master these techniques to build robust, efficient browser automation scripts.


================================================
FILE: docs/en/features/network/monitoring.md
================================================
# Network Monitoring

Network monitoring in Pydoll allows you to observe and analyze HTTP requests, responses, and other network activity during browser automation. This is essential for debugging, performance analysis, API testing, and understanding how web applications communicate with servers.

!!! info "Network vs Fetch Domain"
    **Network domain** is for passive monitoring (observing traffic). **Fetch domain** is for active interception (modifying requests/responses). This guide focuses on monitoring. For request interception, see **[Request Interception](interception.md)**.

## Enabling Network Events

Before you can monitor network activity, you must enable the Network domain:

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def main():
    async with Chrome() as browser:
        tab = await browser.start()
        
        # Enable network monitoring
        await tab.enable_network_events()
        
        # Now navigate
        await tab.go_to('https://api.github.com')
        
        # Don't forget to disable when done (optional but recommended)
        await tab.disable_network_events()

asyncio.run(main())
```

!!! warning "Enable Before Navigation"
    Always enable network events **before** navigating to capture all requests. Requests made before enabling won't be captured.

## Getting Network Logs

Pydoll automatically stores network logs when network events are enabled. You can retrieve them using `get_network_logs()`:

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def analyze_requests():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.enable_network_events()
        
        # Navigate to a page
        await tab.go_to('https://httpbin.org/json')
        
        # Wait for page to fully load
        await asyncio.sleep(2)
        
        # Get all network logs
        logs = await tab.get_network_logs()
        
        print(f"Total requests captured: {len(logs)}")
        
        for log in logs:
            request = log['params']['request']
            print(f"→ {request['method']} {request['url']}")

asyncio.run(analyze_requests())
```

!!! note "Production-Ready Waiting"
    The examples in this guide use fixed `asyncio.sleep()` delays for simplicity. In production code, consider using more explicit waiting strategies:
    
    - Wait for specific elements to appear
    - Use the [Event System](../advanced/event-system.md) to detect when all resources have loaded
    - Implement network idle detection (see Real-Time Network Monitoring section)
    
    This ensures your automation waits exactly as long as needed, no more, no less.

### Filtering Network Logs

You can filter logs by URL pattern:

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def filter_logs_example():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.enable_network_events()
        await tab.go_to('https://example.com')
        await asyncio.sleep(2)
        
        # Get all logs
        all_logs = await tab.get_network_logs()
        
        # Get logs for specific domain
        api_logs = await tab.get_network_logs(filter='api.example.com')
        
        # Get logs for specific endpoint
        user_logs = await tab.get_network_logs(filter='/api/users')

asyncio.run(filter_logs_example())
```

## Understanding Network Event Structure

Network logs contain detailed information about each request. Here's the structure:

### RequestWillBeSentEvent

This event is fired when a request is about to be sent:

```python
{
    'method': 'Network.requestWillBeSent',
    'params': {
        'requestId': 'unique-request-id',
        'loaderId': 'loader-id',
        'documentURL': 'https://example.com',
        'request': {
            'url': 'https://api.example.com/data',
            'method': 'GET',  # or 'POST', 'PUT', 'DELETE', etc.
            'headers': {
                'User-Agent': 'Chrome/...',
                'Accept': 'application/json',
                ...
            },
            'postData': '...',  # Only present for POST/PUT requests
            'initialPriority': 'High',
            'referrerPolicy': 'strict-origin-when-cross-origin'
        },
        'timestamp': 1234567890.123,
        'wallTime': 1234567890.123,
        'initiator': {
            'type': 'script',  # or 'parser', 'other'
            'stack': {...}  # Call stack if initiated from script
        },
        'type': 'XHR',  # Resource type: Document, Script, Image, XHR, etc.
        'frameId': 'frame-id',
        'hasUserGesture': False
    }
}
```

### Key Fields Reference

| Field | Location | Type | Description |
|-------|----------|------|-------------|
| `requestId` | `params.requestId` | `str` | Unique identifier for this request |
| `url` | `params.request.url` | `str` | Complete request URL |
| `method` | `params.request.method` | `str` | HTTP method (GET, POST, etc.) |
| `headers` | `params.request.headers` | `dict` | Request headers |
| `postData` | `params.request.postData` | `str` | Request body (POST/PUT) |
| `timestamp` | `params.timestamp` | `float` | Monotonic time when request started |
| `type` | `params.type` | `str` | Resource type (Document, XHR, Image, etc.) |
| `initiator` | `params.initiator` | `dict` | What triggered this request |

## Getting Response Bodies

To get the actual response content, use `get_network_response_body()`:

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def fetch_api_response():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.enable_network_events()
        
        # Navigate to API endpoint
        await tab.go_to('https://httpbin.org/json')
        await asyncio.sleep(2)
        
        # Get all requests
        logs = await tab.get_network_logs()
        
        for log in logs:
            request_id = log['params']['requestId']
            url = log['params']['request']['url']
            
            # Only get response for JSON endpoint
            if 'httpbin.org/json' in url:
                try:
                    # Get response body
                    response_body = await tab.get_network_response_body(request_id)
                    print(f"Response from {url}:")
                    print(response_body)
                except Exception as e:
                    print(f"Could not get response body: {e}")

asyncio.run(fetch_api_response())
```

!!! warning "Response Body Availability"
    Response bodies are only available for requests that have completed. Also, some response types (like images or redirects) may not have accessible bodies.

## Practical Use Cases

### 1. API Testing and Validation

Monitor API calls to verify correct requests are being made:

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def validate_api_calls():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.enable_network_events()
        
        # Navigate to your app
        await tab.go_to('https://your-app.com')
        
        # Trigger some action that makes API calls
        button = await tab.find(id='load-data-button')
        await button.click()
        await asyncio.sleep(2)
        
        # Get API logs
        api_logs = await tab.get_network_logs(filter='/api/')
        
        print(f"\n📊 API Calls Summary:")
        print(f"Total API calls: {len(api_logs)}")
        
        for log in api_logs:
            request = log['params']['request']
            method = request['method']
            url = request['url']
            
            # Check if correct auth header is present
            headers = request.get('headers', {})
            has_auth = 'Authorization' in headers or 'authorization' in headers
            
            print(f"\n{method} {url}")
            print(f"  ✓ Has Authorization: {has_auth}")
            
            # Validate POST data if applicable
            if method == 'POST' and 'postData' in request:
                print(f"  📤 Body: {request['postData'][:100]}...")

asyncio.run(validate_api_calls())
```

### 2. Performance Analysis

Build a timeline of when each request started, relative to the first request, to see the order and spacing of resource loading:

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def analyze_performance():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.enable_network_events()
        
        await tab.go_to('https://example.com')
        await asyncio.sleep(5)
        
        logs = await tab.get_network_logs()
        
        # Store timing data
        timings = []
        
        for log in logs:
            params = log['params']
            request_id = params['requestId']
            url = params['request']['url']
            resource_type = params.get('type', 'Other')
            
            timings.append({
                'url': url,
                'type': resource_type,
                'timestamp': params['timestamp']
            })
        
        # Sort by timestamp
        timings.sort(key=lambda x: x['timestamp'])
        
        print("\n⏱️  Request Timeline:")
        start_time = timings[0]['timestamp'] if timings else 0
        
        for timing in timings[:20]:  # Show first 20
            elapsed = (timing['timestamp'] - start_time) * 1000  # Convert to ms
            print(f"{elapsed:7.0f}ms | {timing['type']:12} | {timing['url'][:80]}")

asyncio.run(analyze_performance())
```

### 3. Detecting External Resources

Find every domain your page requests resources from (including its own) and count the requests made to each:

```python
import asyncio
from urllib.parse import urlparse
from collections import Counter
from pydoll.browser.chromium import Chrome

async def analyze_domains():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.enable_network_events()
        
        await tab.go_to('https://news.ycombinator.com')
        await asyncio.sleep(5)
        
        logs = await tab.get_network_logs()
        
        # Count requests per domain
        domains = Counter()
        
        for log in logs:
            url = log['params']['request']['url']
            try:
                domain = urlparse(url).netloc
                if domain:
                    domains[domain] += 1
            except:
                pass
        
        print("\n🌐 External Domains:")
        for domain, count in domains.most_common(10):
            print(f"  {count:3} requests | {domain}")

asyncio.run(analyze_domains())
```

### 4. Monitoring Specific Resource Types

Track specific types of resources like images or scripts:

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def track_resource_types():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.enable_network_events()
        
        await tab.go_to('https://example.com')
        await asyncio.sleep(3)
        
        logs = await tab.get_network_logs()
        
        # Group by resource type
        by_type = {}
        
        for log in logs:
            params = log['params']
            resource_type = params.get('type', 'Other')
            url = params['request']['url']
            
            if resource_type not in by_type:
                by_type[resource_type] = []
            
            by_type[resource_type].append(url)
        
        print("\n📦 Resources by Type:")
        for rtype in sorted(by_type.keys()):
            urls = by_type[rtype]
            print(f"\n{rtype}: {len(urls)} resource(s)")
            for url in urls[:3]:  # Show first 3
                print(f"  • {url}")
            if len(urls) > 3:
                print(f"  ... and {len(urls) - 3} more")

asyncio.run(track_resource_types())
```

## Real-Time Network Monitoring

For real-time monitoring, use event callbacks instead of polling `get_network_logs()`:

!!! info "Understanding Events"
    Real-time monitoring uses Pydoll's event system to react to network activity as it happens. For a deep dive into how events work, see **[Event System](../advanced/event-system.md)**.

```python
import asyncio
from pydoll.browser.chromium import Chrome
from pydoll.protocol.network.events import (
    NetworkEvent,
    RequestWillBeSentEvent,
    ResponseReceivedEvent,
    LoadingFailedEvent
)

async def real_time_monitoring():
    async with Chrome() as browser:
        tab = await browser.start()
        
        # Statistics
        stats = {
            'requests': 0,
            'responses': 0,
            'failed': 0
        }
        
        # Request callback
        async def on_request(event: RequestWillBeSentEvent):
            stats['requests'] += 1
            url = event['params']['request']['url']
            method = event['params']['request']['method']
            print(f"→ {method:6} | {url}")
        
        # Response callback
        async def on_response(event: ResponseReceivedEvent):
            stats['responses'] += 1
            response = event['params']['response']
            status = response['status']
            url = response['url']
            
            # Color code by status
            if 200 <= status < 300:
                color = '\033[92m'  # Green
            elif 300 <= status < 400:
                color = '\033[93m'  # Yellow
            else:
                color = '\033[91m'  # Red
            reset = '\033[0m'
            
            print(f"← {color}{status}{reset} | {url}")
        
        # Failed callback
        async def on_failed(event: LoadingFailedEvent):
            stats['failed'] += 1
            error = event['params']['errorText']
            print(f"✗ FAILED: {error}")
        
        # Enable and register callbacks
        await tab.enable_network_events()
        await tab.on(NetworkEvent.REQUEST_WILL_BE_SENT, on_request)
        await tab.on(NetworkEvent.RESPONSE_RECEIVED, on_response)
        await tab.on(NetworkEvent.LOADING_FAILED, on_failed)
        
        # Navigate
        await tab.go_to('https://example.com')
        await asyncio.sleep(5)
        
        print(f"\n📊 Summary:")
        print(f"  Requests: {stats['requests']}")
        print(f"  Responses: {stats['responses']}")
        print(f"  Failed: {stats['failed']}")

asyncio.run(real_time_monitoring())
```

## Resource Types Reference

Pydoll captures the following resource types:

| Type | Description | Examples |
|------|-------------|----------|
| `Document` | Main HTML documents | Page loads, iframe sources |
| `Stylesheet` | CSS files | External .css files (inline styles generate no request) |
| `Image` | Image resources | .jpg, .png, .gif, .webp, .svg |
| `Media` | Audio/video files | .mp4, .webm, .mp3, .ogg |
| `Font` | Web fonts | .woff, .woff2, .ttf, .otf |
| `Script` | JavaScript files | External .js files (inline scripts generate no request) |
| `TextTrack` | Subtitle files | .vtt, .srt |
| `XHR` | XMLHttpRequest | AJAX requests, legacy API calls |
| `Fetch` | Fetch API requests | Modern API calls |
| `EventSource` | Server-Sent Events | Real-time streams |
| `WebSocket` | WebSocket connections | Bidirectional communication |
| `Manifest` | Web app manifests | PWA configuration |
| `Other` | Other resource types | Miscellaneous |

## Advanced: Extracting Response Timing

Network events include detailed timing information:

```python
import asyncio
from pydoll.browser.chromium import Chrome
from pydoll.protocol.network.events import NetworkEvent, ResponseReceivedEvent

async def analyze_timing():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.enable_network_events()
        
        # Custom callback to capture timing
        timing_data = []
        
        async def on_response(event: ResponseReceivedEvent):
            response = event['params']['response']
            timing = response.get('timing')
            
            if timing:
                # Calculate different phases
                dns_time = timing.get('dnsEnd', 0) - timing.get('dnsStart', 0)
                connect_time = timing.get('connectEnd', 0) - timing.get('connectStart', 0)
                ssl_time = timing.get('sslEnd', 0) - timing.get('sslStart', 0)
                send_time = timing.get('sendEnd', 0) - timing.get('sendStart', 0)
                wait_time = timing.get('receiveHeadersStart', 0) - timing.get('sendEnd', 0)
                receive_time = timing.get('receiveHeadersEnd', 0) - timing.get('receiveHeadersStart', 0)
                
                timing_data.append({
                    'url': response['url'][:50],
                    'dns': dns_time if dns_time > 0 else 0,
                    'connect': connect_time if connect_time > 0 else 0,
                    'ssl': ssl_time if ssl_time > 0 else 0,
                    'send': send_time,
                    'wait': wait_time,
                    'receive': receive_time,
                    'total': receive_time + wait_time + send_time
                })
        
        await tab.on(NetworkEvent.RESPONSE_RECEIVED, on_response)
        await tab.go_to('https://github.com')
        await asyncio.sleep(5)
        
        # Print timing breakdown
        print("\n⏱️  Request Timing Breakdown (ms):")
        print(f"{'URL':<50} | {'DNS':>6} | {'Connect':>8} | {'SSL':>6} | {'Send':>6} | {'Wait':>6} | {'Receive':>8} | {'Total':>7}")
        print("-" * 120)
        
        for data in sorted(timing_data, key=lambda x: x['total'], reverse=True)[:10]:
            print(f"{data['url']:<50} | {data['dns']:6.1f} | {data['connect']:8.1f} | {data['ssl']:6.1f} | "
                  f"{data['send']:6.1f} | {data['wait']:6.1f} | {data['receive']:8.1f} | {data['total']:7.1f}")

asyncio.run(analyze_timing())
```

## Timing Fields Explanation

| Phase | Fields | Description |
|-------|--------|-------------|
| **DNS** | `dnsStart` → `dnsEnd` | DNS lookup time |
| **Connect** | `connectStart` → `connectEnd` | TCP connection establishment |
| **SSL** | `sslStart` → `sslEnd` | SSL/TLS handshake |
| **Send** | `sendStart` → `sendEnd` | Time to send request |
| **Wait** | `sendEnd` → `receiveHeadersStart` | Waiting for server response (TTFB) |
| **Receive** | `receiveHeadersStart` → `receiveHeadersEnd` | Time to receive response headers |

!!! tip "Time to First Byte (TTFB)"
    TTFB is the "Wait" phase - the time between sending the request and receiving the first byte of the response. This is crucial for performance analysis.

## Best Practices

### 1. Enable Network Events Only When Needed

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def best_practice_enable():
    async with Chrome() as browser:
        tab = await browser.start()
        
        # ✅ Good: Enable before navigation, disable after
        await tab.enable_network_events()
        await tab.go_to('https://example.com')
        await asyncio.sleep(2)
        logs = await tab.get_network_logs()
        await tab.disable_network_events()
        
        # ❌ Bad: Leaving it enabled throughout entire session
        # await tab.enable_network_events()
        # ... long automation session ...
```

### 2. Filter Logs to Reduce Memory Usage

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def best_practice_filter():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.enable_network_events()
        await tab.go_to('https://example.com')
        await asyncio.sleep(2)
        
        # ✅ Good: Filter for specific requests
        api_logs = await tab.get_network_logs(filter='/api/')
        
        # ❌ Bad: Getting all logs when you only need specific ones
        all_logs = await tab.get_network_logs()
        filtered = [log for log in all_logs if '/api/' in log['params']['request']['url']]
```

### 3. Handle Missing Fields Safely

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def best_practice_safe_access():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.enable_network_events()
        await tab.go_to('https://example.com')
        await asyncio.sleep(2)
        
        logs = await tab.get_network_logs()
        
        # ✅ Good: Safe access with .get()
        for log in logs:
            params = log.get('params', {})
            request = params.get('request', {})
            url = request.get('url', 'Unknown')
            post_data = request.get('postData')  # May be None
            
            if post_data:
                print(f"POST data: {post_data}")
        
        # ❌ Bad: Direct access can raise KeyError
        # url = log['params']['request']['url']
        # post_data = log['params']['request']['postData']  # May not exist!
```

### 4. Use Event Callbacks for Real-Time Needs

```python
import asyncio
from pydoll.protocol.network.events import NetworkEvent, RequestWillBeSentEvent

# ✅ Good: Real-time monitoring with callbacks
async def on_request(event: RequestWillBeSentEvent):
    print(f"New request: {event['params']['request']['url']}")

await tab.on(NetworkEvent.REQUEST_WILL_BE_SENT, on_request)

# ❌ Bad: Polling logs repeatedly (inefficient)
while True:
    logs = await tab.get_network_logs()
    # Process logs...
    await asyncio.sleep(0.5)  # Wasteful!
```

## See Also

- **[CDP Network Domain](../../deep-dive/network-capabilities.md)** - Deep dive into network capabilities
- **[Event System](../advanced/event-system.md)** - Understanding Pydoll's event architecture
- **[Request Interception](interception.md)** - Modifying requests and responses


================================================
FILE: docs/en/features/network/network-recording.md
================================================
# HAR Network Recording

Capture all network activity during a browser session and export it as a standard HAR (HTTP Archive) 1.2 file. Perfect for debugging, performance analysis, and test fixtures.

!!! tip "Debug Like a Pro"
    HAR files are the industry standard for recording network traffic. You can import them directly into Chrome DevTools, Charles Proxy, or any HAR viewer for detailed analysis.

## Why Use HAR Recording?

| Use Case | Benefit |
|----------|---------|
| Debugging failed requests | See exact headers, timing, and response bodies |
| Performance analysis | Identify slow requests and bottlenecks |
| API documentation | Capture real request/response pairs |
| Test fixtures | Record real traffic for test mocking |

## Quick Start

Record all network traffic during a page navigation:

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def record_traffic():
    async with Chrome() as browser:
        tab = await browser.start()

        async with tab.request.record() as capture:
            await tab.go_to('https://example.com')

        # Save the capture as a HAR file
        capture.save('flow.har')
        print(f'Captured {len(capture.entries)} requests')

asyncio.run(record_traffic())
```

## Recording API

### `tab.request.record(resource_types=None)`

Context manager that captures network traffic on the tab.

| Parameter | Type | Description |
|-----------|------|-------------|
| `resource_types` | `list[ResourceType] \| None` | Optional list of resource types to capture. When `None` (default), all types are captured. |

```python
async with tab.request.record() as capture:
    # All network activity inside this block is captured
    await tab.go_to('https://example.com')
    await (await tab.find(id='search')).type_text('pydoll')
    await (await tab.find(type='submit')).click()
```

The `capture` object (`HarCapture`) provides:

| Property/Method | Description |
|----------------|-------------|
| `capture.entries` | List of captured HAR entries |
| `capture.to_dict()` | Full HAR 1.2 dict (for custom processing) |
| `capture.save(path)` | Save as HAR JSON file |

### Filtering by Resource Type

Record only specific resource types instead of all traffic:

```python
from pydoll.protocol.network.types import ResourceType

# Record only fetch/XHR requests (skip documents, images, etc.)
async with tab.request.record(
    resource_types=[ResourceType.FETCH, ResourceType.XHR]
) as capture:
    await tab.go_to('https://example.com')

# Record only document and stylesheet requests
async with tab.request.record(
    resource_types=[ResourceType.DOCUMENT, ResourceType.STYLESHEET]
) as capture:
    await tab.go_to('https://example.com')
```

Available `ResourceType` values:

| Value | Description |
|-------|-------------|
| `ResourceType.DOCUMENT` | HTML documents |
| `ResourceType.STYLESHEET` | CSS stylesheets |
| `ResourceType.SCRIPT` | JavaScript files |
| `ResourceType.IMAGE` | Images |
| `ResourceType.FONT` | Web fonts |
| `ResourceType.MEDIA` | Audio/video |
| `ResourceType.FETCH` | Fetch API requests |
| `ResourceType.XHR` | XMLHttpRequest calls |
| `ResourceType.WEB_SOCKET` | WebSocket connections |
| `ResourceType.OTHER` | Other resource types |

### Saving Captures

```python
# Save as HAR file (can be opened in Chrome DevTools)
capture.save('flow.har')

# Save to a nested directory (created automatically)
capture.save('recordings/session1/flow.har')

# Access the raw HAR dict for custom processing
har_dict = capture.to_dict()
print(har_dict['log']['version'])  # "1.2"
```

### Inspecting Entries

```python
async with tab.request.record() as capture:
    await tab.go_to('https://example.com')

for entry in capture.entries:
    req = entry['request']
    resp = entry['response']
    print(f"{req['method']} {req['url']} -> {resp['status']}")
```

## Advanced Usage

### Filtering Captured Entries

```python
async with tab.request.record() as capture:
    await tab.go_to('https://example.com')

# Filter only API calls
api_entries = [
    e for e in capture.entries
    if '/api/' in e['request']['url']
]

# Filter only failed requests
failed = [
    e for e in capture.entries
    if e['response']['status'] >= 400
]
```

### Custom HAR Processing

```python
har = capture.to_dict()

# Count requests by type
from collections import Counter
types = Counter(
    e.get('_resourceType', 'Other')
    for e in har['log']['entries']
)
print(types)  # Counter({'Document': 1, 'Script': 5, 'Stylesheet': 3, ...})
```

## HAR File Format

The exported HAR follows the [HAR 1.2 specification](http://www.softwareishard.com/blog/har-12-spec/). Each entry contains:

- **Request**: method, URL, headers, query parameters, POST data
- **Response**: status, headers, body content (text or base64-encoded)
- **Timings**: DNS, connect, SSL, send, wait (TTFB), receive
- **Metadata**: server IP, connection ID, resource type

!!! note "Response Bodies"
    Response bodies are captured automatically after each request completes. Binary content (images, fonts, etc.) is stored as base64-encoded strings.


================================================
FILE: docs/en/index.md
================================================
<p align="center">
    <img src="resources/images/logo.png" alt="Pydoll Logo" /> <br><br>
</p>

<p align="center">
    <a href="https://codecov.io/gh/autoscrape-labs/pydoll">
        <img src="https://codecov.io/gh/autoscrape-labs/pydoll/graph/badge.svg?token=40I938OGM9"/> 
    </a>
    <img src="https://github.com/thalissonvs/pydoll/actions/workflows/tests.yml/badge.svg" alt="Tests">
    <img src="https://github.com/thalissonvs/pydoll/actions/workflows/ruff-ci.yml/badge.svg" alt="Ruff CI">
    <img src="https://github.com/thalissonvs/pydoll/actions/workflows/release.yml/badge.svg" alt="Release">
    <img src="https://github.com/thalissonvs/pydoll/actions/workflows/mypy.yml/badge.svg" alt="MyPy CI">
</p>


# Welcome to Pydoll

Hey there! Thanks for checking out Pydoll, the next generation of browser automation for Python. If you're tired of wrestling with webdrivers and looking for a smoother, more reliable way to automate browsers, you're in the right place.

## What is Pydoll?

Pydoll is revolutionizing browser automation by **eliminating the need for webdrivers** completely! Unlike other solutions that rely on external dependencies, Pydoll connects directly to browsers using their DevTools Protocol, providing a seamless and reliable automation experience with native asynchronous performance.

Whether you're scraping data, [testing web applications](https://www.lambdatest.com/web-testing), or automating repetitive tasks, Pydoll makes it surprisingly easy with its intuitive API and powerful features.

## Installation

Create and activate a [virtual environment](https://docs.python.org/3/tutorial/venv.html) first, then install Pydoll:

<div class="termy">
```bash
$ pip install pydoll-python

---> 100%
```
</div>

For the latest development version, you can install directly from GitHub:

```bash
$ pip install git+https://github.com/autoscrape-labs/pydoll.git
```

## Why Choose Pydoll?

- **Genuine Simplicity**: We don't want you wasting time configuring drivers or dealing with compatibility issues. With Pydoll, you install and you're ready to automate.
- **Truly Human Interactions**: Our algorithms simulate real human behavior patterns - from timing between clicks to how the mouse moves across the screen.
- **Native Async Performance**: Built from the ground up with `asyncio`, Pydoll doesn't just support asynchronous operations - it was designed for them.
- **Integrated Intelligence**: Automatic bypass of Cloudflare Turnstile and reCAPTCHA v3 captchas, without external services or complex configurations.
- **Powerful Network Monitoring**: Intercept, modify, and analyze all network traffic with ease, giving you complete control over requests.
- **Event-Driven Architecture**: React to page events, network requests, and user interactions in real-time.
- **Intuitive Element Finding**: Modern `find()` and `query()` methods that make sense and work as you'd expect.
- **Robust Type Safety**: Comprehensive type system for better IDE support and error prevention.


Ready to dive in? The following pages will guide you through installation, basic usage, and advanced features to help you get the most out of Pydoll.

Let's start automating the web, the right way! 🚀

## Quick Start Guide: A simple example

Let's start with a practical example. The following script will open the Pydoll GitHub repository and star it:

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def main():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://github.com/autoscrape-labs/pydoll')
        
        star_button = await tab.find(
            tag_name='button',
            timeout=5,
            raise_exc=False
        )
        if not star_button:
            print("Ops! The button was not found.")
            return

        await star_button.click()
        await asyncio.sleep(3)

asyncio.run(main())
```

This example demonstrates how to navigate to a website, wait for an element to appear, and interact with it. You can adapt this pattern to automate many different web tasks.

??? note "Or use without context manager..."
    If you prefer not to use the context manager pattern, you can manually manage the browser instance:
    
    ```python
    import asyncio
    from pydoll.browser.chromium import Chrome
    
    async def main():
        browser = Chrome()
        tab = await browser.start()
        await tab.go_to('https://github.com/autoscrape-labs/pydoll')
        
        star_button = await tab.find(
            tag_name='button',
            timeout=5,
            raise_exc=False
        )
        if not star_button:
            print("Ops! The button was not found.")
            return

        await star_button.click()
        await asyncio.sleep(3)
        await browser.stop()
    
    asyncio.run(main())
    ```
    
    Note that when not using the context manager, you'll need to explicitly call `browser.stop()` to release resources.

## Extended Example: Custom Browser Configuration

For more advanced usage scenarios, Pydoll allows you to customize your browser configuration using the `ChromiumOptions` class. This is useful when you need to:

- Run in headless mode (no visible browser window)
- Specify a custom browser executable path
- Configure proxies, user agents, or other browser settings
- Set window dimensions or startup arguments

Here's an example showing how to use custom options for Chrome:

```python hl_lines="8-12 30-32 34-38"
import asyncio
import os
from pydoll.browser.chromium import Chrome
from pydoll.browser.options import ChromiumOptions

async def main():
    options = ChromiumOptions()
    options.binary_location = '/usr/bin/google-chrome-stable'
    options.add_argument('--headless=new')
    options.add_argument('--start-maximized')
    options.add_argument('--disable-notifications')
    
    async with Chrome(options=options) as browser:
        tab = await browser.start()
        await tab.go_to('https://github.com/autoscrape-labs/pydoll')
        
        star_button = await tab.find(
            tag_name='button',
            timeout=5,
            raise_exc=False
        )
        if not star_button:
            print("Ops! The button was not found.")
            return

        await star_button.click()
        await asyncio.sleep(3)

        screenshot_path = os.path.join(os.getcwd(), 'pydoll_repo.png')
        await tab.take_screenshot(path=screenshot_path)
        print(f"Screenshot saved to: {screenshot_path}")

        base64_screenshot = await tab.take_screenshot(as_base64=True)

        repo_description_element = await tab.find(
            class_name='f4.my-3'
        )
        repo_description = await repo_description_element.text
        print(f"Repository description: {repo_description}")

if __name__ == "__main__":
    asyncio.run(main())
```

This extended example demonstrates:

1. Creating and configuring browser options
2. Setting a custom Chrome binary path
3. Enabling headless mode for invisible operation
4. Setting additional browser flags
5. Taking screenshots (especially useful in headless mode)

??? info "About Chromium Options"
    The `options.add_argument()` method allows you to pass any Chromium command-line argument to customize browser behavior. There are hundreds of available options to control everything from networking to rendering behavior.
    
    Common Chrome Options
    
    ```python
    # Performance & Behavior Options
    options.add_argument('--headless=new')         # Run Chrome in headless mode
    options.add_argument('--disable-gpu')          # Disable GPU hardware acceleration
    options.add_argument('--no-sandbox')           # Disable sandbox (use with caution)
    options.add_argument('--disable-dev-shm-usage') # Overcome limited resource issues
    
    # Appearance Options
    options.add_argument('--start-maximized')      # Start with maximized window
    options.add_argument('--window-size=1920,1080') # Set specific window size
    options.add_argument('--hide-scrollbars')      # Hide scrollbars
    
    # Network Options
    options.add_argument('--proxy-server=socks5://127.0.0.1:9050') # Use proxy
    options.add_argument('--disable-extensions')   # Disable extensions
    options.add_argument('--disable-notifications') # Disable notifications
    
    # Privacy & Security
    options.add_argument('--incognito')            # Run in incognito mode
    options.add_argument('--disable-infobars')     # Disable infobars
    ```
    
    Complete Reference Guides
    
    For a comprehensive list of all available Chrome command-line arguments, refer to these resources:
    
    - [Chromium Command Line Switches](https://peter.sh/experiments/chromium-command-line-switches/) - Complete reference list
    - [Chrome Flags](chrome://flags) - Enter this in your Chrome browser address bar to see experimental features
    - [Chromium Source Code Flags](https://source.chromium.org/chromium/chromium/src/+/main:chrome/common/chrome_switches.cc) - Direct source code reference
    
    Remember that some options may behave differently across Chrome versions, so it's a good practice to test your configuration when upgrading Chrome.

With these configurations, you can run Pydoll in various environments, including CI/CD pipelines, servers without displays, or Docker containers.

Continue reading the documentation to explore Pydoll's powerful features for handling captchas, working with multiple tabs, interacting with elements, and more.

## Minimal Dependencies

One of Pydoll's advantages is its lightweight footprint. Unlike other browser automation tools that require numerous dependencies, Pydoll is intentionally designed to be minimalist while maintaining powerful capabilities.

### Core Dependencies

Pydoll relies on just a few carefully selected packages:

```
python = "^3.10"
websockets = "^13.1"
aiohttp = "^3.9.5"
aiofiles = "^23.2.1"
bs4 = "^0.0.2"
```

That's it! This minimal dependency approach means:

- **Faster installation** - No complex dependency tree to resolve
- **Fewer conflicts** - Reduced chance of version conflicts with other packages
- **Smaller footprint** - Lower disk space usage
- **Better security** - Smaller attack surface and fewer dependency-related vulnerabilities
- **Easier updates** - Simpler maintenance and fewer breaking changes

The small number of dependencies also contributes to Pydoll's reliability and performance, as there are fewer external factors that could impact its operation.

## Top Sponsors

<a href="https://substack.thewebscraping.club/p/pydoll-webdriver-scraping?utm_source=github&utm_medium=repo&utm_campaign=pydoll" target="_blank" rel="noopener nofollow sponsored">
  <img src="resources/images/banner-the-webscraping-club.png" alt="The Web Scraping Club" />
</a>

<sub>Read a full review of Pydoll on <b><a href="https://substack.thewebscraping.club/p/pydoll-webdriver-scraping?utm_source=github&utm_medium=repo&utm_campaign=pydoll" target="_blank" rel="noopener nofollow sponsored">The Web Scraping Club</a></b>, the #1 newsletter dedicated to web scraping.</sub>

## Sponsors

The support from sponsors is essential to keep the project alive, evolving, and accessible to the entire community. Each partnership helps cover costs, drive new features, and ensure ongoing development. We are truly grateful to everyone who believes in and supports the project!

<div class="sponsors-grid">
  <a href="https://www.thordata.com/?ls=github&lk=pydoll" target="_blank" rel="noopener nofollow sponsored">
    <img src="resources/images/Thordata-logo.png" alt="Thordata" />
  </a>
  <a href="https://www.testmuai.com/?utm_medium=sponsor&utm_source=pydoll" target="_blank" rel="noopener nofollow sponsored">
    <img src="resources/images/logo-lamda-test.svg" alt="LambdaTest" />
  </a>
  <a href="https://dashboard.capsolver.com/passport/register?inviteCode=WPhTbOsbXEpc" target="_blank" rel="noopener nofollow sponsored">
    <img src="resources/images/capsolver-logo.png" alt="CapSolver" />
  </a>
</div>

<p>
  <a href="https://github.com/sponsors/thalissonvs" target="_blank" rel="noopener">Become a sponsor</a>
</p>

## License

Pydoll is released under the MIT License, which gives you the freedom to use, modify, and distribute the code with minimal restrictions. This permissive license makes Pydoll suitable for both personal and commercial projects.

??? info "View Full MIT License Text"
    ```
    MIT License
    
    Copyright (c) 2023 Pydoll Contributors
    
    Permission is hereby granted, free of charge, to any person obtaining a copy
    of this software and associated documentation files (the "Software"), to deal
    in the Software without restriction, including without limitation the rights
    to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
    copies of the Software, and to permit persons to whom the Software is
    furnished to do so, subject to the following conditions:
    
    The above copyright notice and this permission notice shall be included in all
    copies or substantial portions of the Software.
    
    THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
    IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
    FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
    AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
    LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
    OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
    SOFTWARE.
    ```


================================================
FILE: docs/pt/api/browser/chrome.md
================================================
# Browser Chrome
 
::: pydoll.browser.chromium.Chrome
    options:
      show_root_heading: true
      show_source: false
      heading_level: 2 

================================================
FILE: docs/pt/api/browser/edge.md
================================================
# Browser Edge
 
::: pydoll.browser.chromium.Edge
    options:
      show_root_heading: true
      show_source: false
      heading_level: 2 

================================================
FILE: docs/pt/api/browser/managers.md
================================================
# Gerenciadores do Navegador

O módulo de gerenciadores (managers) fornece classes especializadas para gerenciar diferentes aspectos do ciclo de vida e configuração do navegador.

## Visão Geral

Os gerenciadores do navegador lidam com responsabilidades específicas na automação do navegador:

::: pydoll.browser.managers
    options:
      show_root_heading: true
      show_source: false
      heading_level: 2
      filters:
        - "!^_"
        - "!^__"

## Classes de Gerenciadores

### Gerenciador de Processo do Navegador
Gerencia o ciclo de vida do processo do navegador, incluindo iniciar, parar e monitorar os processos do navegador.

::: pydoll.browser.managers.browser_process_manager
    options:
      show_root_heading: true
      show_source: false
      heading_level: 3

### Gerenciador de Opções do Navegador
Lida com as opções de configuração do navegador e argumentos de linha de comando.

::: pydoll.browser.managers.browser_options_manager
    options:
      show_root_heading: true
      show_source: false
      heading_level: 3

### Gerenciador de Proxy
Gerencia a configuração de proxy e autenticação para instâncias do navegador.

::: pydoll.browser.managers.proxy_manager
    options:
      show_root_heading: true
      show_source: false
      heading_level: 3

### Gerenciador de Diretório Temporário
Lida com a criação e limpeza de diretórios temporários usados pelas instâncias do navegador.

::: pydoll.browser.managers.temp_dir_manager
    options:
      show_root_heading: true
      show_source: false
      heading_level: 3

## Uso

Os gerenciadores são normalmente usados internamente pelas classes do navegador, como `Chrome` e `Edge`. Eles fornecem funcionalidade modular que pode ser composta:

```python
from pydoll.browser.managers.proxy_manager import ProxyManager
from pydoll.browser.managers.temp_dir_manager import TempDirManager

# Gerenciadores são usados internamente pelas classes do navegador
# O uso direto é apenas para cenários avançados
proxy_manager = ProxyManager()
temp_manager = TempDirManager()
```

!!! note "Uso Interno"
    Esses gerenciadores são usados principalmente internamente pelas classes do navegador. O uso direto é recomendado apenas para cenários avançados ou ao estender a biblioteca.


================================================
FILE: docs/pt/api/browser/options.md
================================================
# Browser Options

## ChromiumOptions

::: pydoll.browser.options.ChromiumOptions
    options:
      show_root_heading: true
      show_source: false
      heading_level: 3

## Interface Options

::: pydoll.browser.interfaces.Options
    options:
      show_root_heading: true
      show_source: false
      heading_level: 3

## Interface BrowserOptionsManager 

::: pydoll.browser.interfaces.BrowserOptionsManager
    options:
      show_root_heading: true
      show_source: false
      heading_level: 3 

================================================
FILE: docs/pt/api/browser/requests.md
================================================
# Requisições do Navegador

O módulo de requisições (requests) fornece capacidades de requisição HTTP dentro do contexto do navegador, permitindo chamadas de API contínuas que herdam o estado de sessão, cookies e autenticação do navegador.

## Visão Geral

O módulo de requisições do navegador oferece uma interface semelhante à do `requests` para fazer chamadas HTTP diretamente dentro do contexto JavaScript do navegador. Esta abordagem oferece várias vantagens sobre as bibliotecas HTTP tradicionais:

- **Herança de sessão**: Manipulação automática de cookies, autenticação e CORS
- **Contexto do navegador**: As requisições são executadas no mesmo contexto de segurança da página
- **Sem malabarismo de sessão**: Elimina a necessidade de transferir cookies e tokens entre a automação e as chamadas de API
- **Compatibilidade com SPA**: Perfeito para Single Page Applications (Aplicações de Página Única) com fluxos de autenticação complexos

## Classe Request

A interface principal para fazer requisições HTTP dentro do contexto do navegador.

::: pydoll.browser.requests.request.Request
    options:
      show_root_heading: true
      show_source: false
      heading_level: 3
      group_by_category: true
      members_order: source
      filters:
        - "!^__"

## Classe Response

Representa a resposta de requisições HTTP, fornecendo uma interface familiar semelhante à biblioteca `requests`.

::: pydoll.browser.requests.response.Response
    options:
      show_root_heading: true
      show_source: false
      heading_level: 3
      group_by_category: true
      members_order: source
      filters:
        - "!^__"

## Exemplos de Uso

### Métodos HTTP Básicos

```python
from pydoll.browser.chromium import Chrome

async with Chrome() as browser:
    tab = await browser.start()
    await tab.go_to("https://api.example.com")
    
    # Requisição GET
    response = await tab.request.get("/users/123")
    user_data = await response.json()
    
    # Requisição POST
    response = await tab.request.post("/users", json={
        "name": "John Doe",
        "email": "john@example.com"
    })
    
    # Requisição PUT com cabeçalhos
    response = await tab.request.put("/users/123", 
        json={"name": "Jane Doe"},
        headers={"Authorization": "Bearer token123"}
    )
```

### Manipulação de Resposta

```python
# Verificar status da resposta
if response.ok:
    print(f"Sucesso: {response.status_code}")
else:
    print(f"Erro: {response.status_code}")
    response.raise_for_status()  # Levanta HTTPError para 4xx/5xx

# Acessar dados da resposta
text_data = response.text
json_data = await response.json()
raw_bytes = response.content

# Inspecionar cabeçalhos e cookies
print("Cabeçalhos da resposta:", response.headers)
print("Cabeçalhos da requisição:", response.request_headers)
for cookie in response.cookies:
    print(f"Cookie: {cookie.name}={cookie.value}")
```

### Recursos Avançados

```python
# Requisição com cabeçalhos e parâmetros customizados
response = await tab.request.get("/search", 
    params={"q": "python", "limit": 10},
    headers={
        "User-Agent": "Custom Bot 1.0",
        "Accept": "application/json"
    }
)

# Simulação de upload de arquivo
response = await tab.request.post("/upload",
    data={"description": "Test file"},
    files={"file": ("test.txt", "file content", "text/plain")}
)

# Submissão de dados de formulário
response = await tab.request.post("/login",
    data={"username": "user", "password": "pass"}
)
```

## Integração com a Aba (Tab)

A funcionalidade de requisição é acessada através da propriedade `tab.request`, que fornece uma instância `Request` singleton para cada aba:

```python
# Cada aba tem sua própria instância de requisição
tab1 = await browser.get_tab(0)
tab2 = await browser.new_tab()

# Estas são instâncias de Request separadas
request1 = tab1.request  # Requisição vinculada à tab1
request2 = tab2.request  # Requisição vinculada à tab2

# Requisições herdam o contexto da aba
await tab1.go_to("https://site1.com")
await tab2.go_to("https://site2.com")

# Estas requisições terão contextos de cookie/sessão diferentes
response1 = await tab1.request.get("/api/data")  # Usa cookies de site1.com
response2 = await tab2.request.get("/api/data")  # Usa cookies de site2.com
```

!!! tip "Automação Híbrida"
    Este módulo é particularmente poderoso para cenários de automação híbrida onde você precisa combinar interações de UI com chamadas de API. Por exemplo, faça login através da UI, depois use a sessão autenticada para chamadas de API sem manipular manualmente cookies ou tokens.

================================================
FILE: docs/pt/api/browser/tab.md
================================================
# Tab

::: pydoll.browser.tab.Tab
    options:
      show_root_heading: true
      show_source: false
      heading_level: 2

================================================
FILE: docs/pt/api/commands/browser.md
================================================
# Comandos do Navegador

Os comandos do navegador fornecem controle de baixo nível sobre as instâncias do navegador e sua configuração.

## Visão Geral

O módulo de comandos do navegador lida com operações em nível de navegador, como informações de versão, gerenciamento de alvos (targets) e configurações globais do navegador.

::: pydoll.commands.browser_commands
    options:
      show_root_heading: true
      show_source: false
      heading_level: 2
      filters:
        - "!^_"
        - "!^__"

## Uso

Os comandos do navegador são tipicamente usados internamente pelas classes do navegador para gerenciar instâncias do navegador:

```python
from pydoll.commands.browser_commands import get_version
from pydoll.connection.connection_handler import ConnectionHandler

# Obter informações da versão do navegador
connection = ConnectionHandler()
version_info = await get_version(connection)
```

## Comandos Disponíveis

O módulo de comandos do navegador fornece funções para:

- Obter informações de versão do navegador e user agent
- Gerenciar alvos (targets) do navegador (abas, janelas)
- Controlar configurações e permissões globais do navegador
- Lidar com eventos do ciclo de vida do navegador

!!! note "Uso Interno"
    Esses comandos são usados principalmente internamente pelas classes de navegador `Chrome` e `Edge`. O uso direto é recomendado apenas para cenários avançados.

================================================
FILE: docs/pt/api/commands/dom.md
================================================
# Comandos DOM

Os comandos DOM fornecem funcionalidade abrangente para interagir com o Document Object Model (Modelo de Objeto de Documento) das páginas web.

## Visão Geral

O módulo de comandos DOM é um dos módulos mais importantes no Pydoll, fornecendo toda a funcionalidade necessária para encontrar, interagir com e manipular elementos HTML em páginas web.

::: pydoll.commands.dom_commands
    options:
      show_root_heading: true
      show_source: false
      heading_level: 2
      filters:
        - "!^_"
        - "!^__"

## Uso

Os comandos DOM são usados extensivamente pela classe `WebElement` e pelos métodos de localização de elementos:

```python
from pydoll.commands.dom_commands import query_selector, get_attributes
from pydoll.connection.connection_handler import ConnectionHandler

# Encontrar elemento e obter seus atributos
connection = ConnectionHandler()
node_id = await query_selector(connection, selector="#username")
attributes = await get_attributes(connection, node_id=node_id)
```

## Funcionalidades Principais

O módulo de comandos DOM fornece funções para:

### Localização de Elementos
- `query_selector()` - Encontrar elemento único por seletor CSS
- `query_selector_all()` - Encontrar múltiplos elementos por seletor CSS
- `get_document()` - Obter o nó raiz do documento

### Interação com Elementos
- `click_element()` - Clicar em elementos
- `focus_element()` - Focar em elementos
- `set_attribute_value()` - Definir atributos do elemento
- `get_attributes()` - Obter atributos do elemento

### Informações do Elemento
- `get_box_model()` - Obter posicionamento e dimensões do elemento
- `describe_node()` - Obter informações detalhadas do elemento
- `get_outer_html()` - Obter o conteúdo HTML do elemento

### Manipulação do DOM
- `remove_node()` - Remover elementos do DOM
- `set_node_value()` - Definir valores do elemento
- `request_child_nodes()` - Obter elementos filhos

!!! tip "APIs de Alto Nível"
    Embora esses comandos forneçam acesso poderoso de baixo nível, a maioria dos usuários deve usar os métodos de nível superior da classe `WebElement`, como `click()`, `type_text()` e `get_attribute()`, que usam esses comandos internamente.

================================================
FILE: docs/pt/api/commands/fetch.md
================================================
# Comandos Fetch

Os comandos Fetch fornecem capacidades avançadas de manipulação e interceptação de requisições de rede usando o domínio Fetch do Chrome DevTools Protocol (CDP).

## Visão Geral

O módulo de comandos fetch permite o gerenciamento sofisticado de requisições de rede, incluindo modificação de requisições, interceptação de respostas e manipulação de autenticação.

::: pydoll.commands.fetch_commands
    options:
      show_root_heading: true
      show_source: false
      heading_level: 2
      filters:
        - "!^_"
        - "!^__"

## Uso

Os comandos Fetch são usados para interceptação avançada de rede e manipulação de requisições:

```python
from pydoll.commands.fetch_commands import enable, request_paused, continue_request
from pydoll.connection.connection_handler import ConnectionHandler

# Habilitar domínio fetch
connection = ConnectionHandler()
await enable(connection, patterns=[{
    "urlPattern": "*",
    "requestStage": "Request"
}])

# Lidar com requisições pausadas
async def handle_paused_request(request_id, request):
    # Modificar requisição ou continuar como está
    await continue_request(connection, request_id=request_id)
```

## Funcionalidades Principais

O módulo de comandos fetch fornece funções para:

### Interceptação de Requisição
- `enable()` - Habilitar domínio fetch com padrões
- `disable()` - Desabilitar domínio fetch
- `continue_request()` - Continuar requisições interceptadas
- `fail_request()` - Falhar requisições com erros específicos

### Modificação de Requisição
- Modificar cabeçalhos da requisição
- Alterar URLs da requisição
- Alterar métodos da requisição (GET, POST, etc.)
- Modificar corpos (bodies) da requisição

### Manipulação de Resposta
- `fulfill_request()` - Fornecer respostas customizadas
- `get_response_body()` - Obter conteúdo da resposta
- Modificação de cabeçalho de resposta
- Controle do código de status da resposta

### Autenticação
- `continue_with_auth()` - Lidar com desafios de autenticação
- Suporte a autenticação básica
- Fluxos de autenticação customizados

## Recursos Avançados

### Interceptação Baseada em Padrões
```python
# Interceptar padrões de URL específicos
patterns = [
    {"urlPattern": "*/api/*", "requestStage": "Request"},
    {"urlPattern": "*.js", "requestStage": "Response"},
    {"urlPattern": "https://example.com/*", "requestStage": "Request"}
]

await enable(connection, patterns=patterns)
```

### Modificação de Requisição
```python
# Modificar requisições interceptadas
async def modify_request(request_id, request):
    # Adicionar cabeçalho de autenticação
    headers = request.headers.copy()
    headers["Authorization"] = "Bearer token123"
    
    # Continuar com cabeçalhos modificados
    await continue_request(
        connection,
        request_id=request_id,
        headers=headers
    )
```

### Simulação de Resposta (Mocking)
```python
# Simular (mockar) respostas de API
await fulfill_request(
    connection,
    request_id=request_id,
    response_code=200,
    response_headers=[
        {"name": "Content-Type", "value": "application/json"},
        {"name": "Access-Control-Allow-Origin", "value": "*"}
    ],
    body='{"status": "success", "data": {"mocked": true}}'
)
```

### Manipulação de Autenticação
```python
# Lidar com desafios de autenticação
await continue_with_auth(
    connection,
    request_id=request_id,
    auth_challenge_response={
        "response": "ProvideCredentials",
        "username": "user",
        "password": "pass"
    }
)
```

## Estágios da Requisição

Os comandos Fetch podem interceptar requisições em diferentes estágios:

| Estágio | Descrição | Casos de Uso |
|-------|-------------|-----------|
| Requisição | Antes da requisição ser enviada | Modificar cabeçalhos, URL, método |
| Resposta | Após a resposta ser recebida | Simular respostas, modificar conteúdo |

## Manipulação de Erros

```python
# Falhar requisições com erros específicos
await fail_request(
    connection,
    request_id=request_id,
    error_reason="ConnectionRefused"  # ou "AccessDenied", "TimedOut", etc.
)
```

## Integração com Comandos de Rede (Network)

Os comandos Fetch trabalham em conjunto com os comandos de rede (Network), mas fornecem controle mais granular:

- **Comandos de Rede (Network)**: Monitoramento e controle de rede mais amplos
- **Comandos Fetch**: Interceptação e modificação específicas de requisição/resposta

!!! tip "Considerações de Performance"
    A interceptação do Fetch pode impactar a performance de carregamento da página. Use padrões de URL específicos e desabilite quando não for necessário para minimizar a sobrecarga (overhead).

================================================
FILE: docs/pt/api/commands/index.md
================================================
# Visão Geral dos Comandos

O módulo de Comandos (Commands) fornece interfaces de alto nível para interagir com os domínios do Chrome DevTools Protocol (CDP). Cada módulo de comando corresponde a um domínio CDP específico e fornece métodos para executar várias operações do navegador.

## Módulos de Comando Disponíveis

### Comandos do Navegador (Browser)
- **Módulo**: `browser_commands.py`
- **Propósito**: Operações em nível de navegador e gerenciamento de janelas
- **Documentação**: [Comandos do Navegador](browser.md)

### Comandos DOM
- **Módulo**: `dom_commands.py`
- **Propósito**: Manipulação da árvore DOM e operações de elementos
- **Documentação**: [Comandos DOM](dom.md)

### Comandos de Entrada (Input)
- **Módulo**: `input_commands.py`
- **Propósito**: Simulação de eventos de entrada (teclado, mouse, toque)
- **Documentação**: [Comandos de Entrada](input.md)

### Comandos de Rede (Network)
- **Módulo**: `network_commands.py`
- **Propósito**: Monitoramento de rede e interceptação de requisições
- **Documentação**: [Comandos de Rede](network.md)

### Comandos de Página (Page)
- **Módulo**: `page_commands.py`
- **Propósito**: Gerenciamento do ciclo de vida da página e navegação
- **Documentação**: [Comandos de Página](page.md)

### Comandos de Tempo de Execução (Runtime)
- **Módulo**: `runtime_commands.py`
- **Propósito**: Execução de JavaScript e gerenciamento de tempo de execução
- **Documentação**: [Comandos de Tempo de Execução](runtime.md)

### Comandos de Armazenamento (Storage)
- **Módulo**: `storage_commands.py`
- **Propósito**: Acesso ao armazenamento do navegador (cookies, local storage, etc.)
- **Documentação**: [Comandos de Armazenamento](storage.md)

### Comandos de Alvo (Target)
- **Módulo**: `target_commands.py`
- **Propósito**: Gerenciamento de alvos (targets) e operações de aba
- **Documentação**: [Comandos de Alvo](target.md)

### Comandos Fetch
- **Módulo**: `fetch_commands.py`
- **Propósito**: Interceptação e modificação de requisições de rede
- **Documentação**: [Comandos Fetch](fetch.md)

## Padrão de Uso

Os comandos são tipicamente acessados através das instâncias do navegador (browser) ou aba (tab):

```python
from pydoll.browser.chromium import Chrome

# Inicializa o navegador
browser = Chrome()
await browser.start()

# Obtém a aba ativa
tab = await browser.get_active_tab()

# Usa comandos através da aba
await tab.go_to("https://example.com")
element = await tab.find(id="button")
await element.click()
```

## Estrutura dos Comandos

Cada módulo de comando segue um padrão consistente:
- **Métodos estáticos**: Para execução direta de comandos
- **Dicas de tipo (Type hints)**: Segurança de tipo (type safety) completa com tipos de protocolo
- **Tratamento de erros**: Tratamento de exceção adequado para erros CDP
- **Documentação**: Docstrings abrangentes com exemplos

================================================
FILE: docs/pt/api/commands/input.md
================================================
# Comandos de Entrada (Input)

Os comandos de entrada lidam com interações de mouse e teclado, fornecendo simulação de entrada semelhante à humana.

## Visão Geral

O módulo de comandos de entrada fornece funcionalidade para simular a entrada do usuário, incluindo movimentos do mouse, cliques, digitação no teclado e pressionamento de teclas.

::: pydoll.commands.input_commands
    options:
      show_root_heading: true
      show_source: false
      heading_level: 2
      filters:
        - "!^_"
        - "!^__"

## Uso

Os comandos de entrada são usados por métodos de interação de elementos e podem ser usados diretamente para cenários de entrada avançados:

```python
from pydoll.commands.input_commands import dispatch_mouse_event, dispatch_key_event
from pydoll.connection.connection_handler import ConnectionHandler

# Simular clique do mouse
connection = ConnectionHandler()
await dispatch_mouse_event(
    connection, 
    type="mousePressed", 
    x=100, 
    y=200, 
    button="left"
)

# Simular digitação do teclado
await dispatch_key_event(
    connection,
    type="keyDown",
    key="Enter"
)
```

## Funcionalidades Principais

O módulo de comandos de entrada fornece funções para:

### Eventos de Mouse
- `dispatch_mouse_event()` - Cliques, movimentos e eventos de roda do mouse
- Estados dos botões do mouse (esquerdo, direito, meio)
- Posicionamento baseado em coordenadas
- Operações de arrastar e soltar (drag and drop)

### Eventos de Teclado
- `dispatch_key_event()` - Eventos de pressionar e soltar tecla
- `insert_text()` - Inserção direta de texto
- Manipulação de teclas especiais (Enter, Tab, teclas de seta, etc.)
- Teclas modificadoras (Ctrl, Alt, Shift)

### Eventos de Toque (Touch)
- Simulação de tela de toque
- Gestos multitoque (multi-touch)
- Coordenadas e pressão do toque

## Comportamento Semelhante ao Humano

Os comandos de entrada suportam padrões de comportamento semelhantes ao humano:

- Curvas naturais de movimento do mouse
- Velocidades e padrões de digitação realistas
- Microatrasos aleatórios entre ações
- Eventos de toque sensíveis à pressão

!!! tip "Métodos de Elemento"
    Para a maioria dos casos de uso, utilize os métodos de elemento de nível superior, como `element.click()` e `element.type_text()`, que fornecem uma API mais conveniente e lidam com cenários comuns automaticamente.

================================================
FILE: docs/pt/api/commands/network.md
================================================
# Comandos de Rede (Network)

Os comandos de rede fornecem controle abrangente sobre requisições de rede, respostas e comportamento de rede do navegador.

## Visão Geral

O módulo de comandos de rede habilita a interceptação de requisições, modificação de respostas, gerenciamento de cookies e capacidades de monitoramento de rede.

::: pydoll.commands.network_commands
    options:
      show_root_heading: true
      show_source: false
      heading_level: 2
      filters:
        - "!^_"
        - "!^__"

## Uso

Os comandos de rede são usados para cenários avançados como interceptação de requisições e monitoramento de rede:

```python
from pydoll.commands.network_commands import enable, set_request_interception
from pydoll.connection.connection_handler import ConnectionHandler

# Habilitar monitoramento de rede
connection = ConnectionHandler()
await enable(connection)

# Habilitar interceptação de requisições
await set_request_interception(connection, patterns=[{"urlPattern": "*"}])
```

## Funcionalidades Principais

O módulo de comandos de rede fornece funções para:

### Gerenciamento de Requisições
- `enable()` / `disable()` - Habilitar/desabilitar monitoramento de rede
- `set_request_interception()` - Interceptar e modificar requisições
- `continue_intercepted_request()` - Continuar ou modificar requisições interceptadas
- `get_request_post_data()` - Obter dados do corpo (body) da requisição

### Manipulação de Respostas
- `get_response_body()` - Obter conteúdo da resposta
- `fulfill_request()` - Fornecer respostas customizadas
- `fail_request()` - Simular falhas de rede

### Gerenciamento de Cookies
- `get_cookies()` - Obter cookies do navegador
- `set_cookies()` - Definir cookies do navegador
- `delete_cookies()` - Deletar cookies específicos
- `clear_browser_cookies()` - Limpar todos os cookies

### Controle de Cache
- `clear_browser_cache()` - Limpar cache do navegador
- `set_cache_disabled()` - Desabilitar cache do navegador
- `get_response_body_for_interception()` - Obter respostas em cache

### Segurança & Cabeçalhos
- `set_user_agent_override()` - Sobrescrever user agent
- `set_extra_http_headers()` - Adicionar cabeçalhos customizados
- `emulate_network_conditions()` - Simular condições de rede

## Casos de Uso Avançados

### Interceptação de Requisição
```python
# Interceptar e modificar requisições
await set_request_interception(connection, patterns=[
    {"urlPattern": "*/api/*", "requestStage": "Request"}
])

# Lidar com requisição interceptada
async def handle_request(request):
    if "api/login" in request.url:
        # Modificar cabeçalhos da requisição
        headers = request.headers.copy()
        headers["Authorization"] = "Bearer token"
        await continue_intercepted_request(
            connection, 
            request_id=request.request_id,
            headers=headers
        )
```

### Simulação de Resposta (Mocking)
```python
# Simular (mockar) respostas de API
await fulfill_request(
    connection,
    request_id=request_id,
    response_code=200,
    response_headers={"Content-Type": "application/json"},
    body='{"status": "success"}'
)
```

!!! warning "Impacto na Performance"
    A interceptação de rede pode impactar a performance de carregamento da página. Use seletivamente e desabilite quando não for necessário.

================================================
FILE: docs/pt/api/commands/page.md
================================================
# Comandos de Página (Page)

Os comandos de página lidam com a navegação da página, eventos do ciclo de vida e operações em nível de página.

## Visão Geral

O módulo de comandos de página fornece funcionalidade para navegar entre páginas, gerenciar o ciclo de vida da página, lidar com a execução de JavaScript e controlar o comportamento da página.

::: pydoll.commands.page_commands
    options:
      show_root_heading: true
      show_source: false
      heading_level: 2
      filters:
        - "!^_"
        - "!^__"

## Uso

Os comandos de página são usados extensivamente pela classe `Tab` para navegação e gerenciamento da página:

```python
from pydoll.commands.page_commands import navigate, reload, enable
from pydoll.connection.connection_handler import ConnectionHandler

# Navegar para uma URL
connection = ConnectionHandler()
await enable(connection)  # Habilitar eventos da página
await navigate(connection, url="https://example.com")

# Recarregar a página
await reload(connection)
```

## Funcionalidades Principais

O módulo de comandos de página fornece funções para:

### Navegação
- `navigate()` - Navegar para URLs
- `reload()` - Recarregar página atual
- `go_back()` - Navegar para trás no histórico
- `go_forward()` - Navegar para frente no histórico
- `stop_loading()` - Parar carregamento da página

### Ciclo de Vida da Página
- `enable()` / `disable()` - Habilitar/desabilitar eventos da página
- `get_frame_tree()` - Obter estrutura de frames da página
- `get_navigation_history()` - Obter histórico de navegação

### Gerenciamento de Conteúdo
- `get_resource_content()` - Obter conteúdo de recurso da página
- `search_in_resource()` - Pesquisar dentro de recursos da página
- `set_document_content()` - Definir conteúdo HTML da página

### Capturas de Tela & PDF
- `capture_screenshot()` - Tirar capturas de tela da página
- `print_to_pdf()` - Gerar PDF a partir da página
- `capture_snapshot()` - Capturar snapshots da página

### Execução de JavaScript
- `add_script_to_evaluate_on_new_document()` - Adicionar scripts para avaliar em novo documento (scripts de inicialização)
- `remove_script_to_evaluate_on_new_document()` - Remover scripts de inicialização

### Configurações da Página
- `set_lifecycle_events_enabled()` - Controlar eventos do ciclo de vida
- `set_ad_blocking_enabled()` - Habilitar/desabilitar bloqueio de anúncios
- `set_bypass_csp()` - Contornar (Bypass) Política de Segurança de Conteúdo (CSP)

## Recursos Avançados

### Gerenciamento de Frames
```python
# Obter todos os frames na página
frame_tree = await get_frame_tree(connection)
for frame in frame_tree.child_frames:
    print(f"Frame: {frame.frame.url}")
```

### Interceptação de Recursos
```python
# Obter conteúdo do recurso
content = await get_resource_content(
    connection, 
    frame_id=frame_id, 
    url="https://example.com/script.js"
)
```

### Eventos da Página
Os comandos de página funcionam com vários eventos de página:
- `Page.loadEventFired` - Carregamento da página concluído
- `Page.domContentEventFired` - Conteúdo DOM carregado
- `Page.frameNavigated` - Navegação do frame
- `Page.frameStartedLoading` - Carregamento do frame iniciado

!!! tip "Integração com a Classe Tab"
    A maioria das operações de página está disponível através dos métodos da classe `Tab`, como `tab.go_to()`, `tab.refresh()` e `tab.take_screenshot()`, que fornecem uma API mais conveniente.

================================================
FILE: docs/pt/api/commands/runtime.md
================================================
# Comandos de Tempo de Execução (Runtime)

Os comandos de tempo de execução fornecem capacidades de execução de JavaScript e gerenciamento do ambiente de tempo de execução.

## Visão Geral

O módulo de comandos de tempo de execução habilita a execução de código JavaScript, inspeção de objetos e controle do ambiente de tempo de execução dentro dos contextos do navegador.

::: pydoll.commands.runtime_commands
    options:
      show_root_heading: true
      show_source: false
      heading_level: 2
      filters:
        - "!^_"
        - "!^__"

## Uso

Os comandos de tempo de execução são usados para execução de JavaScript e gerenciamento do tempo de execução:

```python
from pydoll.commands.runtime_commands import evaluate, enable
from pydoll.connection.connection_handler import ConnectionHandler

# Habilitar eventos de tempo de execução
connection = ConnectionHandler()
await enable(connection)

# Executar JavaScript
result = await evaluate(
    connection, 
    expression="document.title",
    return_by_value=True
)
print(result.value)  # Título da página
```

## Funcionalidades Principais

O módulo de comandos de tempo de execução fornece funções para:

### Execução de JavaScript
- `evaluate()` - Executar expressões JavaScript
- `call_function_on()` - Chamar funções em objetos
- `compile_script()` - Compilar JavaScript para reutilização
- `run_script()` - Executar scripts compilados

### Gerenciamento de Objetos
- `get_properties()` - Obter propriedades do objeto
- `release_object()` - Liberar referências de objeto
- `release_object_group()` - Liberar grupos de objetos

### Controle de Tempo de Execução
- `enable()` / `disable()` - Habilitar/desabilitar eventos de tempo de execução
- `discard_console_entries()` - Limpar entradas do console
- `set_custom_object_formatter_enabled()` - Habilitar formatadores customizados

### Manipulação de Exceções
- `set_async_call_stack_depth()` - Definir profundidade da pilha de chamadas assíncronas
- Captura e relatório de exceções
- Inspeção de objeto de erro

## Uso Avançado

### Execução de JavaScript Complexo
```python
# Executar JavaScript complexo com tratamento de erros
script = """
(() => {
    try {
        const elements = document.querySelectorAll('.item');
        return Array.from(elements).map(el => ({
            text: el.textContent,
            href: el.href
        }));
    } catch (error) {
        return { error: error.message };
    }
})()
"""

result = await evaluate(
    connection,
    expression=script,
    return_by_value=True,
    await_promise=True
)
```

### Inspeção de Objeto
```python
# Obter propriedades detalhadas do objeto
properties = await get_properties(
    connection,
    object_id=object_id,
    own_properties=True,
    accessor_properties_only=False
)

for prop in properties:
    print(f"{prop.name}: {prop.value}")
```

### Integração com Console
Os comandos de tempo de execução se integram ao console do navegador:
- Mensagens e erros do console
- Chamadas de método da API Console
- Formatadores de console customizados

!!! note "Considerações de Performance"
    A execução de JavaScript através dos comandos de tempo de execução pode ser mais lenta do que a execução nativa do navegador. Use com moderação para operações complexas.

================================================
FILE: docs/pt/api/commands/storage.md
================================================
# Comandos de Armazenamento (Storage)

Os comandos de armazenamento fornecem gerenciamento abrangente do armazenamento do navegador, incluindo cookies, localStorage, sessionStorage e IndexedDB.

## Visão Geral

O módulo de comandos de armazenamento permite o gerenciamento de todos os mecanismos de armazenamento do navegador, fornecendo funcionalidade para persistência e recuperação de dados.

::: pydoll.commands.storage_commands
    options:
      show_root_heading: true
      show_source: false
      heading_level: 2
      filters:
        - "!^_"
        - "!^__"

## Uso

Os comandos de armazenamento são usados para gerenciar o armazenamento do navegador em diferentes mecanismos:

```python
from pydoll.commands.storage_commands import get_cookies, set_cookies, clear_data_for_origin
from pydoll.connection.connection_handler import ConnectionHandler

# Obter cookies para um domínio
connection = ConnectionHandler()
cookies = await get_cookies(connection, urls=["https://example.com"])

# Definir um novo cookie
await set_cookies(connection, cookies=[{
    "name": "session_id",
    "value": "abc123",
    "domain": "example.com",
    "path": "/",
    "httpOnly": True,
    "secure": True
}])

# Limpar todo o armazenamento para uma origem
await clear_data_for_origin(
    connection,
    origin="https://example.com",
    storage_types="all"
)
```

## Funcionalidades Principais

O módulo de comandos de armazenamento fornece funções para:

### Gerenciamento de Cookies
- `get_cookies()` - Obter cookies por URL ou domínio
- `set_cookies()` - Definir novos cookies
- `delete_cookies()` - Deletar cookies específicos
- `clear_cookies()` - Limpar todos os cookies

### Local Storage
- `get_dom_storage_items()` - Obter itens do localStorage
- `set_dom_storage_item()` - Definir item do localStorage
- `remove_dom_storage_item()` - Remover item do localStorage
- `clear_dom_storage()` - Limpar localStorage

### Session Storage
- Operações de session storage (semelhantes ao localStorage)
- Gerenciamento de dados específicos da sessão
- Armazenamento isolado por aba

### IndexedDB
- `get_database_names()` - Obter bancos de dados IndexedDB
- `request_database()` - Acessar a estrutura do banco de dados
- `request_data()` - Consultar dados do banco de dados
- `clear_object_store()` - Limpar object stores

### Cache Storage
- `request_cache_names()` - Obter nomes de cache
- `request_cached_response()` - Obter respostas em cache
- `delete_cache()` - Deletar entradas de cache

### Application Cache (Obsoleto)
- Suporte a cache de aplicação legado
- Cache baseado em manifesto

## Recursos Avançados

### Operações em Massa
```python
# Limpar todos os tipos de armazenamento para múltiplas origens
origins = ["https://example.com", "https://api.example.com"]
for origin in origins:
    await clear_data_for_origin(
        connection,
        origin=origin,
        storage_types="cookies,local_storage,session_storage,indexeddb"
    )
```

### Cotas de Armazenamento
```python
# Obter informações de uso e cota de armazenamento
quota_info = await get_usage_and_quota(connection, origin="https://example.com")
print(f"Usado: {quota_info.usage} bytes")
print(f"Cota: {quota_info.quota} bytes")
```

### Armazenamento Cross-Origin
```python
# Gerenciar armazenamento entre diferentes origens
await set_cookies(connection, cookies=[{
    "name": "cross_site_token",
    "value": "token123",
    "domain": ".example.com",  # Aplica-se a todos os subdomínios
    "sameSite": "None",
    "secure": True
}])
```

## Tipos de Armazenamento

O módulo suporta vários mecanismos de armazenamento:

| Tipo de Armazenamento | Persistência | Escopo | Capacidade |
|--------------|-------------|-------|----------|
| Cookies | Persistente | Domínio/Caminho | ~4KB por cookie |
| localStorage | Persistente | Origem | ~5-10MB |
| sessionStorage | Sessão | Aba | ~5-10MB |
| IndexedDB | Persistente | Origem | Grande (GB+) |
| Cache API | Persistente | Origem | Grande |

!!! warning "Considerações de Privacidade"
    Operações de armazenamento podem afetar a privacidade do usuário. Sempre lide com dados de armazenamento de forma responsável e em conformidade com as regulamentações de privacidade.

================================================
FILE: docs/pt/api/commands/target.md
================================================
# Comandos de Alvo (Target)

Os comandos de alvo (Target) gerenciam os alvos do navegador, incluindo abas, janelas e outros contextos de navegação.

## Visão Geral

O módulo de comandos de alvo fornece funcionalidade para criar, gerenciar e controlar os alvos do navegador, como abas, janelas pop-up e service workers.

::: pydoll.commands.target_commands
    options:
      show_root_heading: true
      show_source: false
      heading_level: 2
      filters:
        - "!^_"
        - "!^__"

## Uso

Os comandos de alvo são usados internamente pelas classes do navegador para gerenciar abas e janelas:

```python
from pydoll.commands.target_commands import get_targets, create_target, close_target
from pydoll.connection.connection_handler import ConnectionHandler

# Obter todos os alvos do navegador
connection = ConnectionHandler()
targets = await get_targets(connection)

# Criar uma nova aba
new_target = await create_target(connection, url="https://example.com")

# Fechar um alvo
await close_target(connection, target_id=new_target.target_id)
```

## Funcionalidades Principais

O módulo de comandos de alvo fornece funções para:

### Gerenciamento de Alvo
- `get_targets()` - Listar todos os alvos do navegador
- `create_target()` - Criar novas abas ou janelas
- `close_target()` - Fechar alvos específicos
- `activate_target()` - Trazer alvo para o primeiro plano

### Informações do Alvo
- `get_target_info()` - Obter informações detalhadas do alvo
- Tipos de alvo: page, background_page, service_worker, browser
- Estados do alvo: attached, detached, crashed

### Gerenciamento de Sessão
- `attach_to_target()` - Anexar a um alvo para controle
- `detach_from_target()` - Desanexar de um alvo
- `send_message_to_target()` - Enviar comandos para alvos

### Contexto do Navegador
- `create_browser_context()` - Criar contexto de navegador isolado
- `dispose_browser_context()` - Remover contexto de navegador
- `get_browser_contexts()` - Listar contextos de navegador

## Tipos de Alvos

Diferentes tipos de alvos podem ser gerenciados:

### Alvos de Página
```python
# Criar uma nova aba
page_target = await create_target(
    connection,
    url="https://example.com",
    width=1920,
    height=1080,
    browser_context_id=None  # Contexto padrão
)
```

### Janelas Pop-up
```python
# Criar uma janela pop-up
popup_target = await create_target(
    connection,
    url="https://popup.example.com",
    width=800,
    height=600,
    new_window=True
)
```

### Contextos Anônimos (Incognito)
```python
# Criar contexto de navegador anônimo
incognito_context = await create_browser_context(connection)

# Criar aba no contexto anônimo
incognito_tab = await create_target(
    connection,
    url="https://private.example.com",
    browser_context_id=incognito_context.browser_context_id
)
```

!!! info "Headless vs Headed: como os contextos se manifestam"
    Contextos de navegador são ambientes lógicos isolados. No modo **headed** (com interface gráfica), a primeira página criada dentro de um novo contexto geralmente abrirá em uma nova janela do SO. No modo **headless** (sem interface gráfica), nenhuma janela é mostrada — o isolamento permanece puramente lógico (cookies, armazenamento, cache e estado de autenticação ainda são separados por contexto). Prefira contextos em pipelines headless/CI para performance e isolamento limpo.

## Recursos Avançados

### Eventos de Alvo
Os comandos de alvo funcionam com vários eventos de alvo:
- `Target.targetCreated` - Novo alvo criado
- `Target.targetDestroyed` - Alvo fechado
- `Target.targetInfoChanged` - Informações do alvo atualizadas
- `Target.targetCrashed` - Alvo falhou (crashed)

### Coordenação Multi-Alvo
```python
# Gerenciar múltiplas abas
targets = await get_targets(connection)
page_targets = [t for t in targets if t.type == "page"]

for target in page_targets:
    # Realizar operações em cada aba
    await activate_target(connection, target_id=target.target_id)
    # ... fazer o trabalho nesta aba
```

### Isolamento de Alvo
```python
# Criar contexto de navegador isolado para testes
test_context = await create_browser_context(connection)

# Todos os alvos neste contexto estão isolados
test_tab1 = await create_target(
    connection, 
    url="https://test1.com",
    browser_context_id=test_context.browser_context_id
)

test_tab2 = await create_target(
    connection,
    url="https://test2.com", 
    browser_context_id=test_context.browser_context_id
)
```

!!! note "Integração com o Navegador"
    Os comandos de alvo são usados principalmente internamente pelas classes de navegador `Chrome` e `Edge`. As APIs de navegador de alto nível fornecem métodos mais convenientes para o gerenciamento de abas.

================================================
FILE: docs/pt/api/connection/connection.md
================================================
# Connection Handler

::: pydoll.connection.connection_handler.ConnectionHandler
    options:
      show_root_heading: true
      show_source: false
      heading_level: 2

================================================
FILE: docs/pt/api/connection/managers.md
================================================
# Connection Managers

## CommandsManager

::: pydoll.connection.managers.commands_manager.CommandsManager
    options:
      show_root_heading: true
      show_source: false
      heading_level: 3

## EventsManager

::: pydoll.connection.managers.events_manager.EventsManager
    options:
      show_root_heading: true
      show_source: false
      heading_level: 3 

================================================
FILE: docs/pt/api/core/constants.md
================================================
# Constants

O módulo de constantes fornece valores predefinidos e configurações padrão para o navegador.

::: pydoll.constants
    options:
      show_root_heading: true
      show_source: false
      heading_level: 2
      group_by_category: true
      members_order: source 

================================================
FILE: docs/pt/api/core/exceptions.md
================================================
# Exceptions

O módulo de exceções fornece classes de exceção personalizadas que podem ser lançadas por operações do Pydoll.

::: pydoll.exceptions
    options:
      show_root_heading: true
      show_source: false
      heading_level: 2
      group_by_category: true
      members_order: source 

================================================
FILE: docs/pt/api/core/utils.md
================================================
# Utilities

O módulo de utilitários fornece funções e classes auxiliares usadas em todo o Pydoll.

::: pydoll.utils
    options:
      show_root_heading: true
      show_source: false
      heading_level: 2
      group_by_category: true
      members_order: source 

================================================
FILE: docs/pt/api/elements/mixins.md
================================================
# Mixins de Elementos

O módulo de mixins fornece funcionalidade reutilizável que pode ser incorporada a classes de elementos para estender suas capacidades.

## Mixin Find Elements

O `FindElementsMixin` fornece capacidades de localização de elementos para as classes que o incluem.

::: pydoll.elements.mixins.find_elements_mixin
    options:
      show_root_heading: true
      show_source: false
      heading_level: 2
      filters:
        - "!^_"
        - "!^__"

## Uso

Mixins são tipicamente usados internamente pela biblioteca para compor funcionalidades. O `FindElementsMixin` é usado por classes como `Tab` e `WebElement` para fornecer métodos de localização de elementos:

```python
# Estes métodos vêm do FindElementsMixin
element = await tab.find(id="username")
elements = await tab.find(class_name="item", find_all=True)
element = await tab.query("#submit-button")
```

## Métodos Disponíveis

O `FindElementsMixin` fornece vários métodos para encontrar elementos:

- `find()` - Localização de elementos moderna com argumentos nomeados (keyword arguments)
- `query()` - Consultas de seletor CSS e XPath
- `find_element()` - Método de localização de elemento legado
- `find_elements()` - Método legado para encontrar múltiplos elementos

!!! tip "Moderno vs. Legado"
    O método `find()` é a abordagem moderna e recomendada para encontrar elementos. Os métodos `find_element()` e `find_elements()` são mantidos para compatibilidade com versões anteriores.

================================================
FILE: docs/pt/api/elements/shadow_root.md
================================================
# ShadowRoot

::: pydoll.elements.shadow_root.ShadowRoot
    options:
      show_root_heading: true
      show_source: false
      heading_level: 2
      members_order: source
      group_by_category: true


================================================
FILE: docs/pt/api/elements/web_element.md
================================================
# WebElement

::: pydoll.elements.web_element.WebElement
    options:
      show_root_heading: true
      show_source: false
      heading_level: 2
      members_order: source
      group_by_category: true 

================================================
FILE: docs/pt/api/index.md
================================================
# Referência da API

Bem-vindo à Referência da API do Pydoll! Esta seção fornece documentação abrangente para todas as classes, métodos e funções disponíveis na biblioteca Pydoll.

---

## Visão Geral

O Pydoll está organizado em vários módulos chave, cada um servindo a um propósito específico na automação do navegador:

### Módulo Browser (Navegador)
O módulo `browser` contém classes para gerenciar instâncias de navegador e seu ciclo de vida.

* **[Chrome](browser/chrome.md)** - Automação do navegador Chrome
* **[Edge](browser/edge.md)** - Automação do navegador Microsoft Edge
* **[Options](browser/options.md)** - Opções de configuração do navegador
* **[Tab](browser/tab.md)** - Gerenciamento e interação de abas
* **[Requests](browser/requests.md)** - Requisições HTTP dentro do contexto do navegador
* **[Managers](browser/managers.md)** - Gerenciadores do ciclo de vida do navegador

### Módulo Elements (Elementos)
O módulo `elements` fornece classes para interagir com elementos de página web.

* **[WebElement](elements/web_element.md)** - Interação com elemento individual
* **[Mixins](elements/mixins.md)** - Funcionalidade de elemento reutilizável

### Módulo Connection (Conexão)
O módulo `connection` lida com a comunicação com o navegador através do Chrome DevTools Protocol.

* **[Connection Handler](connection/connection.md)** - Gerenciamento de conexão WebSocket
* **[Managers](connection/managers.md)** - Gerenciadores do ciclo de vida da conexão

### Módulo Commands (Comandos)
O módulo `commands` fornece implementações de comando de baixo nível do Chrome DevTools Protocol.

* **[Visão Geral dos Comandos](commands/index.md)** - Implementações de comando CDP por domínio

### Módulo Protocol (Protocolo)
O módulo `protocol` implementa os comandos e eventos do Chrome DevTools Protocol.

* **[Tipos Base](protocol/base.md)** - Tipos base para o Chrome DevTools Protocol
* **[Browser](protocol/browser.md)** - Comandos e eventos do domínio Browser
* **[DOM](protocol/dom.md)** - Comandos e eventos do domínio DOM
* **[Fetch](protocol/fetch.md)** - Comandos e eventos do domínio Fetch
* **[Input](protocol/input.md)** - Comandos e eventos do domínio Input
* **[Network](protocol/network.md)** - Comandos e eventos do domínio Network
* **[Page](protocol/page.md)** - Comandos e eventos do domínio Page
* **[Runtime](protocol/runtime.md)** - Comandos e eventos do domínio Runtime
* **[Storage](protocol/storage.md)** - Comandos e eventos do domínio Storage
* **[Target](protocol/target.md)** - Comandos e eventos do domínio Target

### Módulo Core (Núcleo)
O módulo `core` contém utilitários fundamentais, constantes e exceções.

* **[Constants](core/constants.md)** - Constantes e enums da biblioteca
* **[Exceptions](core/exceptions.md)** - Classes de exceção customizadas
* **[Utils](core/utils.md)** - Funções de utilidade

---

## Navegação Rápida

### Classes Mais Comuns

| Classe | Propósito | Módulo |
|-------|---------|--------|
| `Chrome` | Automação do navegador Chrome | `pydoll.browser.chromium` |
| `Edge` | Automação do navegador Edge | `pydoll.browser.chromium` |
| `Tab` | Interação e controle de abas | `pydoll.browser.tab` |
| `WebElement` | Interação com elementos | `pydoll.elements.web_element` |
| `ChromiumOptions` | Configuração do navegador | `pydoll.browser.options` |

### Enums e Constantes Chave

| Nome | Propósito | Módulo |
|------|---------|--------|
| `By` | Estratégias de seletor de elemento | `pydoll.constants` |
| `Key` | Constantes de tecla do teclado | `pydoll.constants` |
| `PermissionType` | Tipos de permissão do navegador | `pydoll.constants` |

### Exceções Comuns

| Exceção | Quando Lançada | Módulo |
|-----------|-------------|--------|
| `ElementNotFound` | Elemento não encontrado no DOM | `pydoll.exceptions` |
| `WaitElementTimeout` | Timeout de espera de elemento | `pydoll.exceptions` |
| `BrowserNotStarted` | Navegador não iniciado | `pydoll.exceptions` |

---

## Padrões de Uso

### Automação Básica do Navegador

```python
from pydoll.browser.chromium import Chrome

async with Chrome() as browser:
    tab = await browser.start()
    await tab.go_to("https://example.com")
    element = await tab.find(id="my-element")
    await element.click()
```

### Localização de Elementos

```python
# Usando o método moderno find()
element = await tab.find(id="username")
element = await tab.find(tag_name="button", class_name="submit")

# Usando seletores CSS ou XPath
element = await tab.query("#username")
element = await tab.query("//button[@class='submit']")
```

### Manipulação de Eventos

```python
await tab.enable_page_events()
await tab.on('Page.loadEventFired', handle_page_load)
```

---

## Suporte a Tipagem e Assincronismo

### Dicas de Tipo (Type Hints)
O Pydoll é totalmente tipado e fornece **dicas de tipo** abrangentes para melhor suporte da IDE e segurança de código. Todas as APIs públicas incluem anotações de tipo adequadas.

```python
from typing import Optional, List
from pydoll.elements.web_element import WebElement

# Métodos retornam objetos tipados corretamente
element: Optional[WebElement] = await tab.find(id="test", raise_exc=False)
elements: List[WebElement] = await tab.find(class_name="item", find_all=True)
```

### Suporte Async/Await
Todas as operações do Pydoll são **assíncronas** e devem ser usadas com **`async`**/**`await`**:

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def main():
    # Todas as operações do Pydoll são assíncronas
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to("https://example.com")
        
asyncio.run(main())
```

Navegue pelas seções abaixo para explorar a documentação completa da API para cada módulo.

================================================
FILE: docs/pt/api/protocol/base.md
================================================
# Protocol Base Types

Tipos e estruturas base para comandos, respostas e eventos do Chrome DevTools Protocol.

## Base Types

::: pydoll.protocol.base
    options:
      show_root_heading: true
      show_source: false
      heading_level: 3
      group_by_category: true
      members_order: source
      filters:
        - "!^__"

================================================
FILE: docs/pt/api/protocol/browser.md
================================================
# Protocolo do Navegador

Domínio de comandos, eventos e tipos para o Chrome DevTools Protocol.

## Métodos

::: pydoll.protocol.browser.methods
    options:
      show_root_heading: true
      show_source: false
      heading_level: 2

## Eventos  

::: pydoll.protocol.browser.events
    options:
      show_root_heading: true
      show_source: false
      heading_level: 2

## Tipos

::: pydoll.protocol.browser.types
    options:
      show_root_heading: true
      show_source: false
      heading_level: 2

================================================
FILE: docs/pt/api/protocol/dom.md
================================================
# Protocolo DOM

Comandos, eventos e tipos do domínio DOM do Chrome DevTools Protocol.

## Métodos

::: pydoll.protocol.dom.methods
    options:
      show_root_heading: true
      show_source: false
      heading_level: 2

## Eventos

::: pydoll.protocol.dom.events
    options:
      show_root_heading: true
      show_source: false
      heading_level: 2

## Tipos

::: pydoll.protocol.dom.types
    options:
      show_root_heading: true
      show_source: false
      heading_level: 2

================================================
FILE: docs/pt/api/protocol/fetch.md
================================================
# Protocolo Fetch

Domínio de comandos, eventos e tipos para o Chrome DevTools Protocol.

## Métodos

::: pydoll.protocol.fetch.methods
    options:
      show_root_heading: true
      show_source: false
      heading_level: 2

## Eventos

::: pydoll.protocol.fetch.events
    options:
      show_root_heading: true
      show_source: false
      heading_level: 2

## Tipos

::: pydoll.protocol.fetch.types
    options:
      show_root_heading: true
      show_source: false
      heading_level: 2

================================================
FILE: docs/pt/api/protocol/input.md
================================================
# Protocolo Input

Domínio de comandos, eventos e tipos para o Chrome DevTools Protocol.

## Métodos

::: pydoll.protocol.input.methods
    options:
      show_root_heading: true
      show_source: false
      heading_level: 2

## Eventos

::: pydoll.protocol.input.events
    options:
      show_root_heading: true
      show_source: false
      heading_level: 2

## Tipos

::: pydoll.protocol.input.types
    options:
      show_root_heading: true
      show_source: false
      heading_level: 2

================================================
FILE: docs/pt/api/protocol/network.md
================================================
# Protocolo Network

Domínio de comandos, eventos e tipos para o Chrome DevTools Protocol.

## Métodos

::: pydoll.protocol.network.methods
    options:
      show_root_heading: false
      show_source: false
      heading_level: 2

## Eventos

::: pydoll.protocol.network.events
    options:
      show_root_heading: false
      show_source: false
      heading_level: 2

## Tipos

::: pydoll.protocol.network.types
    options:
      show_root_heading: false
      show_source: false
      heading_level: 2

================================================
FILE: docs/pt/api/protocol/page.md
================================================
# Protocolo Page

Domínio de comandos, eventos e tipos para o Chrome DevTools Protocol.

## Métodos

::: pydoll.protocol.page.methods
    options:
      show_root_heading: true
      show_source: false
      heading_level: 2

## Eventos

::: pydoll.protocol.page.events
    options:
      show_root_heading: true
      show_source: false
      heading_level: 2

## Tipos

::: pydoll.protocol.page.types
    options:
      show_root_heading: true
      show_source: false
      heading_level: 2

================================================
FILE: docs/pt/api/protocol/runtime.md
================================================
# Protocolo Runtime

Domínio de comandos, eventos e tipos para o Chrome DevTools Protocol.

## Métodos

::: pydoll.protocol.runtime.methods
    options:
      show_root_heading: true
      show_source: false
      heading_level: 2

## Eventos

::: pydoll.protocol.runtime.events
    options:
      show_root_heading: true
      show_source: false
      heading_level: 2

## Tipos

::: pydoll.protocol.runtime.types
    options:
      show_root_heading: true
      show_source: false
      heading_level: 2

================================================
FILE: docs/pt/api/protocol/storage.md
================================================
# Protocolo Storage

Domínio de comandos, eventos e tipos para o Chrome DevTools Protocol.

## Métodos

::: pydoll.protocol.storage.methods
    options:
      show_root_heading: true
      show_source: false
      heading_level: 2

## Eventos

::: pydoll.protocol.storage.events
    options:
      show_root_heading: true
      show_source: false
      heading_level: 2

## Tipos

::: pydoll.protocol.storage.types
    options:
      show_root_heading: true
      show_source: false
      heading_level: 2

================================================
FILE: docs/pt/api/protocol/target.md
================================================
# Protocolo Target

Comandos, eventos e tipos do domínio Target do Chrome DevTools Protocol.

## Métodos

::: pydoll.protocol.target.methods
    options:
      show_root_heading: true
      show_source: false
      heading_level: 2

## Eventos

::: pydoll.protocol.target.events
    options:
      show_root_heading: true
      show_source: false
      heading_level: 2

## Tipos

::: pydoll.protocol.target.types
    options:
      show_root_heading: true
      show_source: false
      heading_level: 2

================================================
FILE: docs/pt/deep-dive/architecture/browser-domain.md
================================================
# Arquitetura do Domínio do Navegador

O domínio do Navegador (Browser) representa o nível mais alto da hierarquia de automação do Pydoll, gerenciando o ciclo de vida do processo do navegador, conexões CDP, isolamento de contexto e operações globais do navegador. Este documento explora a arquitetura interna, as decisões de design e a implementação técnica do controle em nível de navegador.

!!! info "Guia de Uso Prático"
    Para exemplos práticos e padrões de uso, consulte os guias [Gerenciamento do Navegador](../features/browser-management/tabs.md) e [Contextos do Navegador](../features/browser-management/contexts.md).

## Visão Geral da Arquitetura

O domínio do Navegador situa-se na interseção do gerenciamento de processos, comunicação de protocolo e coordenação de recursos. Ele orquestra múltiplos componentes especializados para fornecer uma interface unificada para a automação do navegador:

```mermaid
graph LR
    Browser["Instância do Navegador"]
    Browser --> ProcessManager["Gerenciador de Processo"]
    Browser --> ProxyManager["Gerenciador de Proxy"]
    Browser --> TempDirManager["Gerenciador de Diretório Temporário"]
    Browser --> TabRegistry["Registro de Abas"]
    Browser --> ConnectionHandler["Manipulador de Conexão"]
    
    ProcessManager --> |Gerencia| BrowserProcess["Processo do Navegador"]
    ConnectionHandler <--> |WebSocket| CDP["Chrome DevTools Protocol"]
    TabRegistry --> |Gerencia| Tabs["Instâncias de Abas"]
    CDP <--> BrowserProcess
```

### Hierarquia e Abstração

O domínio do Navegador é implementado como uma **classe base abstrata** (abstract base class) que define o contrato para todas as implementações de navegador:

```python
class Browser(ABC):
    """Classe base abstrata para automação de navegador via CDP."""
    
    @abstractmethod
    def _get_default_binary_location(self) -> str:
        """Subclasses devem fornecer o caminho do executável específico do navegador."""
        pass
    
    async def start(self, headless: bool = False) -> Tab:
        """Implementação concreta compartilhada por todos os navegadores."""
        # 1. Resolver localização do binário
        # 2. Configurar diretório de dados do usuário
        # 3. Iniciar processo do navegador
        # 4. Verificar conexão CDP
        # 5. Configurar proxy (se necessário)
        # 6. Retornar aba inicial
```

Este design permite **polimorfismo** - Chrome, Edge e outros navegadores baseados em Chromium compartilham 99% de seu código, diferindo apenas nos caminhos dos executáveis e pequenas variações de flags.

## Arquitetura de Componentes

A classe Browser coordena vários gerenciadores especializados, cada um responsável por um aspecto específico da automação do navegador. Entender esses componentes é fundamental para entender o design do Pydoll.

### Manipulador de Conexão (Connection Handler)

O ConnectionHandler é a **ponte de comunicação** entre o Pydoll e o processo do navegador. Ele gerencia:

- **Ciclo de vida do WebSocket**: Estabelecimento da conexão, keep-alive, reconexão
- **Execução de comandos**: Envio de comandos CDP e aguardo de respostas
- **Despacho de eventos**: Roteamento de eventos CDP para callbacks registrados
- **Registro de callbacks**: Manutenção de ouvintes de eventos por conexão

```python
class Browser:
    def __init__(self, ...):
        # ConnectionHandler é inicializado com a porta ou endereço WebSocket
        self._connection_handler = ConnectionHandler(self._connection_port)
    
    async def _execute_command(self, command, timeout=10):
        """Todos os comandos CDP fluem através do manipulador de conexão."""
        return await self._connection_handler.execute_command(command, timeout)
```

!!! info "Análise Profunda da Camada de Conexão"
    Para informações detalhadas sobre comunicação WebSocket, fluxo de comando/resposta e padrões assíncronos, consulte [Arquitetura da Camada de Conexão](./connection-layer.md).

### Gerenciador de Processo (Process Manager)

O BrowserProcessManager lida com o **ciclo de vida do processo do sistema operacional**:

```python
class BrowserProcessManager:
    def start_browser_process(self, binary, port, arguments):
        """
        1. Constrói a linha de comando com caminho do binário + argumentos
        2. Inicia o subprocesso com manipulação adequada de stdio
        3. Monitora a inicialização do processo
        4. Armazena o handle do processo para terminação posterior
        """
        
    def stop_process(self):
        """
        1. Tenta terminação graciosa (SIGTERM)
        2. Aguarda a saída do processo
        3. Mata forçadamente se o tempo limite for excedido (SIGKILL)
        4. Limpa os recursos do processo
        """
```

**Por que separar o gerenciamento de processos?**

- **Testabilidade**: O gerenciador de processos pode ser mockado para testes unitários
- **Multiplataforma**: Encapsula o manuseio de processos específico do SO
- **Confiabilidade**: Lida com casos extremos como processos zumbis, filhos órfãos

### Registro de Abas (Tab Registry)

O Navegador mantém um **registro de instâncias de Abas** (Tab) para garantir o comportamento singleton por alvo (target):

```python
class Browser:
    def __init__(self, ...):
        self._tabs_opened: dict[str, Tab] = {}
    
    async def new_tab(self, url='', browser_context_id=None) -> Tab:
        # Criar alvo via CDP
        response = await self._execute_command(
            TargetCommands.create_target(browser_context_id=browser_context_id)
        )
        target_id = response['result']['targetId']
        
        # Verificar se a aba já existe no registro
        if target_id in self._tabs_opened:
            return self._tabs_opened[target_id]
        
        # Criar nova instância de Aba e registrá-la
        tab = Tab(self, target_id=target_id, ...)
        self._tabs_opened[target_id] = tab
        return tab
```

**Por que instâncias de Aba singleton?**

- **Consistência de estado**: Múltiplas referências à mesma aba compartilham estado (domínios habilitados, callbacks)
- **Eficiência de memória**: Evita instâncias duplicadas de Aba para o mesmo alvo
- **Roteamento de eventos**: Garante que os eventos sejam roteados para a instância de Aba correta

### Arquitetura de Autenticação de Proxy

O Pydoll implementa **autenticação automática de proxy** através do domínio Fetch para evitar a exposição de credenciais em comandos CDP. A implementação usa **dois mecanismos distintos** dependendo do escopo do proxy:

#### Mecanismo 1: Autenticação de Proxy em Nível de Navegador (Proxy Global)

Quando um proxy é configurado via `ChromiumOptions` (aplica-se a todas as abas no contexto padrão):

```python
# Em Browser.start() -> _configure_proxy()
async def _configure_proxy(self, private_proxy, proxy_credentials):
    # Habilitar Fetch EM NÍVEL DE NAVEGADOR
    await self.enable_fetch_events(handle_auth_requests=True)
    
    # Registrar callbacks EM NÍVEL DE NAVEGADOR (afeta TODAS as abas)
    await self.on(FetchEvent.REQUEST_PAUSED, self._continue_request_callback, temporary=True)
    await self.on(FetchEvent.AUTH_REQUIRED, 
                  partial(self._continue_request_with_auth_callback,
                          proxy_username=proxy_credentials[0],
                          proxy_password=proxy_credentials[1]),
                  temporary=True)
```

**Escopo:** Conexão WebSocket em nível de navegador → afeta **todas as abas no contexto padrão**

#### Mecanismo 2: Autenticação de Proxy em Nível de Aba (Proxy por Contexto)

Quando um proxy é configurado por contexto via `create_browser_context(proxy_server=...)`:

```python
# Armazenar credenciais por contexto
async def create_browser_context(self, proxy_server, ...):
    sanitized_proxy, extracted_auth = self._sanitize_proxy_and_extract_auth(proxy_server)
    
    response = await self._execute_command(
        TargetCommands.create_browser_context(proxy_server=sanitized_proxy)
    )
    context_id = response['result']['browserContextId']
    
    if extracted_auth:
        self._context_proxy_auth[context_id] = extracted_auth  # Armazena por contexto
    
    return context_id

# Configurar autenticação para CADA aba nesse contexto
async def _setup_context_proxy_auth_for_tab(self, tab, browser_context_id):
    creds = self._context_proxy_auth.get(browser_context_id)
    if not creds:
        return
    
    # Habilitar Fetch NA ABA (WebSocket em nível de aba)
    await tab.enable_fetch_events(handle_auth=True)
    
    # Registrar callbacks NA ABA (afeta apenas esta aba)
    await tab.on(FetchEvent.REQUEST_PAUSED, 
                 partial(self._tab_continue_request_callback, tab=tab), 
                 temporary=True)
    await tab.on(FetchEvent.AUTH_REQUIRED,
                 partial(self._tab_continue_request_with_auth_callback,
                         tab=tab,
                         proxy_username=creds[0],
                         proxy_password=creds[1]),
                 temporary=True)
```

**Escopo:** Conexão WebSocket em nível de aba → afeta **apenas aquela aba específica**

#### Por Que Dois Mecanismos?

| Aspecto | Nível do Navegador | Nível da Aba |
|--------|---------------|-----------|
| **Gatilho** | Proxy em `ChromiumOptions` | Proxy em `create_browser_context()` |
| **WebSocket** | Conexão em nível de navegador | Conexão em nível de aba |
| **Escopo** | Todas as abas no contexto padrão | Apenas abas naquele contexto |
| **Eficiência** | Um ouvinte para todas as abas | Um ouvinte por aba |
| **Isolamento** | Sem separação de contexto | Cada contexto tem credenciais diferentes |

**Justificativa de design para autenticação em nível de aba:**

- **Isolamento de contexto**: Cada contexto pode ter um **proxy diferente** com **credenciais diferentes**
- **Limitação do CDP**: O domínio Fetch não pode ser escopado para um contexto específico no nível do navegador
- **Tradeoff**: Ligeiramente menos eficiente (um ouvinte por aba), mas necessário para suporte a proxy por contexto

Esta arquitetura garante que as **credenciais nunca apareçam nos logs do CDP** e que a autenticação seja tratada de forma transparente.

!!! warning "Efeitos Colaterais do Domínio Fetch"
    - **Fetch em Nível de Navegador**: Pausa temporariamente **todas as requisições em todas as abas** no contexto padrão até que a autenticação seja concluída
    - **Fetch em Nível de Aba**: Pausa temporariamente **todas as requisições naquela aba específica** até que a autenticação seja concluída
    
    Esta é uma limitação do CDP - o Fetch habilita a interceptação de requisições. Após a conclusão da autenticação, o Fetch é desabilitado para minimizar a sobrecarga.

## Inicialização e Ciclo de Vida

### Design do Construtor

O construtor do Navegador inicializa todos os componentes internos, mas **não inicia o processo do navegador**. Essa separação permite a configuração antes do lançamento:

```python
class Browser(ABC):
    def __init__(
        self,
        options_manager: BrowserOptionsManager,
        connection_port: Optional[int] = None,
    ):
        # 1. Validar parâmetros
        self._validate_connection_port(connection_port)
        
        # 2. Inicializar opções via gerenciador
        self.options = options_manager.initialize_options()
        
        # 3. Determinar porta CDP (aleatória se não especificada)
        self._connection_port = connection_port or randint(9223, 9322)
        
        # 4. Inicializar gerenciadores especializados
        self._proxy_manager = ProxyManager(self.options)
        self._browser_process_manager = BrowserProcessManager()
        self._temp_directory_manager = TempDirectoryManager()
        self._connection_handler = ConnectionHandler(self._connection_port)
        
        # 5. Inicializar rastreamento de estado
        self._tabs_opened: dict[str, Tab] = {}
        self._context_proxy_auth: dict[str, tuple[str, str]] = {}
        self._ws_address: Optional[str] = None
```

**Principais decisões de design:**

- **Início tardio do processo**: Construtor é síncrono; `start()` é assíncrono
- **Flexibilidade de porta**: Porta aleatória previne colisões em automação paralela
- **Padrão de gerenciador de opções**: Padrão Strategy para configuração específica do navegador
- **Composição de componentes**: Gerenciadores especializados em vez de classe monolítica

### Sequência de Início (Start)

O método `start()` orquestra o lançamento e conexão do navegador:

```python
async def start(self, headless: bool = False) -> Tab:
    # 1. Resolver localização do binário
    binary_location = self.options.binary_location or self._get_default_binary_location()
    
    # 2. Configurar diretório de dados do usuário (temporário ou persistente)
    self._setup_user_dir()
    
    # 3. Extrair credenciais do proxy (se proxy privado)
    proxy_config = self._proxy_manager.get_proxy_credentials()
    
    # 4. Iniciar processo do navegador com argumentos
    self._browser_process_manager.start_browser_process(
        binary_location, self._connection_port, self.options.arguments
    )
    
    # 5. Verificar se o endpoint CDP está responsivo
    await self._verify_browser_running()
    
    # 6. Configurar autenticação de proxy (via domínio Fetch)
    await self._configure_proxy(proxy_config[0], proxy_config[1])
    
    # 7. Obter primeiro alvo válido e criar Aba
    valid_tab_id = await self._get_valid_tab_id(await self.get_targets())
    tab = Tab(self, target_id=valid_tab_id, connection_port=self._connection_port)
    self._tabs_opened[valid_tab_id] = tab
    
    return tab
```

!!! tip "Por que start() Retorna uma Aba"
    Este é um **compromisso de design** em prol da ergonomia. Idealmente, `start()` apenas iniciaria o navegador, e os usuários chamariam `new_tab()` separadamente. No entanto, retornar a aba inicial reduz o código boilerplate em cerca de 90% dos casos de uso (automação de aba única). O tradeoff: a aba inicial não pode ser evitada, mesmo em cenários de múltiplas abas.

### Protocolo de Gerenciador de Contexto

O Navegador implementa `__aenter__` e `__aexit__` para limpeza automática:

```python
async def __aexit__(self, exc_type, exc_val, exc_tb):
    # 1. Restaurar preferências de backup (se modificadas)
    if self._backup_preferences_dir:
        shutil.copy2(self._backup_preferences_dir, ...)
    
    # 2. Verificar se o navegador ainda está em execução
    if await self._is_browser_running(timeout=2):
        await self.stop()
    
    # 3. Fechar conexão WebSocket
    await self._connection_handler.close()
```

Isso garante uma limpeza adequada mesmo se ocorrerem exceções durante a automação.

## Arquitetura de Contexto do Navegador

Contextos de navegador são o mecanismo de isolamento mais sofisticado do Pydoll, fornecendo **separação completa do ambiente de navegação** dentro de um único processo de navegador. Entender sua arquitetura é essencial para automação avançada.

### Hierarquia CDP: Navegador, Contexto, Alvo

O CDP organiza a estrutura do navegador em três níveis:

```mermaid
graph TB
    Browser[Processo do Navegador]
    Browser --> DefaultContext[Contexto de Navegador Padrao]
    Browser --> Context1[Contexto de Navegador ID: abc-123]
    Browser --> Context2[Contexto de Navegador ID: def-456]
    
    DefaultContext --> Target1[Alvo/Pagina ID: page-1]
    DefaultContext --> Target2[Alvo/Pagina ID: page-2]
    
    Context1 --> Target3[Alvo/Pagina ID: page-3]
    
    Context2 --> Target4[Alvo/Pagina ID: page-4]
    Context2 --> Target5[Alvo/Pagina ID: page-5]
```

**Conceitos-chave:**

1.  **Processo do Navegador**: Única instância do Chromium com um endpoint CDP
2.  **Contexto do Navegador (BrowserContext)**: Limite isolado de armazenamento/cache/permissão (semelhante ao modo anônimo)
3.  **Alvo (Target)**: Página individual, popup, worker ou alvo de background

### Limites de Isolamento de Contexto

Cada contexto de navegador mantém **isolamento estrito** para:

| Recurso | Nível de Isolamento | Implementação |
|----------|----------------|----------------|
| Cookies | Completo | Repositório de cookies (*cookie jar*) separado por contexto |
| localStorage | Completo | Armazenamento separado por origem por contexto |
| IndexedDB | Completo | Banco de dados separado por origem por contexto |
| Cache | Completo | Cache HTTP independente por contexto |
| Permissões | Completo | Concessões de permissão específicas do contexto |
| Proxy de rede | Completo | Configuração de proxy por contexto |
| Autenticação | Completo | Estado de autenticação independente por contexto |

!!! info "Por Que Contextos São Leves"
    Ao contrário de iniciar múltiplos processos de navegador, os contextos compartilham o **mecanismo de renderização, processo de GPU e pilha de rede**. Apenas armazenamento e estado são isolados. Isso torna os contextos 10-100x mais rápidos de criar do que novas instâncias de navegador.

### Criação de Contexto e Vinculação de Alvo

Criar um contexto e um alvo envolve dois comandos CDP:

```python
# Passo 1: Criar contexto de navegação isolado
response = await self._execute_command(
    TargetCommands.create_browser_context(
        proxy_server='http://proxy.example.com:8080',
        proxy_bypass_list='localhost,127.0.0.1'
    )
)
context_id = response['result']['browserContextId']

# Passo 2: Criar alvo (página) dentro desse contexto
response = await self._execute_command(
    TargetCommands.create_target(
        browser_context_id=context_id  # Vincula o alvo ao contexto
    )
)
target_id = response['result']['targetId']
```

**Detalhe crítico:** O parâmetro `browser_context_id` **vincula o alvo ao limite de isolamento do contexto**. Sem ele, o alvo é criado no contexto padrão.

### Materialização de Janela no Modo Headed (com interface gráfica)

No **modo headed** (UI visível), os contextos do navegador têm uma restrição física importante:

-   Um contexto inicialmente existe apenas **em memória** (sem janela)
-   O **primeiro alvo** criado em um contexto **deve** abrir uma janela de nível superior
-   **Alvos subsequentes** podem abrir como abas dentro dessa janela

Esta é uma **limitação do CDP/Chromium**, não uma escolha de design do Pydoll:

```python
# Primeiro alvo no contexto: DEVE criar janela
tab1 = await browser.new_tab(browser_context_id=context_id)  # Abre nova janela

# Alvos subsequentes: PODEM abrir como abas na janela existente
tab2 = await browser.new_tab(browser_context_id=context_id)  # Abre como aba
```

**Por que isso importa?**

-   No **modo headless**: Completamente irrelevante (sem janelas renderizadas)
-   No **modo headed**: O primeiro alvo por contexto abrirá uma janela visível
-   Em **ambientes de teste**: Múltiplos contextos → múltiplas janelas (pode ser confuso)

!!! tip "Contextos Headless São Mais Limpos"
    Para CI/CD, scraping ou automação em lote, use o modo headless. O isolamento de contexto funciona identicamente, mas sem a sobrecarga de materialização de janela.

### Exclusão e Limpeza de Contexto

Excluir um contexto **fecha imediatamente todos os alvos** dentro dele:

```python
await browser.delete_browser_context(context_id)
# Todas as abas neste contexto agora estão fechadas
# Todo o armazenamento para este contexto é limpo
# O contexto não pode ser reutilizado (ID é inválido)
```

**Sequência de limpeza:**

1.  Pydoll envia o comando CDP `Target.disposeBrowserContext`
2.  Navegador fecha todos os alvos naquele contexto
3.  Navegador limpa todo o armazenamento para aquele contexto
4.  Navegador invalida o ID do contexto
5.  Pydoll remove o contexto dos registros internos

## Sistema de Eventos em Nível de Navegador

O domínio do Navegador suporta **ouvintes de eventos em todo o navegador** que operam em todas as abas e contextos. Isso é distinto dos eventos em nível de aba.

### Escopo de Evento Navegador vs. Aba

```python
# Evento em nível de navegador: aplica-se a TODAS as abas
await browser.on('Target.targetCreated', handle_new_target)

# Evento em nível de aba: aplica-se a UMA aba
await tab.on('Page.loadEventFired', handle_page_load)
```

**Diferença arquitetural:**

-   **Eventos do navegador** usam a **conexão WebSocket em nível de navegador** (baseada em porta ou `ws://host/devtools/browser/...`)
-   **Eventos de aba** usam **conexões WebSocket em nível de aba** (`ws://host/devtools/page/<target_id>`)

### Domínio Fetch: Interceptação Global de Requisições

O domínio Fetch pode ser habilitado nos níveis de **navegador e aba**, com escopos diferentes:

```python
# Fetch em nível de navegador: intercepta requisições para TODAS as abas
await browser.enable_fetch_events(handle_auth_requests=True)
await browser.on('Fetch.requestPaused', handle_request)

# Fetch em nível de aba: intercepta requisições para UMA aba
await tab.enable_fetch_events(handle_auth_requests=True)
await tab.on('Fetch.requestPaused', handle_request)
```

**Quando usar cada um:**

| Caso de Uso | Nível | Razão |
|----------|-------|--------|
| Autenticação de proxy | Navegador | Aplica-se a todas as abas do contexto padrão |
| Bloqueio de anúncios | Navegador | Bloquear anúncios em todas as abas |
| Mocking de API | Aba | Mockar API específica para teste específico |
| Log de requisições | Aba | Registrar apenas requisições da aba relevante |

!!! warning "Impacto de Performance do Fetch"
    Habilitar o Fetch no nível do navegador **pausa todas as requisições** em todas as abas até que os callbacks sejam executados. Isso adiciona latência a cada requisição. Use o Fetch em nível de aba quando possível para minimizar o impacto.

### Roteamento de Comandos

Todos os comandos CDP fluem através do manipulador de conexão do Navegador:

```python
async def _execute_command(self, command, timeout=10):
    """
    Roteia o comando para a conexão apropriada:
    - Comandos em nível de navegador → WebSocket do navegador
    - Comandos em nível de aba → delegados para a instância da Aba
    """
    return await self._connection_handler.execute_command(command, timeout)
```

Este roteamento centralizado permite:

-   **Correlação requisição/resposta**: Corresponder respostas a requisições via ID
-   **Gerenciamento de timeout**: Cancelar comandos que excedem o tempo limite
-   **Tratamento de erros**: Converter erros CDP em exceções Python

## Gerenciamento de Recursos

### Operações de Cookies e Armazenamento

O domínio do Navegador expõe operações de armazenamento **em todo o navegador** e **específicas do contexto**:

```python
# Operações em nível de navegador (todos os contextos)
await browser.set_cookies(cookies)
await browser.get_cookies()
await browser.delete_all_cookies()

# Operações específicas do contexto
await browser.set_cookies(cookies, browser_context_id=context_id)
await browser.get_cookies(browser_context_id=context_id)
await browser.delete_all_cookies(browser_context_id=context_id)
```

Essas operações usam o **domínio Storage** internamente:

-   `Storage.getCookies`: Recupera cookies para o contexto ou todos os contextos
-   `Storage.setCookies`: Define cookies com domínio/caminho/validade
-   `Storage.clearCookies`: Limpa cookies para o contexto ou todos os contextos

!!! info "Escopo de Armazenamento Navegador vs. Aba"
    - **Nível do Navegador**: Opera no navegador inteiro ou contexto específico
    - **Nível da Aba**: Escopado para a origem atual da aba
    
    Use o nível do navegador para gerenciamento global de cookies (ex: definir cookies de sessão para todos os domínios). Use o nível da aba para operações específicas da origem (ex: limpar cookies após logout).

### Concessões de Permissão

O domínio do Navegador fornece **controle programático de permissões**, contornando os prompts do navegador:

```python
await browser.grant_permissions(
    [PermissionType.GEOLOCATION, PermissionType.NOTIFICATIONS],
    origin='https://example.com',
    browser_context_id=context_id
)
```

**Arquitetura:**

-   Permissões são concedidas via comando CDP `Browser.grantPermissions`
-   Permissões são **específicas do contexto** (isoladas por contexto)
-   Concessões sobrescrevem o comportamento padrão de prompt
-   `reset_permissions()` reverte para o comportamento padrão

### Gerenciamento de Download

O comportamento de download é configurado através do comando `Browser.setDownloadBehavior`:

```python
await browser.set_download_behavior(
    behavior=DownloadBehavior.ALLOW,
    download_path='/path/to/downloads',
    events_enabled=True,  # Emitir eventos de progresso de download
    browser_context_id=context_id
)
```

**Opções:**

-   `ALLOW`: Salvar no caminho especificado
-   `DENY`: Cancelar todos os downloads
-   `DEFAULT`: Mostrar UI de download padrão do navegador

### Gerenciamento de Janela

Operações de janela aplicam-se à **janela física do SO** de um alvo:

```python
window_id = await browser.get_window_id_for_target(target_id)
await browser.set_window_bounds({
    'left': 100, 'top': 100,
    'width': 1920, 'height': 1080,
    'windowState': 'normal'  # ou 'minimized', 'maximized', 'fullscreen'
})
```

**Detalhes da implementação:**

-   Usa `Browser.getWindowForTarget` para resolver o ID da janela a partir do ID do alvo
-   `Browser.setWindowBounds` modifica a geometria da janela
-   **Modo headless**: Operações de janela são no-ops (não existem janelas físicas)

## Insights Arquiteturais e Tradeoffs de Design

### Registro Singleton de Abas: Por quê?

O padrão de registro de abas (`_tabs_opened: dict[str, Tab]`) garante que:

1.  **Roteamento de eventos funcione corretamente**: Eventos CDP contêm um `targetId`, mas nenhuma referência de Aba. O registro mapeia `targetId` → `Tab` para o despacho correto do callback.
2.  **Consistência de estado**: Múltiplos caminhos de código que referenciam o mesmo alvo obtêm a **mesma instância de Aba**, prevenindo divergência de estado.
3.  **Eficiência de memória**: Sem o registro, `get_opened_tabs()` criaria instâncias duplicadas de Aba a cada chamada.

**Tradeoff:** O uso de memória cresce com a contagem de abas, mas isso é inevitável para instâncias de Aba com estado (stateful).

### Por que start() Retorna uma Aba

Esta decisão de design sacrifica a pureza pela **ergonomia**:

-   **Desvantagem**: A aba inicial não pode ser evitada, mesmo em automação de múltiplas abas
-   **Vantagem**: 90% dos usuários (scripts de aba única) não precisam de boilerplate:

```python
# Com start() retornando Aba
tab = await browser.start()

# Sem (design puro)
await browser.start()
tab = await browser.new_tab()
```

**Alternativa explorada:** Fechar automaticamente a aba inicial em `new_tab()`. Rejeitada porque é um comportamento surpreendente (efeitos colaterais implícitos).

### Autenticação de Proxy: Tradeoff da Arquitetura de Dois Níveis

A autenticação de proxy do Pydoll usa duas estratégias diferentes do domínio Fetch:

**Nível do Navegador (Proxy Global):**
-   **Benefício de segurança**: Credenciais nunca registradas em logs CDP
-   **Custo de performance**: Fetch pausa **todas as requisições em todas as abas** até que a autenticação seja concluída
-   **Eficiência**: Único ouvinte para todas as abas no contexto padrão
-   **Mitigação**: Fetch é desabilitado após a primeira autenticação, minimizando a sobrecarga

**Nível da Aba (Proxy por Contexto):**
-   **Benefício de segurança**: Credenciais nunca registradas em logs CDP
-   **Custo de performance**: Fetch pausa **todas as requisições naquela aba** até que a autenticação seja concluída
-   **Eficiência**: Ouvinte separado por aba (menos eficiente, mas necessário para isolamento)
-   **Benefício de isolamento**: Cada contexto pode ter credenciais de proxy diferentes
-   **Mitigação**: Fetch é desabilitado após a primeira autenticação por aba

**Por que não usar `Browser.setProxyAuth`?** Este comando CDP não existe. Fetch é o único mecanismo para autenticação programática.

**Por que em nível de aba para contextos?** O domínio Fetch do CDP não pode ser escopado para um BrowserContext específico. Como cada contexto pode ter um proxy diferente com credenciais diferentes, o Pydoll deve lidar com a autenticação no nível da aba para respeitar os limites do contexto.

### Estratégia de Randomização de Porta

Portas CDP aleatórias (9223-9322) previnem colisões ao executar instâncias paralelas de navegador:

```python
self._connection_port = connection_port or randint(9223, 9322)
```

**Por que não incrementar a partir de 9222?**

-   Condições de corrida em ambientes multiprocesso (ex: pytest-xdist)
-   Colisão com a seleção manual de porta do usuário

**Tradeoff:** Portas aleatórias são mais difíceis de depurar (não podem ser hardcoded). Solução: `browser._connection_port` expõe a porta escolhida.

### Separação de Componentes: Por que Gerenciadores?

A classe Browser delega para gerenciadores especializados (ProcessManager, ProxyManager, TempDirManager, ConnectionHandler) para:

1.  **Testabilidade**: Gerenciadores podem ser mockados independentemente
2.  **Reusabilidade**: Lógica do ProxyManager compartilhada entre implementações do Browser
3.  **Manutenibilidade**: Cada gerenciador tem responsabilidade única
4.  **Multiplataforma**: Lógica específica do SO isolada no ProcessManager

**Tradeoff:** Mais indireção, mas organização de código significativamente melhor em escala.

## Principais Tópicos

1.  **Navegador é um coordenador**, não um monolito. Ele orquestra gerenciadores e lida com a comunicação CDP.
2.  **Registro de abas garante instâncias singleton** por alvo, crítico para roteamento de eventos e consistência de estado.
3.  **Contextos de navegador são isolamento leve**, compartilhando o processo do navegador mas separando armazenamento/cache/autenticação.
4.  **Autenticação de proxy via Fetch** é um tradeoff de segurança - esconde credenciais mas adiciona latência.
5.  **Sistema de eventos tem dois níveis**: Em todo o navegador e específico da aba, com diferentes conexões WebSocket.
6.  **Separação de componentes** (gerenciadores) melhora a testabilidade e o suporte multiplataforma.

## Documentação Relacionada

Para um entendimento mais profundo dos componentes arquiteturais relacionados:

- **[Camada de Conexão](./connection-layer.md)**: Comunicação WebSocket, fluxo de comando/resposta, padrões assíncronos
- **[Arquitetura de Eventos](./event-architecture.md)**: Despacho de eventos, gerenciamento de callback, habilitação de domínio
- **[Domínio da Aba](./tab-domain.md)**: Operações em nível de aba, navegação de página, localização de elementos
- **[Análise Profunda do CDP](./cdp.md)**: Fundamentos do Chrome DevTools Protocol
- **[Arquitetura de Proxy](./proxy-architecture.md)**: Conceitos e implementação de proxy em nível de rede

Para padrões de uso prático:

- **[Gerenciamento de Abas](../features/browser-management/tabs.md)**: Padrões de automação de múltiplas abas
- **[Contextos do Navegador](../features/browser-management/contexts.md)**: Isolamento de contexto na prática
- **[Configuração de Proxy](../features/configuration/proxy.md)**: Configurando proxies e autenticação

================================================
FILE: docs/pt/deep-dive/architecture/browser-requests-architecture.md
================================================
# Arquitetura de Requisições no Contexto do Navegador

Este documento explora o design arquitetural do sistema de requisições HTTP no contexto do navegador do Pydoll, que permite fazer requisições HTTP que herdam de forma transparente o estado de sessão, os cookies e a autenticação do navegador.

!!! info "Guia Prático Disponível"
    Esta é a análise profunda da arquitetura. Para exemplos práticos e casos de uso, consulte o [Guia de Requisições HTTP](../features/network/http-requests.md).

## Visão Geral da Arquitetura

Requisições no contexto do navegador resolvem um problema fundamental na automação híbrida: manter a continuidade da sessão entre interações de UI e chamadas de API. Abordagens tradicionais exigem a extração manual de cookies e cabeçalhos, criando um acoplamento frágil entre o navegador e o cliente HTTP.

A arquitetura do Pydoll elimina essa complexidade executando requisições HTTP **dentro** do contexto JavaScript do navegador, enquanto aproveita os eventos de rede do CDP para capturar metadados abrangentes que o JavaScript sozinho não pode fornecer.

### Por Que Essa Arquitetura?

| Abordagem Tradicional | Arquitetura Pydoll |
|---------------------|---------------------|
| Cliente HTTP separado (requests, aiohttp) | Execução unificada baseada no navegador |
| Extração e sincronização manual de cookies | Herança automática de cookies |
| Dois estados de sessão separados | Estado de sessão único |
| Manipulação limitada de CORS | Aplicação nativa de CORS do navegador |
| Fluxos de autenticação complexos | Preservação transparente da autenticação |


## Arquitetura de Componentes

O sistema de requisições no contexto do navegador consiste em duas classes principais que trabalham juntas com o sistema de eventos do Pydoll:

```mermaid
classDiagram
    class Tab {
        +request: Request
        +enable_network_events()
        +disable_network_events()
        +get_network_response_body()
        +on(event_name, callback)
        +clear_callbacks()
    }
    
    class Request {
        -tab: Tab
        -_network_events_enabled: bool
        -_requests_sent: list
        -_requests_received: list
        +get(url, params, kwargs)
        +post(url, data, json, kwargs)
        +put(url, data, json, kwargs)
        +patch(url, data, json, kwargs)
        +delete(url, kwargs)
        +head(url, kwargs)
        +options(url, kwargs)
        -_execute_fetch_request()
        -_register_callbacks()
        -_extract_headers()
        -_extract_cookies()
    }
    
    class Response {
        -_status_code: int
        -_content: bytes
        -_text: str
        -_json: dict
        -_response_headers: list
        -_request_headers: list
        -_cookies: list
        -_url: str
        +ok: bool
        +status_code: int
        +text: str
        +content: bytes
        +url: str
        +headers: list
        +request_headers: list
        +cookies: list
        +json()
        +raise_for_status()
    }
    
    Tab *-- Request
    Request ..> Response : cria
    Request ..> Tab : usa eventos
```

### Classe Request

A classe `Request` serve como a camada de interface, fornecendo uma API familiar semelhante à do `requests` enquanto orquestra a interação complexa entre a execução de JavaScript e o monitoramento de eventos de rede.

**Principais Responsabilidades:**

- Traduzir chamadas de método Python para JavaScript da API Fetch
- Gerenciar ouvintes (listeners) de eventos de rede temporários
- Acumular eventos de rede durante a execução da requisição
- Extrair metadados de eventos CDP
- Construir objetos Response com informações completas

### Classe Response

A classe `Response` fornece uma interface compatível com `requests.Response`, o que torna simples e direta a migração a partir de clientes HTTP tradicionais.

**Principais Características:**

- Múltiplos acessadores de conteúdo (texto, bytes, JSON)
- Análise preguiçosa (*lazy parsing*) de JSON com cache
- Informações abrangentes de cabeçalho (enviados e recebidos)
- Extração de cookies dos cabeçalhos Set-Cookie
- URL final após redirecionamentos

## Fluxo de Execução

A execução da requisição segue um pipeline de seis fases:

```mermaid
flowchart TD
    Start([tab.request.get#40;url#41;]) --> Phase1[<b>1. Preparação</b><br/>Construir URL + opções]
    
    Phase1 --> Phase2[<b>2. Registro de Eventos</b><br/>Habilitar eventos de rede<br/>Registrar callbacks]
    
    Phase2 --> Phase3[<b>3. Execução JavaScript</b><br/>Runtime.evaluate#40;fetch#41;]
    
    Phase3 --> Phase4{<b>4. Atividade de Rede</b>}
    Phase4 -->|Requisição enviada| Event1[REQUEST_WILL_BE_SENT]
    Phase4 -->|Resposta recebida| Event2[RESPONSE_RECEIVED]
    Phase4 -->|Informação extra| Event3[Eventos *_EXTRA_INFO]
    
    Event1 --> Collect[Coletar metadados]
    Event2 --> Collect
    Event3 --> Collect
    
    Collect --> Phase5[<b>5. Construção</b><br/>Extrair cabeçalhos/cookies<br/>Construir objeto Response]
    
    Phase5 --> Phase6[<b>6. Limpeza</b><br/>Limpar callbacks<br/>Desabilitar eventos]
    
    Phase6 --> End([Retornar Response])
```

### Detalhes das Fases

| Fase | Camada | Operações Principais | Assíncrono |
|-------|-------|----------------|--------------|
| **1. Preparação** | Request | Construção de URL, formatação de opções | Não |
| **2. Registro de Eventos** | Tab | Habilitar eventos, registrar callbacks | Sim |
| **3. Execução JavaScript** | CDP/Navegador | Executar fetch() no contexto do navegador | Sim |
| **4. Atividade de Rede** | Navegador/CDP | Requisição HTTP, emitir eventos CDP | Sim (paralelo) |
| **5. Construção** | Request | Analisar eventos, construir Response | Não |
| **6. Limpeza** | Tab | Remover callbacks, desabilitar eventos | Sim |

## Integração com o Sistema de Eventos

Requisições no contexto do navegador são fortemente integradas com a arquitetura do sistema de eventos do Pydoll. Entender essa relação é crucial.

### Ciclo de Vida de Eventos Temporários

```mermaid
stateDiagram-v2
    [*] --> NoEvents: Requisição inicia
    NoEvents --> EventsEnabled: Habilitar eventos de rede
    EventsEnabled --> CallbacksRegistered: Registrar callbacks
    CallbacksRegistered --> ExecutingRequest: Executar fetch
    ExecutingRequest --> CapturingEvents: Eventos disparam
    CapturingEvents --> ExecutingRequest: Mais eventos
    ExecutingRequest --> CleaningUp: Fetch completa
    CleaningUp --> CallbacksRemoved: Limpar callbacks
    CallbacksRemoved --> EventsDisabled: Desabilitar se necessário
    EventsDisabled --> [*]: Requisição completa
```

### Por Que Usar Ambos, JavaScript e Eventos?

Uma pergunta comum: se o JavaScript pode executar a requisição, por que usar eventos de rede?

| Fonte da Informação | JavaScript (API Fetch) | Eventos de Rede (CDP) |
|-------------------|------------------------|----------------------|
| Status da resposta | Disponível | Disponível |
| Corpo da resposta | Disponível | Não disponível |
| Cabeçalhos da resposta | Parcial (restrito por CORS) | Completo |
| Cabeçalhos da requisição | Não acessível | Completo |
| Cabeçalhos Set-Cookie | Ocultos pelo navegador | Disponível |
| Informações de tempo (timing) | Limitadas | Abrangentes |
| Cadeia de redirecionamento | Apenas URL final | Cadeia completa |

**A Solução:** Combinar ambas as fontes para informações completas.

!!! tip "Tecnologias Complementares"
    O JavaScript fornece o corpo da resposta e dispara a requisição no contexto do navegador (com cookies, autenticação). Os eventos de rede fornecem os metadados que as políticas de segurança do JavaScript ocultam.

### Tipos de Eventos de Rede CDP

A arquitetura usa quatro tipos de eventos CDP para capturar metadados completos:

| Evento | Propósito | Informação Chave |
|-------|---------|----------------|
| `REQUEST_WILL_BE_SENT` | Requisição principal de saída | URL, método, cabeçalhos padrão |
| `REQUEST_WILL_BE_SENT_EXTRA_INFO` | Metadados adicionais da requisição | Cookies associados, cabeçalhos brutos |
| `RESPONSE_RECEIVED` | Resposta principal recebida | Status, cabeçalhos, tipo MIME, tempo |
| `RESPONSE_RECEIVED_EXTRA_INFO` | Metadados adicionais da resposta | Cabeçalhos Set-Cookie, informações de segurança |

!!! info "Multiplicidade de Eventos"
    Uma única requisição HTTP gera múltiplos eventos CDP. A classe Request acumula todos os eventos relacionados e extrai informações não duplicadas durante a fase de construção.

## Arquitetura de Cabeçalhos e Cookies

### Estratégia de Extração de Cabeçalhos

Cabeçalhos existem em múltiplos eventos CDP com potencial duplicação. A arquitetura usa uma estratégia de desduplicação:

```mermaid
flowchart TD
    A[Eventos de Rede] --> B{Tipo de Evento}
    B -->|Eventos REQUEST| C[Extrair Cabeçalhos Enviados]
    B -->|Eventos RESPONSE| D[Extrair Cabeçalhos Recebidos]
    
    C --> E[Desduplicar por nome+valor]
    D --> F[Desduplicar por nome+valor]
    
    E --> G[Lista de Cabeçalhos da Requisição]
    F --> H[Lista de Cabeçalhos da Resposta]
    
    G --> I[Objeto Response]
    H --> I
```

**Lógica de Desduplicação:**

1. Eventos são processados em ordem
2. Cada cabeçalho é identificado pela tupla `(nome, valor)`
3. Apenas a primeira ocorrência de cada tupla é mantida
4. Resultado: lista de cabeçalhos única e não redundante

### Arquitetura de Análise de Cookies

Cookies exigem tratamento especial porque vêm dos cabeçalhos `Set-Cookie` nos eventos `RESPONSE_RECEIVED_EXTRA_INFO`:

```mermaid
flowchart TD
    A[RESPONSE_RECEIVED_EXTRA_INFO] --> B[Extrair cabeçalhos Set-Cookie]
    B --> C{Cabeçalho multi-linha?}
    C -->|Sim| D[Dividir por nova linha]
    C -->|Não| E[Analisar cookie único]
    D --> F[Analisar cada linha]
    F --> G[Extrair nome=valor]
    E --> G
    G --> H{Nome válido?}
    H -->|Sim| I[Criar CookieParam]
    H -->|Não| J[Descartar]
    I --> K[Adicionar à lista de cookies]
    K --> L[Desduplicar]
    L --> M[Objeto Response]
```

**Princípios de Extração de Cookies:**

- Apenas eventos `EXTRA_INFO` contêm cabeçalhos `Set-Cookie`
- Atributos de cookie (Path, Domain, Secure, HttpOnly) são ignorados
- O navegador gerencia atributos de cookie internamente
- Apenas pares nome-valor são extraídos para fins informativos

!!! warning "Escopo dos Cookies"
    A propriedade `Response.cookies` contém apenas cookies **novos ou atualizados** desta resposta específica. Cookies existentes do navegador são gerenciados automaticamente e não expostos através desta interface.

## Contexto de Execução JavaScript

A execução da API Fetch acontece no contexto JavaScript do navegador, o que é fundamental para o poder da arquitetura:

### Integração com a API Fetch

A requisição é traduzida para JavaScript:

```javascript
// Representação simplificada
(async () => {
    const response = await fetch(url, {
        method: 'GET',
        headers: {'X-Custom': 'value'},
        // O navegador adiciona automaticamente:
        // - Cabeçalho Cookie
        // - Authorization se definido
        // - Cabeçalhos padrão (User-Agent, Accept, etc.)
    });
    
    return {
        status: response.status,
        url: response.url,  // URL final após redirecionamentos
        text: await response.text(),
        content: new Uint8Array(await response.arrayBuffer()),
        json: response.headers.get('Content-Type')?.includes('application/json')
            ? await response.clone().json()
            : null
    };
})()
```

### Benefícios do Contexto do Navegador

Executar no contexto do navegador fornece:

| Benefício | Descrição |
|---------|-------------|
| **Inclusão Automática de Cookies** | O navegador envia todos os cookies aplicáveis automaticamente |
| **Preservação do Estado de Autenticação** | Cabeçalhos de autenticação mantidos da sessão do navegador |
| **Aplicação de CORS** | O navegador aplica as mesmas políticas CORS das interações do usuário |
| **Manipulação de TLS/SSL** | A validação de certificado e políticas de segurança do navegador se aplicam |
| **Compressão** | Manipulação automática de gzip, br, deflate |
| **Redirecionamentos** | O navegador segue redirecionamentos transparentemente |
| **Mesmo Contexto de Segurança** | A requisição parece idêntica às requisições iniciadas pelo usuário |

!!! info "Detecção Anti-Bot"
    Requisições executadas no contexto do navegador são indistinguíveis de requisições iniciadas pelo usuário, tornando-as eficazes contra sistemas anti-bot que analisam padrões de requisição.

## Considerações de Performance

### Sobrecarga de Eventos

Eventos de rede adicionam sobrecarga à execução da requisição:

| Cenário | Sobrecarga | Recomendação |
|----------|----------|----------------|
| Requisição única | Baixa | Aceitável |
| Múltiplas requisições sequenciais | Moderada | Habilitar eventos uma vez |
| Requisições em massa (100+) | Alta | Considere habilitar eventos no nível da aba |
| Automação de longa duração | Preocupação com memória | Desabilitar quando terminar |

### Padrão de Otimização

```python
# Ineficiente - eventos habilitados/desabilitados repetidamente
for url in urls:
    response = await tab.request.get(url)

# Eficiente - eventos habilitados uma vez
await tab.enable_network_events()
for url in urls:
    response = await tab.request.get(url)
await tab.disable_network_events()
```

!!! tip "Otimização Automática"
    A classe Request verifica se os eventos de rede já estão habilitados e pula operações redundantes de habilitar/desabilitar automaticamente.

### Estratégia de Análise JSON

A análise JSON da resposta usa avaliação preguiçosa (lazy) com cache:

1. Primeira chamada a `response.json()`: Analisa e armazena em cache
2. Chamadas subsequentes: Retorna resultado do cache
3. Se o JSON foi pré-analisado durante a construção: Usa esse

Isso previne sobrecarga de análise redundante.

## Arquitetura de Segurança

### Aplicação da Política CORS

Requisições no contexto do navegador respeitam as políticas CORS:

```mermaid
flowchart TD
    A[tab.request.get&#40;url&#41;] --> B{Mesma Origem?}
    B -->|Sim| C[Requisição Permitida]
    B -->|Não| D{Cabeçalhos CORS Presentes?}
    D -->|Sim| E[Requisição Permitida]
    D -->|Não| F[Requisição Bloqueada]
    
    C --> G[Resposta Retornada]
    E --> G
    F --> H[Erro CORS]
```

**Comportamento do CORS:**

- Requisições para mesma origem: Sempre permitidas
- Requisições cross-origin: Exigem cabeçalhos CORS do servidor
- Respostas opacas: Podem ser bloqueadas pelo navegador

**Solução para problemas de CORS:**

Navegue para o domínio primeiro para estabelecer um contexto de mesma origem:

```python
await tab.go_to('https://different-domain.com')
response = await tab.request.get('https://different-domain.com/api')
```

### Segurança de Cookies

Cookies com flags de segurança (`HttpOnly`, `Secure`, `SameSite`) são manipulados pelo navegador:

- **Cookies HttpOnly**: Enviados automaticamente, mas não expostos ao JavaScript ou CDP
- **Cookies Secure**: Enviados apenas sobre HTTPS
- **Cookies SameSite**: O navegador aplica as políticas SameSite

A propriedade `Response.cookies` pode não mostrar todos os cookies devido a essas restrições de segurança.

### Validação TLS/SSL

O navegador valida certificados SSL. Certificados autoassinados ou inválidos fazem com que as requisições falhem, a menos que a validação seja desabilitada explicitamente nas opções do navegador:

```python
options = ChromiumOptions()
options.add_argument('--ignore-certificate-errors')
browser = Chrome(options=options)
```

!!! warning "Compromisso de Segurança"
    Desabilitar a validação de certificados reduz a segurança. Use apenas em ambientes controlados.

## Limitações e Decisões de Design

### Tamanho do Corpo da Requisição

Corpos de requisição muito grandes (arquivos, grandes conjuntos de dados) estão sujeitos às restrições de memória do JavaScript. Para uploads de arquivos, use `WebElement.set_input_files()` ou o interceptador de seletor de arquivos.

### Manipulação de Resposta Binária

Respostas binárias são convertidas através do `ArrayBuffer` e `Uint8Array` do JavaScript, o que adiciona alguma sobrecarga para respostas muito grandes (>100MB).

### Transparência de Redirecionamento

A API Fetch segue redirecionamentos automaticamente. Apenas a URL final é capturada. Se você precisar da cadeia de redirecionamento, use o monitoramento de rede separadamente.

### Temporização de Eventos

Eventos devem ser registrados **antes** de executar o fetch. A arquitetura garante isso através da fase de registro, mas o manuseio manual de eventos requer uma temporização cuidadosa.

## Princípios Arquiteturais

A arquitetura de requisições no contexto do navegador adere a estes princípios:

1. **Continuidade da Sessão**: Nunca quebrar o estado de sessão do navegador
2. **Sincronização Manual Zero**: Nenhuma extração de cookie/cabeçalho necessária
3. **Informação Completa**: Combinar JavaScript + eventos para metadados completos
4. **Limpeza Automática**: Recursos liberados após cada requisição
5. **Interface Familiar**: API compatível com `requests` para fácil adoção
6. **Consciente de Performance**: Otimizar para casos de uso comuns
7. **Consciente de Segurança**: Respeitar as políticas de segurança do navegador

## Integração com Outros Sistemas

### Dependência do Sistema de Eventos

Requisições no contexto do navegador dependem da arquitetura do sistema de eventos:

- Utiliza `Tab.on()` para registro de callback
- Usa `Tab.clear_callbacks()` para limpeza
- Respeita a habilitação existente de eventos de rede
- Integra-se com o gerenciamento do ciclo de vida dos eventos

Veja [Arquitetura do Sistema de Eventos](event-architecture.md) para detalhes.

### Integração com o Sistema de Tipos

A arquitetura usa o sistema de tipos do Python extensivamente:

- `HeaderEntry` TypedDict para cabeçalhos
- `CookieParam` TypedDict para cookies
- Definições de tipo de evento de `pydoll.protocol.network.events`
- Fornece autocomplete na IDE e segurança de tipos

Veja [Sistema de Tipagem](typing-system.md) para detalhes.

## Leitura Adicional

- **[Guia de Requisições HTTP](../features/network/http-requests.md)** - Exemplos práticos e casos de uso
- **[Arquitetura do Sistema de Eventos](event-architecture.md)** - Design interno do sistema de eventos
- **[Monitoramento de Rede](../features/network/monitoring.md)** - Observação passiva de rede
- **[Interceptação de Requisições](../features/network/interception.md)** - Modificação ativa de requisições
- **[Sistema de Tipagem](typing-system.md)** - Integração do sistema de tipos

## Resumo

A arquitetura de requisições no contexto do navegador do Pydoll alcança comunicação HTTP contínua combinando a execução da API Fetch do JavaScript com o monitoramento de eventos de rede do CDP. Esta abordagem híbrida fornece:

- **Metadados completos** provenientes tanto do JavaScript quanto dos eventos CDP
- **Continuidade automática da sessão** através da execução no contexto do navegador
- **Interface familiar** compatível com a biblioteca requests
- **Otimização de performance** através da reutilização de eventos
- **Conformidade de segurança** com as políticas do navegador

A arquitetura demonstra como a combinação de tecnologias complementares (JavaScript + eventos CDP) pode resolver problemas complexos de forma elegante, fornecendo poder e conveniência sem comprometer a completude ou a segurança.

================================================
FILE: docs/pt/deep-dive/architecture/event-architecture.md
================================================
# Arquitetura do Sistema de Eventos

Este documento explora a arquitetura interna do sistema de eventos do Pydoll, cobrindo comunicação WebSocket, fluxo de eventos, gerenciamento de callbacks e considerações de performance.

!!! info "Guia de Uso Prático"
    Para exemplos práticos e padrões de uso, consulte o [Guia do Sistema de Eventos](../features/advanced/event-system.md).

## Comunicação WebSocket e CDP

No núcleo do sistema de eventos do Pydoll está o Chrome DevTools Protocol (CDP), que fornece uma maneira estruturada de interagir e monitorar atividades do navegador através de conexões WebSocket. Este canal de comunicação bidirecional permite que seu código tanto envie comandos para o navegador quanto receba eventos de volta.

```mermaid
sequenceDiagram
    participant Client as Código Pydoll
    participant Connection as Manipulador de Conexão
    participant WebSocket
    participant Browser as Navegador
    
    Client->>Connection: Registra callback para evento
    Connection->>Connection: Armazena callback no registro
    
    Client->>Connection: Habilita domínio do evento
    Connection->>WebSocket: Envia comando CDP para habilitar domínio
    WebSocket->>Browser: Encaminha comando
    Browser-->>WebSocket: Confirma domínio habilitado
    WebSocket-->>Connection: Encaminha resposta
    Connection-->>Client: Domínio habilitado
    
    Browser->>WebSocket: Evento ocorre, envia mensagem de evento CDP
    WebSocket->>Connection: Encaminha mensagem de evento
    Connection->>Connection: Procura callbacks para este evento
    Connection->>Client: Executa callback registrado
```

### Modelo de Comunicação WebSocket

A conexão WebSocket entre o Pydoll e o navegador segue este padrão:

1.  **Estabelecimento da Conexão**: Quando o navegador inicia, um servidor WebSocket é criado, e o Pydoll estabelece uma conexão com ele
2.  **Mensagens Bidirecionais**: Tanto o Pydoll quanto o navegador podem enviar mensagens a qualquer momento
3.  **Tipos de Mensagem**:
    -   **Comandos**: Enviados do Pydoll para o navegador (ex: navegação, manipulação do DOM)
    -   **Respostas de Comandos**: Enviadas do navegador para o Pydoll em resposta a comandos
    -   **Eventos**: Enviados do navegador para o Pydoll quando algo acontece (ex: carregamento da página, atividade de rede)

### Estrutura do Chrome DevTools Protocol

O CDP organiza sua funcionalidade em domínios, cada um responsável por uma área específica da funcionalidade do navegador:

| Domínio | Responsabilidade | Eventos Típicos |
|--------|----------------|----------------|
| Page | Ciclo de vida da página | Eventos de carregamento, navegação, diálogos |
| Network | Atividade de rede | Monitoramento de requisição/resposta, WebSockets |
| DOM | Estrutura do documento | Mudanças no DOM, modificações de atributos |
| Fetch | Interceptação de requisição | Requisição pausada, autenticação necessária |
| Runtime | Execução JavaScript | Mensagens do console, exceções |
| Browser | Gerenciamento do navegador | Criação de janelas, abas, contextos |

Cada domínio deve ser explicitamente habilitado antes de começar a emitir eventos, o que ajuda a gerenciar a performance processando apenas os eventos que são realmente necessários.

## Arquitetura de Domínio

### O Padrão Habilitar/Desabilitar (Enable/Disable)

O padrão explícito de habilitar/desabilitar atende a vários propósitos arquiteturais importantes:

1.  **Otimização de Performance**: Ao habilitar apenas os domínios nos quais você está interessado, você reduz a sobrecarga (overhead) do processamento de eventos
2.  **Gerenciamento de Recursos**: Alguns domínios de eventos (como monitoramento de Rede ou DOM) podem gerar grandes volumes de eventos que consomem memória
3.  **Conformidade com o Protocolo**: O CDP exige a habilitação explícita do domínio antes que os eventos sejam emitidos
4.  **Limpeza Controlada**: Desabilitar explicitamente os domínios garante uma limpeza adequada quando os eventos não são mais necessários

```mermaid
stateDiagram-v2
    [*] --> Disabled: Estado Inicial
    Disabled --> Enabled: enable_xxx_events()
    Enabled --> Disabled: disable_xxx_events()
    Enabled --> [*]: Aba Fechada
    Disabled --> [*]: Aba Fechada
```

!!! warning "Prevenção de Vazamento de Eventos"
    A falha em desabilitar domínios de eventos quando eles não são mais necessários pode levar a vazamentos de memória e degradação de performance, especialmente em automações de longa duração. Sempre desabilite os domínios de eventos quando terminar de usá-los, particularmente para eventos de alto volume, como monitoramento de rede.

### Métodos de Habilitação Específicos do Domínio

Diferentes domínios são habilitados através de métodos específicos nos objetos apropriados:

| Domínio | Método de Habilitação | Método de Desabilitação | Disponível Em |
|--------|--------------|----------------|--------------|
| Page | `enable_page_events()` | `disable_page_events()` | Aba |
| Network | `enable_network_events()` | `disable_network_events()` | Aba |
| DOM | `enable_dom_events()` | `disable_dom_events()` | Aba |
| Fetch | `enable_fetch_events()` | `disable_fetch_events()` | Aba, Navegador |
| File Chooser | `enable_intercept_file_chooser_dialog()` | `disable_intercept_file_chooser_dialog()` | Aba |

!!! info "Propriedade do Domínio"
    Eventos pertencem a domínios específicos com base em sua funcionalidade. Alguns domínios estão disponíveis apenas em certos níveis - por exemplo, eventos de Página (Page) estão disponíveis na instância da Aba (Tab), mas não diretamente no nível do Navegador (Browser).

## Sistema de Registro de Eventos

### O Método `on()`

O método central para se inscrever (subscribing) em eventos é o método `on()`, disponível tanto nas instâncias de Aba (Tab) quanto de Navegador (Browser):

```python
async def on(
    self, event_name: str, callback: callable, temporary: bool = False
) -> int:
    """
    Registra um ouvinte (listener) de evento.

    Args:
        event_name (str): O nome do evento a ser ouvido.
        callback (callable): A função de callback a ser executada quando o
            evento é disparado.
        temporary (bool): Se True, o callback será removido após ser
            disparado uma vez. O padrão é False.

    Returns:
        int: O ID do callback registrado.
    """
```

Este método retorna um ID de callback que pode ser usado para remover o callback posteriormente, se necessário.

### Registro de Callback

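Internamente, o `ConnectionHandler` (Manipulador de Conexão) mantém um registro de callbacks. Conceitualmente, ele pode ser visualizado agrupado por nome de evento (representação ilustrativa; a estrutura real, indexada por ID de callback, é mostrada na seção "Estrutura Interna"):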

```python
{
    'Page.loadEventFired': [
        (callback_id_1, callback_function_1, temporary=False),
        (callback_id_2, callback_function_2, temporary=True),
    ],
    'Network.requestWillBeSent': [
        (callback_id_3, callback_function_3, temporary=False),
    ]
}
```

Quando um evento chega via WebSocket:

1.  O nome do evento é extraído da mensagem
2.  O registro é consultado por callbacks correspondentes
3.  Cada callback é executado com os dados do evento
4.  Callbacks temporários são removidos após a execução

### Manipulação de Callback Assíncrono

Callbacks podem ser síncronos ou assíncronos. O sistema de eventos lida com ambos:

```python
async def _trigger_callbacks(self, event_name: str, event_data: dict):
    for cb_id, cb_data in self._event_callbacks.items():
        if cb_data['event'] == event_name:
            if asyncio.iscoroutinefunction(cb_data['callback']):
                await cb_data['callback'](event_data)
            else:
                cb_data['callback'](event_data)
```

Callbacks assíncronos são aguardados (awaited) sequencialmente. Isso significa que cada callback é concluído antes que o próximo seja executado, o que é importante para:

-   **Ordem de Execução Previsível**: Callbacks executam na ordem de registro
-   **Tratamento de Erros**: Exceções em um callback não impedem que outros sejam executados
-   **Consistência de Estado**: Callbacks podem confiar em mudanças de estado sequenciais

!!! info "Execução Sequencial vs. Concorrente"
    Callbacks são executados sequencialmente dentro do mesmo evento. No entanto, eventos diferentes podem ser processados concorrentemente, já que o loop de eventos lida com múltiplas conexões simultaneamente.

## Fluxo e Ciclo de Vida do Evento

O ciclo de vida do evento segue estes passos:

```mermaid
flowchart TD
    A[Atividade do Navegador] -->|Gera| B[Evento CDP]
    B -->|Enviado via WebSocket| C[Manipulador de Conexão]
    C -->|Filtra por Nome de Evento| D{Callbacks Registrados?}
    D -->|Sim| E[Processar Evento]
    D -->|Não| F[Descartar Evento]
    E -->|Para Cada Callback| G[Executar Callback]
    G -->|Se Temporário| H[Remover Callback]
    G -->|Se Permanente| I[Manter para Eventos Futuros]
```

### Fluxo Detalhado

1.  **Atividade do Navegador**: Algo acontece no navegador (página carrega, requisição enviada, DOM muda)
2.  **Geração de Evento CDP**: O navegador gera uma mensagem de evento CDP
3.  **Transmissão WebSocket**: A mensagem é enviada pelo WebSocket para o Pydoll
4.  **Recepção do Evento**: O ConnectionHandler recebe o evento
5.  **Busca de Callback**: O ConnectionHandler verifica seu registro por callbacks que correspondem ao nome do evento
6.  **Execução do Callback**: Se callbacks existirem, cada um é executado com os dados do evento
7.  **Remoção Temporária**: Se um callback foi registrado como temporário, ele é removido após a execução

## Eventos em Nível de Navegador vs. Nível de Aba

O sistema de eventos do Pydoll opera tanto no nível do navegador quanto no nível da aba, com distinções importantes:

```mermaid
graph TD
    Browser[Instância do Navegador] -->|"Eventos Globais (ex: eventos de Target)"| BrowserCallbacks[Callbacks de Nível de Navegador]
    Browser -->|"Cria"| Tab1[Instância de Aba 1]
    Browser -->|"Cria"| Tab2[Instância de Aba 2]
    Tab1 -->|"Eventos Específicos da Aba"| Tab1Callbacks[Callbacks da Aba 1]
    Tab2 -->|"Eventos Específicos da Aba"| Tab2Callbacks[Callbacks da Aba 2]
```

### Eventos em Nível de Navegador

Eventos em nível de navegador operam globalmente em todas as abas. Estes são limitados a domínios específicos como:

-   **Eventos de Alvo (Target)**: Criação, destruição, falha (crash) de abas
-   **Eventos do Navegador**: Gerenciamento de janelas, coordenação de downloads

```python
# Registro de evento em nível de navegador
await browser.on('Target.targetCreated', handle_new_target)
```

Os domínios de eventos em nível de navegador são limitados, e tentar usar eventos específicos de abas levantará uma exceção.

### Eventos em Nível de Aba

Eventos em nível de aba são específicos para uma aba individual:

```python
# Cada aba tem seu próprio contexto de evento
tab1 = await browser.start()
tab2 = await browser.new_tab()

await tab1.enable_page_events()
await tab1.on(PageEvent.LOAD_EVENT_FIRED, handle_tab1_load)

await tab2.enable_page_events()
await tab2.on(PageEvent.LOAD_EVENT_FIRED, handle_tab2_load)
```

Esta arquitetura permite:

-   **Manipulação Isolada de Eventos**: Eventos em uma aba não afetam outras
-   **Configuração por Aba**: Abas diferentes podem monitorar tipos de eventos diferentes
-   **Eficiência de Recursos**: Habilite eventos apenas nas abas que precisam deles

!!! info "Escopo Específico do Domínio"
    Nem todos os domínios de eventos estão disponíveis em ambos os níveis:
    
    -   **Eventos Fetch**: Disponíveis tanto no nível do navegador quanto da aba
    -   **Eventos de Página (Page)**: Disponíveis apenas no nível da aba
    -   **Eventos de Alvo (Target)**: Disponíveis apenas no nível do navegador

## Arquitetura de Performance

### Sobrecarga (Overhead) do Sistema de Eventos

O sistema de eventos adiciona sobrecarga (overhead) à automação do navegador, especialmente para eventos de alta frequência:

| Domínio do Evento | Volume Típico de Eventos | Impacto na Performance |
|--------------|---------------------|-------------------|
| Page | Baixo | Mínimo |
| Network | Alto | Moderado a Alto |
| DOM | Muito Alto | Alto |
| Fetch | Moderado | Moderado (maior se estiver interceptando) |

### Estratégias de Otimização de Performance

1.  **Habilitação Seletiva de Domínio**: Apenas habilite domínios de eventos que você está usando ativamente
2.  **Definição Estratégica de Escopo**: Use eventos em nível de navegador apenas para preocupações que sejam verdadeiramente globais
3.  **Desabilitação Oportuna**: Sempre desabilite os domínios de eventos quando terminar de usá-los
4.  **Filtragem Precoce**: Nos callbacks, filtre eventos irrelevantes o mais cedo possível
5.  **Callbacks Temporários**: Use a flag `temporary=True` para eventos de ocorrência única

### Gerenciamento de Memória

O sistema de eventos gerencia a memória através de vários mecanismos:

1.  **Limpeza do Registro de Callbacks**: Remover callbacks libera suas referências
2.  **Auto-Remoção Temporária**: Callbacks temporários são limpos automaticamente
3.  **Desabilitação de Domínio**: Desabilitar um domínio interrompe a geração de eventos
4.  **Fechamento da Aba**: Quando uma aba fecha, todos os seus callbacks são removidos automaticamente

!!! warning "Prevenção de Vazamento de Memória"
    Em automações de longa duração, sempre limpe os callbacks e desabilite os domínios quando terminar. Eventos de alta frequência (especialmente DOM) podem acumular memória significativa se deixados habilitados.

## Arquitetura do Manipulador de Conexão (Connection Handler)

O `ConnectionHandler` é o componente central que gerencia a comunicação WebSocket e o despacho de eventos.

### Principais Responsabilidades

1.  **Gerenciamento de WebSocket**: Estabelecer e manter a conexão WebSocket
2.  **Roteamento de Mensagens**: Distinguir entre respostas de comandos e eventos
3.  **Registro de Callbacks**: Manter o mapeamento de nomes de eventos para callbacks
4.  **Despacho de Eventos**: Executar callbacks registrados quando os eventos chegam
5.  **Limpeza**: Remover callbacks e fechar conexões

### Estrutura Interna

```python
class ConnectionHandler:
    def __init__(self, ...):
        self._events_handler = EventsManager()
        self._websocket = None
        # ... outros atributos
    
    async def register_callback(self, event_name, callback, temporary):
        return self._events_handler.register_callback(event_name, callback, temporary)

class EventsManager:
    def __init__(self):
        self._event_callbacks = {}  # ID do Callback -> dados do callback
        self._callback_id = 0
    
    def register_callback(self, event_name, callback, temporary):
        self._callback_id += 1
        self._event_callbacks[self._callback_id] = {
            'event': event_name,
            'callback': callback,
            'temporary': temporary
        }
        return self._callback_id
    
    async def _trigger_callbacks(self, event_name, event_data):
        callbacks_to_remove = []
        
        for cb_id, cb_data in self._event_callbacks.items():
            if cb_data['event'] == event_name:
                # Executa callback (await se assíncrono, chama diretamente se síncrono)
                if asyncio.iscoroutinefunction(cb_data['callback']):
                    await cb_data['callback'](event_data)
                else:
                    cb_data['callback'](event_data)
                
                # Marca callbacks temporários para remoção
                if cb_data['temporary']:
                    callbacks_to_remove.append(cb_id)
        
        # Remove callbacks temporários após todos os callbacks serem executados
        for cb_id in callbacks_to_remove:
            self.remove_callback(cb_id)
```

Esta arquitetura garante:

-   **Busca Simples**: Cada callback é indexado por seu ID e selecionado pelo nome do evento no momento do despacho
-   **Sobrecarga Mínima**: Apenas eventos registrados são processados
-   **Limpeza Automática**: Callbacks temporários são removidos após a execução
-   **Segurança Assíncrona (Async-safe)**: Operações são seguras em ambientes assíncronos

## Formato da Mensagem de Evento

Eventos CDP seguem um formato de mensagem padronizado:

```json
{
    "method": "Network.requestWillBeSent",
    "params": {
        "requestId": "1234.56",
        "loaderId": "7890.12",
        "documentURL": "https://example.com",
        "request": {
            "url": "https://api.example.com/data",
            "method": "GET",
            "headers": {...}
        },
        "timestamp": 123456.789,
        "wallTime": 1234567890.123,
        "initiator": {...},
        "type": "XHR"
    }
}
```

Componentes principais:

-   **`method`**: O nome do evento no formato `Dominio.nomeDoEvento`
-   **`params`**: Dados específicos do evento, variam por tipo de evento
-   **Sem campo `id`**: Diferente dos comandos, eventos não têm IDs de requisição

O sistema de eventos extrai o campo `method` para rotear para os callbacks apropriados, passando a mensagem inteira para cada callback.

## Coordenação de Eventos Multi-Aba

A arquitetura do Pydoll suporta coordenação sofisticada de eventos multi-aba:

### Contextos de Aba Independentes

Cada aba mantém seus próprios:

-   Estado de habilitação de domínio de evento
-   Registro de callbacks
-   Canal de comunicação de evento
-   Logs de rede (se eventos de rede estiverem habilitados)

!!! info "Arquitetura de Comunicação"
    Cada aba tem seu próprio canal de comunicação de eventos para o navegador. Para detalhes técnicos sobre como conexões WebSocket e IDs de alvo (target) funcionam no nível do protocolo, consulte [Arquitetura do Domínio do Navegador](./browser-domain.md).

### Contexto de Navegador Compartilhado

Múltiplas abas podem compartilhar:

-   Ouvintes de eventos em nível de navegador
-   Armazenamento de cookies
-   Cache
-   Processo do navegador

Esta arquitetura permite:

1.  **Processamento Paralelo de Eventos**: Múltiplas abas podem processar eventos simultaneamente
2.  **Falhas Isoladas**: Problemas em uma aba não afetam outras
3.  **Compartilhamento de Recursos**: Recursos comuns do navegador são compartilhados eficientemente
4.  **Ações Coordenadas**: Eventos em nível de navegador podem coordenar atividades entre abas

## Conclusão

A arquitetura do sistema de eventos do Pydoll é projetada para:

-   **Performance**: Sobrecarga mínima através de habilitação seletiva de domínio e despacho eficiente de callbacks
-   **Flexibilidade**: Suporte para eventos tanto em nível de navegador quanto de aba
-   **Escalabilidade**: Lidar com múltiplas abas com contextos de eventos independentes
-   **Confiabilidade**: Limpeza automática e gerenciamento de memória

Entender esta arquitetura ajuda você a:

-   **Otimizar Performance**: Saber quais domínios têm alta sobrecarga
-   **Depurar Problemas**: Entender o fluxo de eventos quando as coisas não funcionam como esperado
-   **Projetar Automação Melhor**: Alavancar a arquitetura para fluxos de trabalho eficientes orientados a eventos
-   **Evitar Armadilhas**: Prevenir vazamentos de memória e degradação de performance

Para padrões de uso práticos e exemplos, consulte o [Guia do Sistema de Eventos](../features/advanced/event-system.md).

================================================
FILE: docs/pt/deep-dive/architecture/find-elements-mixin.md
================================================
# Arquitetura do Mixin FindElements

O FindElementsMixin representa uma decisão arquitetural crítica no Pydoll: usar **composição sobre herança** para compartilhar capacidades de localização de elementos entre `Tab` e `WebElement` sem acoplá-los através de uma classe base comum. Este documento explora o padrão mixin, sua implementação e a mecânica interna de localização de elementos.

!!! info "Guia de Uso Prático"
    Para exemplos práticos e padrões de uso, consulte o [Guia de Localização de Elementos](../features/automation/element-finding.md) e o [Guia de Seletores](./selectors-guide.md).

## Padrão Mixin: Filosofia de Design

### O que é um Mixin?

Um mixin é uma classe projetada para **fornecer métodos a outras classes** sem ser uma classe base em uma hierarquia de herança tradicional. Diferente da herança padrão (que modela relações "é-um" (is-a)), mixins modelam **capacidades "pode-fazer" (can-do)**.

```python
# Herança tradicional: "é-um" (is-a)
class Animal:
    def breathe(self): ...

class Dog(Animal):  # Dog É-UM Animal
    def bark(self): ...

# Padrão Mixin: "pode-fazer" (can-do)
class FlyableMixin:
    def fly(self): ...

class Bird(Animal, FlyableMixin):  # Bird É-UM Animal, PODE voar
    pass
```

### Por que Mixins em vez de Herança?

O Pydoll enfrenta um desafio arquitetural específico:

- **`Tab`** precisa encontrar elementos no **contexto do documento**
- **`WebElement`** precisa encontrar elementos **relativos a si mesmo** (elementos filhos)
- Ambos precisam de **lógica de seletor idêntica** (CSS, XPath, construção de atributos)

**Opção 1: Classe Base Compartilhada**

```python
class ElementLocator:
    def find(...): ...

class Tab(ElementLocator):
    pass

class WebElement(ElementLocator):
    pass
```

**Problemas:**
- Alto acoplamento: `Tab` e `WebElement` agora compartilham a hierarquia de herança
- Viola a Responsabilidade Única: `Tab` não deveria herdar da mesma classe que `WebElement`
- Difícil de estender: Adicionar novas capacidades requer modificar a classe base

**Opção 2: Padrão Mixin (Abordagem Escolhida)**

```python
class FindElementsMixin:
    def find(...): ...
    def query(...): ...

class Tab(FindElementsMixin):
    # Lógica específica do Tab
    pass

class WebElement(FindElementsMixin):
    # Lógica específica do WebElement
    pass
```

**Benefícios:**

- **Desacoplamento**: `Tab` e `WebElement` permanecem independentes
- **Reutilização**: Mesma lógica de localização de elementos em ambas as classes
- **Componibilidade**: Pode adicionar outros mixins sem conflitos
- **Testabilidade**: O Mixin pode ser testado isoladamente

!!! tip "Características do Mixin"
    1. **Sem Estado (Stateless)**: Mixins não mantêm seu próprio estado (sem `__init__`)
    2. **Injeção de Dependência**: Assume que a classe consumidora fornece dependências (ex: `_connection_handler`)
    3. **Propósito Único**: Cada mixin fornece uma capacidade coesa
    4. **Não Instanciável**: Nunca crie `FindElementsMixin()` diretamente

## Implementação do Mixin no Pydoll

### Estrutura da Classe

O FindElementsMixin usa **injeção de dependência** para funcionar com qualquer classe que forneça um `_connection_handler`:

```python
class FindElementsMixin:
    """
    Mixin que fornece capacidades de localização de elementos.
    
    Assume que a classe consumidora possui:
    - _connection_handler: Instância de ConnectionHandler para comandos CDP
    - _object_id: Optional[str] para buscas relativas ao contexto (apenas WebElement)
    """
    
    if TYPE_CHECKING:
        _connection_handler: ConnectionHandler  # Dica de tipo (type hint), não um atributo real
    
    async def find(self, ...):
        # Implementação usa self._connection_handler
        # Verifica self._object_id para determinar o contexto
```

**Insight principal:** O mixin não define `_connection_handler` ou `_object_id`. Ele **assume** que eles existem via duck typing.

### Como Tab e WebElement Usam o Mixin

```python
# Tab: buscas em nível de documento
class Tab(FindElementsMixin):
    def __init__(self, browser, target_id, connection_port):
        self._connection_handler = ConnectionHandler(connection_port)
        # Sem _object_id → busca a partir da raiz do documento

# WebElement: buscas relativas ao elemento
class WebElement(FindElementsMixin):
    def __init__(self, object_id, connection_handler, ...):
        self._object_id = object_id  # ID do objeto CDP
        self._connection_handler = connection_handler
        # Tem _object_id → busca relativa a este elemento
```

**Distinção crítica:**

- **Tab**: `hasattr(self, '_object_id')` → `False` → usa `RuntimeCommands.evaluate()` (contexto do documento)
- **WebElement**: `hasattr(self, '_object_id')` → `True` → usa `RuntimeCommands.call_function_on()` (contexto do elemento)

### Detecção de Contexto

O mixin detecta dinamicamente o contexto da busca:

```python
async def _find_element(self, by, value, raise_exc=True):
    if hasattr(self, '_object_id'):
        # Busca relativa: chama a função JavaScript NESTE elemento
        command = self._get_find_element_command(by, value, self._object_id)
    else:
        # Busca no documento: avalia o JavaScript no contexto global
        command = self._get_find_element_command(by, value)
    
    response = await self._execute_command(command)
    # ...
```

Esta implementação única lida com ambos:

- `tab.find(id='submit')` → busca no documento inteiro
- `form_element.find(id='submit')` → busca dentro do `form_element`

!!! warning "Acoplamento de Dependência do Mixin"
    O mixin é **fortemente acoplado** ao modelo de objeto do CDP. Ele assume que:
    
    - Elementos são representados por strings `objectId`
    - `Runtime.evaluate()` para buscas no documento
    - `Runtime.callFunctionOn()` para buscas relativas a elementos
    
    Isso é aceitável porque o Pydoll é **específico do CDP**. Um design mais genérico exigiria camadas de abstração.

## Design da API Pública

O mixin expõe dois métodos de alto nível com filosofias de design distintas:

### find(): Seleção Baseada em Atributos

```python
@overload
async def find(self, find_all: Literal[False], ...) -> WebElement: ...

@overload
async def find(self, find_all: Literal[True], ...) -> list[WebElement]: ...

async def find(
    self,
    id: Optional[str] = None,
    class_name: Optional[str] = None,
    name: Optional[str] = None,
    tag_name: Optional[str] = None,
    text: Optional[str] = None,
    timeout: int = 0,
    find_all: bool = False,
    raise_exc: bool = True,
    **attributes,
) -> Union[WebElement, list[WebElement], None]:
```

**Decisões de design:**

1. **Kwargs (argumentos nomeados) em vez de Enum By posicional**:
   ```python
   # Pydoll (intuitivo)
   await tab.find(id='submit', class_name='primary')
   
   # Selenium (verboso)
   driver.find_element(By.ID, 'submit')  # Não pode combinar atributos facilmente
   ```

2. **Resolução automática para o seletor ideal**:
   - Atributo único → usa `By.ID`, `By.CLASS_NAME`, etc. (mais rápido)
   - Múltiplos atributos → constrói XPath (flexível, mas mais lento)

3. **`**attributes` para extensibilidade**:
   ```python
   await tab.find(data_testid='submit-btn', aria_label='Submit form')
   # Constrói: //*[@data-testid='submit-btn' and @aria-label='Submit form']
   ```

### query(): Seleção Baseada em Expressão

```python
@overload
async def query(self, expression, find_all: Literal[False], ...) -> WebElement: ...

@overload
async def query(self, expression, find_all: Literal[True], ...) -> list[WebElement]: ...

async def query(
    self, 
    expression: str, 
    timeout: int = 0, 
    find_all: bool = False, 
    raise_exc: bool = True
) -> Union[WebElement, list[WebElement], None]:
```

**Decisões de design:**

1. **Detecção automática de CSS vs XPath**:
   ```python
   # Detecção de XPath (começa com /, ./ ou (/)
   await tab.query("//div[@id='content']")
   
   # Detecção de CSS (padrão)
   await tab.query("div#content > p.intro")
   ```

2. **Parâmetro de expressão única** (diferente do `find()`):
   - Assume que o usuário conhece a sintaxe do seletor
   - Sem sobrecarga de abstração

3. **Passagem direta (passthrough) para o navegador**:
   - `querySelector()` / `querySelectorAll()` para CSS
   - `document.evaluate()` para XPath

### Padrão de Sobrecarga (Overload) para Segurança de Tipos

Ambos os métodos usam `@overload` para fornecer **tipos de retorno precisos**:

```python
# A IDE sabe que o tipo de retorno é WebElement
element = await tab.find(id='submit')

# A IDE sabe que o tipo de retorno é list[WebElement]
elements = await tab.find(class_name='item', find_all=True)

# A IDE sabe que o tipo de retorno é Optional[WebElement]
maybe_element = await tab.find(id='optional', raise_exc=False)
```

Isso é crítico para o autocomplete da IDE e verificação de tipos. Veja [Análise Profunda do Sistema de Tipos](./typing-system.md) para detalhes.

## Arquitetura de Resolução de Seletor

O mixin converte a entrada do usuário em comandos CDP através de um pipeline de resolução:

| Estágio | Entrada | Saída | Decisão Chave |
|-------|-------|--------|-------------|
| **1. Seleção de Método** | `find()` kwargs ou `query()` expressão | Estratégia de seletor | Baseado em atributo vs. baseado em expressão |
| **2. Resolução da Estratégia** | Atributos ou expressão | Enum `By` + valor | Atributo único → método nativo, Múltiplos → XPath |
| **3. Detecção de Contexto** | `By` + valor + `hasattr(_object_id)` | Tipo de comando CDP | Documento vs. busca relativa ao elemento |
| **4. Geração do Comando** | Tipo de comando CDP + seletor | JavaScript + método CDP | `evaluate()` vs `callFunctionOn()` |
| **5. Execução** | Comando CDP | `objectId` ou array de `objectId`s | Via ConnectionHandler |
| **6. Criação do WebElement** | `objectId` + atributos | Instância(s) de `WebElement` | Função de fábrica (factory) para evitar importações circulares |

### Principais Decisões Arquiteturais

**1. Atributos Únicos vs. Múltiplos**

```python
# Atributo único → Seletor direto (rápido)
await tab.find(id='username')  # Usa By.ID → getElementById()

# Múltiplos atributos → XPath (flexível)
await tab.find(tag_name='input', type='password', name='pwd')
# → //input[@type='password' and @name='pwd']
```

**Por que isso importa:**

- Métodos nativos (`getElementById`, `getElementsByClassName`) são 10-50% mais rápidos que XPath
- A sobrecarga do XPath é aceitável ao combinar atributos (não há alternativa)

**2. Detecção Automática do Tipo de Seletor**

```python
await tab.query("//div")       # Começa com / → XPath
await tab.query("#login")      # Padrão → CSS
```

**Implementação:**
```python
if expression.startswith(('./', '/', '(/')):
    return By.XPATH
return By.CSS_SELECTOR
```

A heurística é **inequívoca** - seletores CSS não podem começar com `/`.

**3. Ajuste de Caminho Relativo do XPath**

Para buscas relativas a elementos, o XPath absoluto deve ser convertido:

```python
# Usuário fornece: //div
# Para WebElement: .//div (relativo ao elemento, não ao documento)

def _ensure_relative_xpath(xpath):
    return f'.{xpath}' if not xpath.startswith('.') else xpath
```

Sem isso, `element.find()` buscaria a partir da raiz do documento.

## Geração de Comando CDP

O mixin roteia para diferentes métodos CDP com base no contexto da busca:

| Contexto | Tipo de Seletor | Método CDP | Equivalente JavaScript |
|---------|--------------|------------|---------------------|
| Documento | CSS | `Runtime.evaluate` | `document.querySelector()` |
| Documento | XPath | `Runtime.evaluate` | `document.evaluate()` |
| Elemento | CSS | `Runtime.callFunctionOn` | `this.querySelector()` |
| Elemento | XPath | `Runtime.callFunctionOn` | `document.evaluate(..., this)` |

**Insight principal:** `Runtime.callFunctionOn` requer um `objectId` (o elemento no qual a função será chamada), enquanto `Runtime.evaluate` executa no escopo global.

### Modelos (Templates) JavaScript

O Pydoll usa modelos pré-definidos para consistência e performance:

```python
# Seletores CSS
Scripts.QUERY_SELECTOR = 'document.querySelector("{selector}")'
Scripts.RELATIVE_QUERY_SELECTOR = 'this.querySelector("{selector}")'

# Expressões XPath
Scripts.FIND_XPATH_ELEMENT = '''
    document.evaluate("{escaped_value}", document, null,
                      XPathResult.FIRST_ORDERED_NODE_TYPE, null).singleNodeValue
'''
```

Modelos evitam concatenação de strings em tempo de execução e centralizam o código JavaScript.

## Resolução de ObjectID e Criação de WebElement

O CDP representa nós DOM como **strings `objectId`**. O mixin abstrai isso:

**Fluxo de elemento único:**

1. Executar comando CDP → Extrair `objectId` da resposta
2. Chamar `DOM.describeNode(objectId)` → Obter atributos, nome da tag
3. Criar `WebElement(objectId, connection_handler, attributes)`

**Fluxo de múltiplos elementos:**

1. Executar comando CDP → Retorna **array como um único objeto remoto**
2. Chamar `Runtime.getProperties(array_objectId)` → Enumerar índices do array
3. Extrair `objectId` individual para cada elemento
4. Descrever e criar `WebElement` para cada

**Por que `Runtime.getProperties`?** O CDP não retorna arrays diretamente - ele retorna uma **referência a um objeto array**. Devemos enumerar suas propriedades para extrair os elementos individuais.

## Insights Arquiteturais e Tradeoffs de Design

### Por que Kwargs em vez de Enum By?

**A escolha do Pydoll:**
```python
await tab.find(id='submit', class_name='primary')
```

**A abordagem do Selenium:**
```python
driver.find_element(By.ID, 'submit')  # Não pode combinar atributos
```

**Justificativa:**

- **Descoberta (Discoverability)**: O autocomplete da IDE mostra todos os parâmetros disponíveis
- **Componibilidade**: Pode combinar múltiplos atributos em uma chamada
- **Legibilidade**: `id='submit'` é mais intuitivo do que `(By.ID, 'submit')`

**Tradeoff:** Kwargs são menos explícitos sobre a estratégia do seletor. Resolvido com documentação e logs.

### Por que Detectar Automaticamente CSS vs. XPath?

A heurística `_get_expression_type()` elimina o fardo do usuário:

```python
await tab.query("//div")       # Auto: XPath
await tab.query("#login")      # Auto: CSS
await tab.query("div > p")     # Auto: CSS
```

**Benefícios:**

- **Ergonomia**: Usuários não precisam especificar o tipo de seletor
- **Correção**: Impossível usar incorretamente (XPath com método CSS, vice-versa)

**Limitação:** Nenhuma maneira de forçar a interpretação de CSS para seletores ambíguos (caso extremo raro).

### Prevenção de Importação Circular: create_web_element()

O mixin usa uma **função de fábrica (factory function)** para evitar importações circulares:

```python
def create_web_element(*args, **kwargs):
    """Importa WebElement dinamicamente em tempo de execução."""
    from pydoll.elements.web_element import WebElement  # Importação tardia
    return WebElement(*args, **kwargs)
```

**Por que é necessário?**

- `FindElementsMixin` → precisa criar `WebElement`
- `WebElement` → herda de `FindElementsMixin`
- Dependência circular!

**Solução:** Importação tardia (late import) dentro da função de fábrica. A importação só é executada quando a função é chamada, quebrando o ciclo.

### hasattr() para Detecção de Contexto: Elegante ou Hacky?

O mixin usa `hasattr(self, '_object_id')` para detectar Tab vs WebElement:

```python
if hasattr(self, '_object_id'):
    # WebElement: busca relativa ao elemento
else:
    # Tab: busca em nível de documento
```

**Isso é "hacky" (gambiarra)?**

- **Não**: É **duck typing** (um idioma Pythônico)
- O Mixin não precisa saber a hierarquia de classes
- Tanto Tab quanto WebElement fornecem `_connection_handler`
- WebElement adicionalmente fornece `_object_id`

**Abordagens alternativas:**

1. **Verificação de tipo**: `if isinstance(self, WebElement)` → Acopla o mixin ao WebElement
2. **Método abstrato**: Exigiria que Tab/WebElement implementassem `get_search_context()` → Mais código boilerplate
3. **Injeção de dependência**: Passar o contexto como parâmetro → Quebra a ergonomia da API

**Veredito:** `hasattr()` é a melhor solução para este caso de uso.

## Principais Conclusões

1. **Mixins permitem o compartilhamento de código** sem acoplar `Tab` e `WebElement` através de herança
2. **Detecção de contexto via duck typing** (`hasattr`) mantém o mixin desacoplado da hierarquia de classes
3. **Resolução automática otimiza a performance** usando métodos nativos para atributos únicos
4. **Construção de XPath fornece componibilidade** para consultas com múltiplos atributos
5. **Espera baseada em polling (sondagem) é simples**, mas troca ciclos de CPU por simplicidade de implementação
6. **Complexidade do modelo de objeto CDP** é escondida atrás da abstração do WebElement
7. **Segurança de tipos via sobrecargas (overloads)** fornece tipos de retorno precisos para suporte da IDE

## Documentação Relacionada

Para um entendimento mais profundo dos componentes arquiteturais relacionados:

- **[Sistema de Tipos](./typing-system.md)**: Padrão Overload, TypedDict, tipos Genéricos
- **[Domínio do WebElement](./webelement-domain.md)**: Arquitetura do WebElement e métodos de interação
- **[Guia de Seletores](./selectors-guide.md)**: Sintaxe e boas práticas de CSS vs XPath
- **[Domínio da Tab](./tab-domain.md)**: Operações em nível de aba e gerenciamento de contexto

Para padrões de uso prático:

- **[Guia de Localização de Elementos](../features/automation/element-finding.md)**: Exemplos práticos e padrões
- **[Interações Humanizadas](../features/automation/human-interactions.md)**: Interação realista com elementos

================================================
FILE: docs/pt/deep-dive/architecture/index.md
================================================
# Arquitetura Interna

**Entenda o design, depois quebre as regras intencionalmente.**

A maioria da documentação mostra **o que** um framework faz. Esta seção revela **como** e **por que** o Pydoll é arquitetado da maneira que é: os padrões de design, as decisões arquiteturais e os tradeoffs (compromissos) que moldam cada linha de código.

## Por que a Arquitetura Importa

Você pode usar o Pydoll eficazmente sem entender sua arquitetura interna. Mas quando você precisar:

- **Depurar** problemas complexos que abrangem múltiplos componentes
- **Otimizar** gargalos de performance em automação de grande escala
- **Estender** o Pydoll com funcionalidade personalizada
- **Contribuir** com melhorias para a base de código
- **Construir** ferramentas similares para diferentes casos de uso

...o conhecimento arquitetural se torna **indispensável**.

!!! quote "Arquitetura como Linguagem"
    **"Arquitetura é música congelada."** - Johann Wolfgang von Goethe
    
    Uma boa arquitetura não é apenas sobre fazer o código funcionar, é sobre tornar o código **compreensível**, **manutenível** e **extensível**. Entender a arquitetura do Pydoll ensina padrões que você aplicará em todos os projetos.

## Os Seis Domínios Arquiteturais

A arquitetura do Pydoll é organizada em **seis domínios coesos**, cada um com responsabilidades e interfaces claras:

### 1. Domínio do Navegador (Browser)
**[→ Explore a Arquitetura do Navegador](./browser-domain.md)**

**O orquestrador: gerenciando processos, contextos e estado global.**

O domínio do Navegador (Browser) fica no topo da hierarquia, coordenando:

- **Gerenciamento de processos**: Iniciar/terminar executáveis do navegador
- **Contextos do navegador**: Ambientes isolados (como janelas anônimas)
- **Registro de abas**: Padrão Singleton para instâncias de Abas (Tab)
- **Autenticação de proxy**: Autenticação automática via domínio Fetch
- **Operações globais**: Downloads, permissões, gerenciamento de janelas

**Principais padrões arquiteturais**:

- **Classe base abstrata** para Chrome/Edge/outros navegadores Chromium
- **Padrão Gerenciador (Manager)** (ProcessManager, ProxyManager, TempDirManager)
- **Registro Singleton** para instâncias de Aba (previne duplicatas)
- **Protocolo de gerenciador de contexto** para limpeza automática

**Insight crítico**: O Navegador não manipula páginas diretamente, ele **coordena** componentes de nível inferior. Essa separação de responsabilidades permite suporte a múltiplos navegadores e operações concorrentes em abas.

---

### 2. Domínio da Aba (Tab)
**[→ Explore a Arquitetura da Aba](./tab-domain.md)**

**O cavalo de batalha: executando comandos, gerenciando estado, coordenando automação.**

O domínio da Aba (Tab) é a interface primária do Pydoll, lidando com:

- **Navegação**: Carregamento de página com estados de espera configuráveis
- **Localização de elementos**: Delegado ao FindElementsMixin
- **Execução de JavaScript**: Contextos tanto de página quanto de elemento
- **Coordenação de eventos**: Ouvintes (listeners) de eventos específicos da aba
- **Monitoramento de rede**: Captura e análise de requisição/resposta
- **Manipulação de IFrame**: Gerenciamento de contexto aninhado

**Principais padrões arquiteturais**:

- **Padrão Façade (Fachada)**: Interface simplificada para operações complexas do CDP
- **Composição de Mixin**: FindElementsMixin para localização de elementos
- **WebSocket por aba**: Conexões independentes para paralelismo
- **Flags de estado**: Rastreia domínios habilitados (network_events_enabled, etc.)
- **Inicialização preguiçosa (Lazy)**: Objeto Request criado no primeiro acesso

**Insight crítico**: Cada Aba (Tab) possui seu **próprio ConnectionHandler**, permitindo operações paralelas verdadeiras entre abas sem contenção ou vazamento de estado.

---

### 3. Domínio do WebElement
**[→ Explore a Arquitetura do WebElement](./webelement-domain.md)**

**O interator: fazendo a ponte entre código Python e elementos DOM.**

O domínio WebElement representa **elementos DOM individuais**, fornecendo:

- **Métodos de interação**: Clique, digitação, rolagem, seleção
- **Acesso a propriedades**: Texto, HTML, limites (bounds), atributos
- **Consultas de estado**: Visibilidade, status de habilitado, valor
- **Capturas de tela (Screenshots)**: Captura de imagem específica do elemento
- **Localização de filhos**: Localização de elementos relativos (também via FindElementsMixin)

**Principais padrões arquiteturais**:

- **Padrão Proxy**: Objeto Python representando um elemento remoto do navegador
- **Abstração de Object ID**: O objectId do CDP oculto atrás da API Python
- **Propriedades híbridas**: Síncronas (atributos) vs. assíncronas (estado dinâmico)
- **Padrão Command**: Métodos de interação encapsulam comandos CDP
- **Estratégias de fallback**: Múltiplas abordagens para robustez

**Insight crítico**: O WebElement mantém tanto **atributos em cache** (da criação) quanto **estado dinâmico** (buscado sob demanda), equilibrando performance com dados atualizados.

---

### 4. Mixin FindElements
**[→ Explore a Arquitetura do FindElements](./find-elements-mixin.md)**

**O localizador: traduzindo seletores em consultas DOM.**

O FindElementsMixin fornece capacidades de localização de elementos tanto para a Aba (Tab) quanto para o WebElement através de **composição**, não herança:

- **Localização baseada em atributos**: `find(id='submit', class_name='btn')`
- **Consulta baseada em expressão**: `query('div.container > p')`
- **Resolução de estratégia**: Seletor ideal para atributos únicos vs. múltiplos
- **Mecanismos de espera**: Polling (sondagem) com timeouts configuráveis
- **Detecção de contexto**: Buscas no documento vs. relativas ao elemento

**Principais padrões arquiteturais**:

- **Padrão Mixin**: Capacidade compartilhada sem hierarquia de herança
- **Padrão Strategy**: Diferentes estratégias de seletor baseadas na entrada
- **Padrão Template Method**: Fluxo comum, implementação específica da estratégia
- **Função de Fábrica (Factory)**: Importação tardia (late import) para evitar dependências circulares
- **Padrão Overload**: Tipos de retorno seguros (WebElement vs. lista)

**Insight crítico**: O mixin usa **duck typing** (`hasattr(self, '_object_id')`) para detectar Tab vs. WebElement, permitindo reuso de código sem acoplamento forte.

---

### 5. Arquitetura de Eventos
**[→ Explore a Arquitetura de Eventos](./event-architecture.md)**

**O despachante: roteando eventos do navegador para callbacks Python.**

A Arquitetura de Eventos permite automação reativa através de:

- **Registro de eventos**: Método `on()` para se inscrever (subscribe) em eventos CDP
- **Despacho de callbacks**: Execução assíncrona sem bloqueio
- **Gerenciamento de domínio**: Habilitação/desabilitação explícita para performance
- **Callbacks temporários**: Auto-remoção após a primeira invocação
- **Escopo multi-nível**: Eventos em todo o navegador vs. específicos da aba

**Principais padrões arquiteturais**:

- **Padrão Observer**: Inscrever/notificar para código orientado a eventos
- **Padrão Registry**: Mapeamento de nome do evento → lista de callbacks
- **Padrão Wrapper**: Encapsula callbacks síncronos para execução assíncrona
- **Protocolo de limpeza**: Remoção automática de callbacks no fechamento da aba
- **Isolamento de escopo**: Contextos de eventos independentes por aba

**Insight crítico**: Eventos são baseados em **push** (navegador notifica o Python), não em poll (sondagem), permitindo automação reativa de baixa latência sem espera ocupada (busy-waiting).

---

### 6. Arquitetura de Requisições do Navegador
**[→ Explore a Arquitetura de Requisições](./browser-requests-architecture.md)**

**O híbrido: requisições HTTP com o estado de sessão do navegador.**

O sistema de Requisições do Navegador (Browser Requests) faz a ponte entre HTTP e automação de navegador:

- **Continuidade de sessão**: Cookies e autenticação incluídos automaticamente
- **Fontes de dados duplas**: API Fetch do JavaScript + eventos de rede do CDP
- **Metadados completos**: Cabeçalhos, cookies, tempo (timing) (nem tudo disponível via JavaScript)
- **API semelhante à `requests`**: Interface familiar com o poder do navegador

**Principais padrões arquiteturais**:

- **Execução híbrida**: JavaScript para o corpo (body), CDP para metadados
- **Registro temporário de eventos**: Padrão Habilitar/capturar/desabilitar
- **Inicialização preguiçosa (lazy) de propriedade**: Objeto Request criado no primeiro uso
- **Padrão Adapter**: Interface compatível com `requests` para o fetch do navegador

**Insight crítico**: As requisições do navegador combinam **duas fontes de informação** (JavaScript e eventos CDP). O JavaScript fornece o corpo da resposta, o CDP fornece cabeçalhos e cookies que as políticas de segurança do JavaScript ocultam.

---

## Princípios Arquiteturais

Esses seis domínios seguem princípios consistentes:

### 1. Separação de Responsabilidades (Separation of Concerns)
Cada domínio tem uma **responsabilidade única e bem definida**:

- Navegador → Gerenciamento de processo/contexto
- Aba → Execução de comando e estado
- WebElement → Interação com elemento
- FindElements → Localização de elemento
- Eventos → Despacho reativo
- Requisições → HTTP no contexto do navegador

**Benefício**: Mudanças em um domínio raramente exigem mudanças em outros.

### 2. Composição Sobre Herança
Em vez de hierarquias de herança profundas, o Pydoll usa:

- **Mixins** (FindElementsMixin compartilhado por Tab e WebElement)
- **Gerenciadores (Managers)** (ProcessManager, ProxyManager, TempDirManager)
- **Injeção de dependência** (ConnectionHandler passado para os componentes)

**Benefício**: Reutilização flexível de componentes sem acoplamento forte.

### 3. Assíncrono por Padrão (Async by Default)
Todas as operações de E/S (I/O) são `async def` e devem ser aguardadas com `await`:

- Comunicação WebSocket
- Execução de comando CDP
- Despacho de callback de evento
- Requisições de rede

**Benefício**: Permite concorrência verdadeira com múltiplas abas, operações paralelas e E/S não bloqueante.

### 4. Segurança de Tipos (Type Safety)
Toda API pública tem anotações de tipo (type annotations):

- Parâmetros de função e tipos de retorno
- Respostas CDP como `TypedDict`
- Tipos de eventos para parâmetros de callback
- Sobrecargas (Overloads) para métodos polimórficos

**Benefício**: Autocomplete da IDE, verificação estática de tipos, código autodocumentado.

### 5. Gerenciamento de Recursos
Gerenciadores de contexto garantem a limpeza:

- `async with Browser()` → fecha o navegador ao sair
- `async with tab.expect_file_chooser()` → desabilita o interceptador
- `async with tab.expect_download()` → limpa arquivos temporários

**Benefício**: Limpeza automática de recursos, previne vazamentos mesmo em exceções.

## Interação de Componentes

Entender como os domínios interagem é fundamental:

```mermaid
graph TB
    User[Seu Código Python]
    
    User --> Browser[Domínio do Navegador]
    User --> Tab[Domínio da Aba]
    User --> Element[Domínio do WebElement]
    
    Browser --> ProcessMgr[Gerenciador de Processo]
    Browser --> ContextMgr[Gerenciador de Contexto]
    Browser --> TabRegistry[Registro de Abas]
    
    Tab --> ConnHandler[Manipulador de Conexão]
    Tab --> FindMixin[Mixin FindElements]
    Tab --> EventSystem[Sistema de Eventos]
    Tab --> RequestSystem[Sistema de Requisições]
    
    Element --> ConnHandler2[Manipulador de Conexão]
    Element --> FindMixin2[Mixin FindElements]
    
    ConnHandler --> WebSocket[WebSocket para CDP]
    ConnHandler2 --> WebSocket
    EventSystem --> ConnHandler
    RequestSystem --> ConnHandler
    RequestSystem --> EventSystem
    
    WebSocket --> Chrome[Navegador Chrome]
```

**Principais interações**:

1. **Navegador cria Abas** → Abas armazenadas no registro
2. **Aba e WebElement usam FindElementsMixin** → Localização de elementos compartilhada
3. **Cada Aba possui um ConnectionHandler** → Conexões WebSocket independentes
4. **Sistema de requisições usa Sistema de eventos** → Eventos de rede capturam metadados
5. **Todos os componentes usam ConnectionHandler** → Comunicação CDP centralizada

## Pré-requisitos

Para se beneficiar totalmente desta seção:

- **[Fundamentos Essenciais](../fundamentals/cdp.md)** - Entender CDP, assincronismo e tipos
- **Padrões de design Python** - Familiaridade com padrões comuns
- **Conceitos de OOP** - Classes, herança, composição, interfaces
- **Python Assíncrono** - Confortável com `async def` e `await`  

**Se você não leu os Fundamentos**, comece por lá primeiro. A arquitetura se baseia nesses conceitos.

## Além da Arquitetura

Depois de dominar a arquitetura interna, você estará pronto para:

- **Contribuir com código**: Entender onde novos recursos se encaixam
- **Otimização de performance**: Identificar gargalos e ineficiências
- **Extensões personalizadas**: Construir sobre os padrões do Pydoll
- **Ferramentas similares**: Aplicar esses padrões a outros projetos

## Filosofia de Design

Uma boa arquitetura é **invisível**, ela não deve atrapalhar seu caminho. A arquitetura do Pydoll prioriza:

1. **Simplicidade**: Cada componente faz uma coisa bem feita
2. **Consistência**: Operações similares têm padrões similares
3. **Explicitude**: Sem mágica, sem comportamento oculto
4. **Segurança de tipos**: Capturar erros em tempo de design, não em tempo de execução
5. **Performance**: Assíncrono por padrão, paralelismo sem bloqueios (locks)

Estas não são escolhas arbitrárias, são **princípios testados em batalha** de décadas de engenharia de software.

---

## Pronto para Entender o Design?

Comece com o **[Domínio do Navegador](./browser-domain.md)** para entender como o gerenciamento de processos e o isolamento de contexto funcionam, depois progrida através dos domínios em ordem.

**É aqui que o uso se torna maestria.**

---

!!! success "Após Completar a Arquitetura"
    Depois de entender esses padrões, você os verá em toda parte na engenharia de software, não apenas no Pydoll. Estes são **padrões universais** aplicados à automação de navegadores:
    
    - Façade (Aba simplifica a complexidade do CDP)
    - Observer (Sistema de eventos para código reativo)
    - Mixin (FindElementsMixin para reuso de código)
    - Registry (Navegador rastreia instâncias de Aba)
    - Strategy (FindElements resolve seletores ideais)
    
    Boa arquitetura é **conhecimento atemporal**.

================================================
FILE: docs/pt/deep-dive/architecture/shadow-dom.md
================================================
# Arquitetura do Shadow DOM

O Shadow DOM é um dos aspectos mais desafiadores da automação web moderna. Elementos dentro de shadow trees são invisíveis para consultas DOM regulares, o que quebra abordagens tradicionais de automação. Este documento explica como o Shadow DOM funciona no nível do navegador, por que ferramentas convencionais falham com shadow roots fechados, e como o Pydoll contorna essas restrições através de acesso direto via CDP.

!!! info "Guia de Uso Prático"
    Para exemplos de uso e padrões de início rápido, consulte o [Guia de Pesquisa de Elementos — seção Shadow DOM](../../features/element-finding.md#suporte-a-shadow-dom).

## O que é Shadow DOM?

Shadow DOM é um padrão web que permite **encapsulamento DOM**. Ele permite que um componente tenha sua própria árvore DOM isolada (a "shadow tree") anexada a um elemento DOM regular (o "shadow host"). Elementos dentro de uma shadow tree ficam ocultos das consultas do documento principal.

```mermaid
graph TB
    subgraph "DOM Principal (Light DOM)"
        Document["document"]
        Host["div#my-component\n(shadow host)"]
        Other["p.normal-content"]
    end

    subgraph "Shadow Tree (Encapsulada)"
        SR["#shadow-root (open)"]
        Style["style"]
        Button["button.internal"]
        Input["input.private"]
    end

    Document --> Host
    Document --> Other
    Host -.->|"attachShadow()"| SR
    SR --> Style
    SR --> Button
    SR --> Input
```

### Modos do Shadow Root

Quando um componente cria um shadow root via `attachShadow()`, ele especifica um **modo**:

| Modo | Acesso JavaScript | Acesso CDP | Uso Comum |
|------|-------------------|------------|-----------|
| `open` | `element.shadowRoot` retorna o root | Acesso total via `backendNodeId` | Web components customizados (Lit, Stencil) |
| `closed` | `element.shadowRoot` retorna `null` | Acesso total via `backendNodeId` | Componentes sensíveis, formulários de pagamento |
| `user-agent` | Não acessível via JS | Acesso limitado | UI interna do navegador (placeholders, controles de vídeo) |

Essa distinção é crítica: **o acesso no nível JavaScript é restrito pelo modo, mas o acesso no nível CDP não é.**

### Por que a Automação Tradicional Falha

Ferramentas de automação tradicionais dependem da execução de JavaScript no contexto da página:

```javascript
// Abordagem WebDriver / Selenium
document.querySelector('#my-component')        // ✓ Encontra o host
document.querySelector('#my-component button') // ✗ Nao cruza a fronteira do shadow
element.shadowRoot                             // ✗ Retorna null para roots fechados
```

A fronteira do shadow é imposta pelo motor JavaScript do navegador. Qualquer ferramenta de automação que executa JavaScript para encontrar elementos vai encontrar essa barreira. Isso inclui Selenium, `page.evaluate()` do Playwright, e qualquer ferramenta usando `Runtime.evaluate()` com `document.querySelector()` no nível do documento.

## Como o Pydoll Contorna as Fronteiras do Shadow

A abordagem do Pydoll funciona em uma camada **abaixo do JavaScript**: o Chrome DevTools Protocol. O CDP tem acesso direto à representação interna do DOM do navegador, que ignora restrições de modo do shadow completamente.

### A Vantagem do CDP

```mermaid
sequenceDiagram
    participant User as Codigo do Usuario
    participant SR as ShadowRoot
    participant CH as ConnectionHandler
    participant CDP as Chrome CDP
    participant DOM as DOM do Navegador

    User->>SR: shadow_root.query('.btn')
    SR->>SR: _get_find_element_command(object_id)
    SR->>CH: execute_command(Runtime.callFunctionOn)
    CH->>CDP: WebSocket send
    CDP->>DOM: Executa querySelector no objeto shadow root
    DOM-->>CDP: Resultado do elemento
    CDP-->>CH: Resposta com objectId
    CH-->>SR: Dados do elemento
    SR-->>User: Instancia WebElement
```

O insight chave esta em **como o objeto shadow root e obtido** e **como as consultas sao executadas contra ele**:

1. **Descoberta**: `DOM.describeNode` com `pierce=true` retorna nos de shadow root com seu `backendNodeId`, independente do modo
2. **Resolucao**: `DOM.resolveNode` converte um `backendNodeId` em um `objectId` JavaScript que referencia o shadow root diretamente
3. **Consulta**: `Runtime.callFunctionOn` executa `this.querySelector()` no `objectId` do shadow root; isso funciona porque a chamada e feita **no proprio objeto shadow root**, nao a partir do contexto do documento

### Passo a Passo: Acesso ao Shadow Root

```mermaid
flowchart TD
    A["WebElement\n(shadow host)"]
    B["shadowRoots[] com\nbackendNodeId"]
    C["objectId JavaScript\npara o shadow root"]
    D["Instancia ShadowRoot"]
    E["WebElement\n(dentro do shadow)"]

    A -->|"DOM.describeNode\ndepth=1, pierce=true"| B
    B -->|"DOM.resolveNode\nbackendNodeId"| C
    C -->|"Criar ShadowRoot\ncom objectId"| D
    D -->|"query()\nvia callFunctionOn"| E
```

#### Passo 1: Descrever o No Host

```python
# Pydoll envia este comando CDP:
{
    "method": "DOM.describeNode",
    "params": {
        "objectId": "<host-element-object-id>",
        "depth": 1,
        "pierce": true  # ← Esta e a flag chave
    }
}
```

O parametro `pierce` diz ao CDP para atravessar fronteiras do shadow ao descrever o no. A resposta inclui informacoes do shadow root independente do modo do shadow root:

```json
{
    "result": {
        "node": {
            "nodeName": "DIV",
            "shadowRoots": [
                {
                    "nodeId": 0,
                    "backendNodeId": 5,
                    "shadowRootType": "closed",
                    "childNodeCount": 4
                }
            ]
        }
    }
}
```

!!! warning "nodeId vs backendNodeId"
    Quando o domínio DOM não está explicitamente habilitado (que é o padrão do Pydoll para minimizar overhead), `nodeId` é sempre `0`. O `backendNodeId` é o identificador estável e sempre disponível. O Pydoll usa `backendNodeId` exclusivamente para resolução de shadow root, e por isso funciona sem necessitar de `DOM.enable()`.

#### Passo 2: Resolver para Objeto JavaScript

```python
# Converter backendNodeId em um objectId utilizavel:
{
    "method": "DOM.resolveNode",
    "params": {
        "backendNodeId": 5
    }
}
```

A resposta fornece um `objectId`, um handle para o shadow root no espaco de objetos do JavaScript:

```json
{
    "result": {
        "object": {
            "objectId": "-2296764575741119861.1.3"
        }
    }
}
```

#### Passo 3: Consultar Dentro do Shadow Root

Com o `objectId` do shadow root, o Pydoll aproveita o mecanismo de busca relativa existente do `FindElementsMixin`:

```python
# Quando ShadowRoot.query('.btn') e chamado:
{
    "method": "Runtime.callFunctionOn",
    "params": {
        "functionDeclaration": "function() { return this.querySelector(\".btn\"); }",
        "objectId": "-2296764575741119861.1.3"
    }
}
```

A funcao executa com `this` vinculado ao objeto shadow root. Como shadow roots implementam as interfaces `querySelector()` e `querySelectorAll()` nativamente, seletores CSS funcionam naturalmente dentro da fronteira do shadow.

## Arquitetura do ShadowRoot

### Decisao de Design: Reutilizar FindElementsMixin

A decisao arquitetural mais critica foi fazer `ShadowRoot` herdar de `FindElementsMixin`:

```python
class ShadowRoot(FindElementsMixin):
    def __init__(self, object_id, connection_handler, mode, host_element):
        self._object_id = object_id               # Referencia CDP do shadow root
        self._connection_handler = connection_handler  # Para comunicacao CDP
        self._mode = mode                          # Enum ShadowRootType
        self._host_element = host_element          # Referencia de volta ao host
```

**Por que isso funciona**: `FindElementsMixin._find_element()` verifica `hasattr(self, '_object_id')`. Quando presente, usa `RELATIVE_QUERY_SELECTOR`, que chama `this.querySelector()` no objeto referenciado. Como shadow roots suportam `querySelector()` nativamente, `query()` com seletores CSS funciona automaticamente. A flag `_css_only = True` no `ShadowRoot` bloqueia `find()` e `query()` com XPath, lancando `NotImplementedError`.

```python
# Esta unica linha no FindElementsMixin habilita buscas em shadow root:
elif hasattr(self, '_object_id'):
    command = self._get_find_element_command(by, value, self._object_id)
```

Isso significa que `ShadowRoot` herda `query()` e `find_or_wait_element()` do mixin. Porem, a flag `_css_only = True` restringe o uso a apenas `query()` com seletores CSS; `find()` e XPath lancam `NotImplementedError`.

!!! tip "Consistencia Arquitetural"
    Este é o mesmo mecanismo que faz `WebElement.find()` buscar dentro dos filhos de um elemento: o atributo `_object_id` sinaliza "busque relativo a mim" em vez de "busque no documento inteiro." `ShadowRoot`, `WebElement` e `Tab` compartilham o mesmo mecanismo de busca de elementos através do `FindElementsMixin`; a única diferença é que `ShadowRoot` aceita apenas `query()` com seletores CSS (`_css_only = True`).

### Relacionamento entre Classes

| Classe | Tem `_object_id` | Tem `_connection_handler` | Escopo de Busca |
|--------|:-:|:-:|---|
| `Tab` | Nao | Sim | Documento inteiro |
| `WebElement` | Sim | Sim | Dentro da subarvore do elemento |
| `ShadowRoot` | Sim | Sim | Dentro da shadow tree |

Todos os tres herdam de `FindElementsMixin`. A presenca ou ausencia de `_object_id` determina se as buscas sao globais no documento ou com escopo para um no especifico.

### Resolvendo Shadow Roots: Estrategia backendNodeId

O Pydoll deliberadamente usa `backendNodeId` em vez de `nodeId` para resolucao de shadow root:

| Propriedade | `nodeId` | `backendNodeId` |
|-------------|----------|-----------------|
| Requer `DOM.enable()` | Sim | Nao |
| Estavel entre chamadas describe | Nao (0 quando DOM nao habilitado) | Sim |
| Funciona para resolucao de shadow root | Apenas com DOM habilitado | Sempre |
| Overhead de performance | Maior (rastreamento do dominio DOM) | Nenhum |

Ao confiar no `backendNodeId`, o Pydoll evita o overhead de habilitar o dominio DOM enquanto mantem acesso confiavel ao shadow root. Esta e uma escolha pragmatica: a maioria dos cenarios de automacao nao precisa do stream de eventos do dominio DOM, e habilita-lo adiciona overhead de memoria e processamento para rastrear cada mutacao do DOM.

## Shadow Roots Fechados: Por que o Acesso CDP Funciona

Esta é a pergunta mais frequente: **se `element.shadowRoot` retorna `null` para shadow roots fechados em JavaScript, como o CDP pode acessá-los?**

A resposta esta em entender a arquitetura do navegador:

```mermaid
graph TB
    subgraph "Runtime JavaScript"
        JS["Codigo JavaScript"]
        API["Web APIs\n(propriedade shadowRoot)"]
    end

    subgraph "Internos do Navegador"
        CDP_Layer["Camada CDP"]
        DOM_Internal["Arvore DOM Interna"]
    end

    JS -->|"element.shadowRoot"| API
    API -->|"mode == 'closed'\n→ retorna null"| JS
    CDP_Layer -->|"DOM.describeNode\npierce=true"| DOM_Internal
    DOM_Internal -->|"Sempre retorna\nshadow tree completa"| CDP_Layer
```

**Acesso JavaScript** passa pela camada de Web API, que impõe a restrição de modo do shadow. Quando `mode='closed'`, a API retorna `null`; esta é uma fronteira de controle de acesso intencional para código de páginas web.

**Acesso CDP** opera abaixo da camada de Web API. Ele se comunica diretamente com a representação interna do DOM do navegador. A restrição do modo `closed` é uma **política no nível JavaScript**, não uma **restrição no nível DOM**. A shadow tree ainda existe no DOM; ela apenas está oculta da visão do JavaScript.

!!! info "Implicacoes de Seguranca"
    Isso e por design no DevTools Protocol. O CDP e destinado a ferramentas de depuracao e automacao que precisam de acesso total ao DOM. O modo `closed` protege conteudos do shadow de outros scripts na mesma pagina (ex: scripts de terceiros), nao da interface de depuracao do navegador. Esta e a mesma razao pela qual o DevTools do navegador consegue inspecionar shadow roots fechados no painel Elements.

### Verificacao Pratica

Voce pode verificar esse comportamento:

```python
import asyncio
from pydoll.browser.chromium import Chrome
from pydoll.protocol.dom.types import ShadowRootType

async def verify_closed_access():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('about:blank')

        # Criar um shadow root fechado via JavaScript
        await tab.execute_script("""
            const host = document.createElement('div');
            host.id = 'test-host';
            document.body.appendChild(host);
            const shadow = host.attachShadow({ mode: 'closed' });
            shadow.innerHTML = '<p class="secret">Conteudo oculto</p>';
        """)

        # JavaScript nao consegue acessar:
        result = await tab.execute_script(
            "return document.getElementById('test-host').shadowRoot",
            return_by_value=True,
        )
        js_value = result['result']['result'].get('value')
        print(f"JS shadowRoot: {js_value}")  # None

        # Mas o Pydoll consegue:
        host = await tab.find(id='test-host')
        shadow = await host.get_shadow_root()
        print(f"Modo do shadow: {shadow.mode}")  # ShadowRootType.CLOSED

        secret = await shadow.query('.secret')
        text = await secret.text
        print(f"Conteudo: {text}")  # "Conteudo oculto"

asyncio.run(verify_closed_access())
```

## Shadow Roots Aninhados

Web components frequentemente compoem outros web components, criando shadow trees em multiplos niveis:

```mermaid
graph TB
    subgraph "Light DOM"
        Host1["outer-component\n(shadow host)"]
    end

    subgraph "Shadow Tree Externa"
        SR1["#shadow-root (open)"]
        Host2["inner-component\n(shadow host)"]
        P1["p.outer-text"]
    end

    subgraph "Shadow Tree Interna"
        SR2["#shadow-root (closed)"]
        Button["button.deep-btn"]
        P2["p.inner-text"]
    end

    Host1 -.-> SR1
    SR1 --> P1
    SR1 --> Host2
    Host2 -.-> SR2
    SR2 --> P2
    SR2 --> Button
```

O Pydoll lida com isso naturalmente encadeando chamadas `get_shadow_root()`. Cada `ShadowRoot` produz instancias `WebElement` que podem ter seus proprios shadow roots:

```python
outer_host = await tab.find(tag_name='outer-component')
outer_shadow = await outer_host.get_shadow_root()        # open

inner_host = await outer_shadow.query('inner-component')
inner_shadow = await inner_host.get_shadow_root()        # closed, ainda funciona

deep_button = await inner_shadow.query('.deep-btn')
await deep_button.click()
```

Cada nível segue o mesmo fluxo de resolução CDP: `describeNode` → `resolveNode` → `ShadowRoot` com `_object_id` → `querySelector` via `callFunctionOn`.

## Shadow Roots Dentro de IFrames

Um cenario comum no mundo real envolve shadow roots dentro de iframes cross-origin — por exemplo, captchas Cloudflare Turnstile. Isso combina dois mecanismos de isolamento: a fronteira do iframe e a fronteira do shadow.

```mermaid
graph TB
    subgraph "Pagina Principal"
        Host["div.widget\n(shadow host)"]
    end

    subgraph "Shadow Tree"
        SR1["#shadow-root"]
        IFrame["iframe\n(cross-origin)"]
    end

    subgraph "IFrame (OOPIF)"
        Body["body"]
    end

    subgraph "Shadow Tree do IFrame"
        SR2["#shadow-root"]
        Button["label.checkbox"]
    end

    Host -.-> SR1
    SR1 --> IFrame
    IFrame -.->|"processo separado"| Body
    Body -.-> SR2
    SR2 --> Button
```

O Pydoll lida com isso de forma transparente atraves da **propagacao de contexto do iframe**. Quando um `ShadowRoot` e criado, ele herda o contexto de roteamento do iframe do seu elemento host:

```python
# A cadeia completa: pagina principal → shadow root → iframe → shadow root → elemento
shadow_host = await tab.find(id='widget-container')
first_shadow = await shadow_host.get_shadow_root()

iframe = await first_shadow.query('iframe')
body = await iframe.find(tag_name='body')
second_shadow = await body.get_shadow_root()

# click() funciona corretamente — eventos de mouse roteados pela sessao OOPIF
button = await second_shadow.query('label.checkbox')
await button.click()
```

### Como a Propagacao de Contexto Funciona

IFrames cross-origin rodam em um processo separado do navegador (Out-of-Process IFrame, ou OOPIF). Comandos CDP para esses iframes devem ser roteados atraves de um `sessionId` dedicado. O Pydoll propaga esse contexto de roteamento automaticamente por toda a cadeia:

1. **IFrame resolve seu contexto**: `iframe.find()` estabelece um `IFrameContext` com `session_id` e `session_handler` para o OOPIF
2. **Elementos filhos herdam o contexto**: Elementos encontrados dentro do iframe recebem o `IFrameContext`
3. **Shadow roots herdam do host**: `ShadowRoot` copia o `_iframe_context` do seu elemento host
4. **Elementos no shadow herdam do shadow root**: Elementos encontrados via `shadow.query()` recebem o contexto propagado
5. **Comandos roteiam corretamente**: `_execute_command()` detecta o contexto herdado e roteia comandos CDP (incluindo `Input.dispatchMouseEvent` para `click()`) pela sessao OOPIF

Isso significa que coordenadas de `DOM.getBoxModel` (que sao relativas ao viewport do iframe) sao corretamente pareadas com eventos de mouse despachados para a mesma sessao OOPIF.

## Buscando Shadow Roots: find_shadow_roots()

`Tab.find_shadow_roots()` percorre toda a arvore DOM para coletar todos os shadow roots encontrados na pagina.

### Como Funciona

```
Tab.find_shadow_roots()
  ├─ DOM.getDocument(depth=-1, pierce=True)
  │   └─ Retorna arvore DOM completa com arrays shadowRoots
  ├─ Percurso recursivo da arvore: _collect_shadow_roots_from_tree()
  │   ├─ Coleta entradas shadowRoots com backendNodeId do host
  │   ├─ Percorre filhos recursivamente
  │   └─ Percorre contentDocument (iframes same-origin)
  ├─ Para cada entrada de shadow root:
  │   ├─ DOM.resolveNode(backendNodeId) → objectId
  │   └─ Resolver elemento host (melhor esforco)
  └─ Retorna list[ShadowRoot] com referencias de host
```

### Timeout: Esperando Shadow Roots

Shadow hosts sao frequentemente injetados de forma assincrona. `Tab.find_shadow_roots()` aceita um parametro `timeout` que faz polling a cada 0.5s ate que pelo menos um shadow root seja encontrado ou o timeout expire (lanca `WaitElementTimeout`). Da mesma forma, `WebElement.get_shadow_root()` tambem suporta `timeout` para esperar pelo shadow root de um elemento especifico:

```python
# Esperar ate 10 segundos pelos shadow roots
shadow_roots = await tab.find_shadow_roots(timeout=10)

# Esperar pelo shadow root de um elemento especifico
shadow = await element.get_shadow_root(timeout=5)
```

### Detalhes Importantes

- **`pierce=True`** em `DOM.getDocument` faz o navegador incluir arrays `shadowRoots` nas descricoes de nos, permitindo a descoberta de todos os shadow roots sem navegar individualmente ate cada host.
- **Conteudo de iframes same-origin** e incluido na arvore via nos `contentDocument`. A travessia os manipula.
- Cada `ShadowRoot` retornado tem uma referencia ao seu `host_element` (resolvido por melhor esforco via `DOM.resolveNode`).

### Travessia Profunda: IFrames Cross-Origin (OOPIFs)

Por padrao, iframes cross-origin (OOPIFs) **nao** sao incluidos na arvore DOM — seu conteudo vive em um processo separado do navegador. Passe `deep=True` para tambem descobrir shadow roots dentro de OOPIFs:

```python
shadow_roots = await tab.find_shadow_roots(deep=True, timeout=10)
```

Quando `deep=True` e definido, o metodo executa etapas adicionais:

```
Tab.find_shadow_roots(deep=True)
  ├─ ... (travessia do documento principal como acima) ...
  └─ _collect_oopif_shadow_roots()
      ├─ ConnectionHandler de nivel browser (sem page_id → endpoint do browser)
      ├─ Target.getTargets() → filtrar type='iframe'
      └─ Para cada target iframe:
          ├─ Target.attachToTarget(targetId, flatten=True) → sessionId
          ├─ DOM.getDocument(depth=-1, pierce=True) com sessionId
          ├─ _collect_shadow_roots_from_tree() no DOM do OOPIF
          └─ Para cada shadow root encontrado:
              ├─ DOM.resolveNode(backendNodeId) com sessionId
              ├─ Resolver elemento host (melhor esforco) com sessionId
              ├─ Criar IFrameContext(frame_id, session_handler, session_id)
              └─ Definir IFrameContext no elemento host (ou diretamente no ShadowRoot)
```

Os objetos `ShadowRoot` retornados carregam o contexto de roteamento OOPIF (`IFrameContext`), entao elementos encontrados via `shadow_root.query()` roteiam automaticamente comandos CDP pela sessao OOPIF correta. Isso e critico para cenarios como captchas Cloudflare Turnstile, onde o checkbox esta dentro de um shadow root fechado dentro de um iframe cross-origin.

## Limitacoes e Casos Especiais

### Estrategias de Seletores Dentro de Shadow Roots

!!! warning "Use Apenas query() com CSS Dentro de Shadow Roots"
    `ShadowRoot` define `_css_only = True`, o que significa que apenas `query()` com seletores CSS e suportado. `find()` e `query()` com XPath lancam `NotImplementedError`.

Shadow roots implementam nativamente `querySelector()` e `querySelectorAll()`, tornando seletores CSS a escolha natural e confiavel:

| Metodo | Dentro do Shadow Root | Notas |
|--------|:--:|---|
| `query('seletor-css')` | Totalmente suportado | Abordagem recomendada |
| `query('seletor-css', find_all=True)` | Totalmente suportado | Retorna lista de elementos |
| `find()` | Nao suportado | Lanca `NotImplementedError` |
| `query('//xpath')` | Nao suportado | Lanca `NotImplementedError` |

```python
shadow = await host.get_shadow_root()

# ✓ Recomendado: query() com seletores CSS
button = await shadow.query('button.submit')
email = await shadow.query('#email-input')
items = await shadow.query('.item', find_all=True)

# ✗ Nao suportado: find() e XPath lancam NotImplementedError
# shadow.find(id='email-input')        # NotImplementedError
# shadow.query('//button')             # NotImplementedError
```

### XPath Nao Cruza Fronteiras do Shadow

Expressões XPath a partir da raiz do documento não conseguem atravessar fronteiras do shadow. Esta é uma limitação fundamental do XPath, que foi projetado antes do Shadow DOM existir:

```python
# Nao encontra conteudo shadow: XPath no nivel do documento nao cruza a fronteira
element = await tab.find(xpath='//div[@id="host"]//button')
```

### Shadow Roots User-Agent

Shadow roots internos do navegador (ex: estilizacao de placeholder de `<input>`, controles de `<video>`) sao do tipo `user-agent`. Eles sao acessiveis via CDP, mas sua estrutura interna varia entre versoes do navegador e nao faz parte de nenhum padrao web.

```python
input_element = await tab.find(tag_name='input')
try:
    ua_shadow = await input_element.get_shadow_root()
    # ua_shadow.mode == ShadowRootType.USER_AGENT
    # Estrutura interna e especifica do navegador
except ShadowRootNotFound:
    pass  # Nem todos os inputs tem shadow roots user-agent
```

!!! warning "Estabilidade de Shadow Roots User-Agent"
    Nao construa logica de automacao que dependa da estrutura interna de shadow roots user-agent. Sua estrutura DOM e um detalhe de implementacao que pode mudar entre versoes do navegador sem aviso.

### Referencias de Shadow Root Obsoletas

Se o elemento host for removido do DOM e readicionado (comum em aplicações single-page), o `objectId` do shadow root se torna obsoleto. A solução é readquirir o shadow root:

```python
# Apos uma navegacao de pagina ou reconstrucao do DOM:
host = await tab.find(id='my-component', timeout=5)  # Re-encontrar o host
shadow = await host.get_shadow_root()                 # Shadow root atualizado
```

## Pontos-Chave

- **Encapsulamento Shadow DOM** oculta elementos do `querySelector()` no nivel do documento, quebrando automacao tradicional
- **CDP opera abaixo da camada de API JavaScript**, contornando restricoes de modo do shadow completamente
- **`backendNodeId`** e o identificador estavel usado para resolucao de shadow root, evitando a necessidade de habilitar o dominio DOM
- **`ShadowRoot` herda `FindElementsMixin`** com `_css_only = True`, suportando apenas `query()` com seletores CSS; `find()` e XPath lancam `NotImplementedError`
- **Shadow roots fechados** sao totalmente acessiveis porque o modo `closed` e uma politica no nivel JavaScript, nao uma restricao no nivel DOM
- **Shadow roots aninhados** funcionam naturalmente encadeando chamadas `get_shadow_root()` em cada nivel
- **Shadow roots dentro de iframes** funcionam de forma transparente atraves da propagacao automatica de contexto do iframe
- **Use seletores CSS** (`query()`) dentro de shadow roots; `find()` e XPath nao sao suportados
- **`find_shadow_roots()`** descobre todos os shadow roots na pagina; suporta `timeout` para polling e `deep=True` para iframes cross-origin (OOPIFs)
- **`get_shadow_root(timeout)`** espera pelo shadow root de um elemento especifico

## Documentacao Relacionada

- **[Guia de Pesquisa de Elementos](../../features/element-finding.md)**: Uso pratico de `find()`, `query()`, e acesso a shadow root
- **[IFrames e Contextos](../fundamentals/iframes-and-contexts.md)**: Como o Pydoll resolve e roteia comandos para iframes, incluindo tratamento de OOPIF
- **[Arquitetura do FindElements Mixin](./find-elements-mixin.md)**: Como o mecanismo `_object_id` habilita buscas com escopo
- **[Dominio WebElement](./webelement-domain.md)**: Como elementos interagem com CDP
- **[Camada de Conexao](../fundamentals/connection-layer.md)**: Comunicacao WebSocket com o navegador


================================================
FILE: docs/pt/deep-dive/architecture/tab-domain.md
================================================
# Arquitetura do Domínio da Aba (Tab)

O domínio da Aba (Tab) é a interface principal do Pydoll para automação de navegador, atuando como uma camada de orquestração que integra múltiplos domínios CDP em uma API coesa. Este documento explora sua arquitetura interna, padrões de design e as decisões de engenharia que moldam seu comportamento.

!!! info "Uso Prático"
    Para exemplos de uso e padrões práticos, consulte o [Guia de Gerenciamento de Abas](../features/automation/tabs.md).

## Visão Geral da Arquitetura

A classe `Tab` serve como uma **façade (fachada)** sobre o Chrome DevTools Protocol, abstraindo a complexidade da coordenação de múltiplos domínios em uma interface unificada.

### Estrutura de Componentes

| Componente | Relacionamento | Propósito |
|-----------|-------------|---------|
| **Tab** | Classe principal | Interface de automação primária |
| ↳ **ConnectionHandler** | Composição (própria) | Comunicação WebSocket com CDP |
| ↳ **Browser** | Referência (pai) | Acesso ao estado e configuração em nível de navegador |
| ↳ **FindElementsMixin** | Herança | Capacidades de localização de elementos |
| ↳ **WebElement** | Fábrica (cria) | Representações individuais de elementos DOM |

### Integração de Domínio CDP

O `ConnectionHandler` roteia operações da Aba (Tab) para múltiplos domínios CDP:

```
Métodos da Aba            Domínio CDP          Propósito
━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━
go_to(), refresh()     →   Page            →  Navegação & ciclo de vida
execute_script()       →   Runtime         →  Execução JavaScript
find(), query()        →   Runtime/DOM     →  Localização de elementos
get_cookies()          →   Storage         →  Estado da sessão
enable_network_events()→   Network         →  Monitoramento de tráfego
enable_fetch_events()  →   Fetch           →  Interceptação de requisição
```

### Responsabilidades Principais

1. **Roteamento de Comandos CDP**: Traduz operações de alto nível em comandos CDP específicos do domínio
2. **Gerenciamento de Estado**: Rastreia domínios habilitados, callbacks ativos e estado da sessão
3. **Coordenação de Eventos**: Faz a ponte entre eventos CDP e callbacks definidos pelo usuário
4. **Fábrica de Elementos**: Cria instâncias de `WebElement` a partir de strings `objectId` do CDP
5. **Gerenciamento do Ciclo de Vida**: Lida com limpeza e desalocação de recursos

## Composição vs. Herança: O FindElementsMixin

Uma decisão arquitetural chave no domínio da Aba é **herdar de `FindElementsMixin`** em vez de usar composição:

```python
class Tab(FindElementsMixin):
    def __init__(self, ...):
        self._connection_handler = ConnectionHandler(...)
        # Métodos do Mixin agora estão disponíveis na Aba
```

**Por que herança aqui?**

| Abordagem | Prós | Contras | Escolha do Pydoll |
|----------|------|------|-----------------|
| **Herança** | API limpa (`tab.find()`), compatibilidade de tipo | Acoplamento forte | Usado |
| Composição | Baixo acoplamento, flexível | Verboso (`tab.finder.find()`), sobrecarga de wrapper | Não usado |

**Justificativa:** O padrão mixin se justifica porque:

- A localização de elementos é **central para a identidade da Aba** (toda aba pode encontrar elementos)
- O mixin é **sem estado (stateless)** - ele requer apenas `_connection_handler` (injeção de dependência via duck typing)
- A ergonomia da API importa - `tab.find()` é mais intuitivo do que `tab.elements.find()`

Veja a [Análise Profunda do FindElements Mixin](./find-elements-mixin.md) para detalhes arquiteturais.

## Arquitetura de Gerenciamento de Estado

A classe Tab gerencia **múltiplas camadas de estado**:

### 1. Flags de Habilitação de Domínio

```python
class Tab:
    def __init__(self, ...):
        self._page_events_enabled = False
        self._network_events_enabled = False
        self._fetch_events_enabled = False
        self._dom_events_enabled = False
        self._runtime_events_enabled = False
        self._intercept_file_chooser_dialog_enabled = False
```

**Por que flags explícitas?**

- **Idempotência**: Chamar `enable_page_events()` duas vezes não registra duplamente
- **Inspeção de estado**: Propriedades como `tab.page_events_enabled` expõem o estado atual
- **Rastreamento de limpeza**: Sabe quais domínios precisam ser desabilitados no fechamento da aba

**Alternativa (não usada):** Consultar o CDP sobre domínios habilitados a cada verificação → Muito lento, adiciona latência.

### 2. Identidade do Alvo (Target)

```python
self._target_id: str              # Identificador CDP único
self._browser_context_id: Optional[str]  # Contexto de isolamento
self._connection_port: int        # Porta WebSocket
```

**Decisão de design:** `target_id` é o **identificador primário**, não a instância da Aba em si. Isso permite:

- **Registro de Abas em nível de Navegador**: `Browser._tabs_opened[target_id] = tab`
- **Padrão Singleton**: O mesmo `target_id` sempre retorna a mesma instância de `Tab`
- **Reutilização de conexão**: Múltiplas operações na mesma aba compartilham o WebSocket

### 3. Estado Específico de Funcionalidades

```python
self._cloudflare_captcha_callback_id: Optional[int] = None  # Para limpeza
self._request: Optional[Request] = None  # Inicialização preguiçosa (lazy)
```

**Padrão de inicialização preguiçosa (lazy):** `Request` é criado apenas quando `tab.request` é acessado:

```python
@property
def request(self) -> Request:
    if self._request is None:
        self._request = Request(self)
    return self._request
```

**Por que preguiçosa (lazy)?** A maioria das automações não usa requisições HTTP no contexto do navegador. Economiza memória e tempo de inicialização.


## Execução JavaScript: Arquitetura de Contexto Duplo

O método `execute_script()` implementa **polimorfismo de contexto** - mesma interface, diferentes comandos CDP:

| Contexto | Método CDP | Caso de Uso |
|---------|-----------|----------|
| Global (sem elemento) | `Runtime.evaluate` | `document.title`, scripts globais |
| Vinculado ao elemento | `Runtime.callFunctionOn` | Operações específicas do elemento |

**Decisão arquitetural chave:** Autodetectar o modo de execução com base na presença do parâmetro `element`, eliminando APIs separadas (`evaluate()` vs. `call_function_on()`).

**Pipeline de transformação de script:**

1. Substitui `argument` → `this` (compatibilidade com Selenium)
2. Detecta se o script já está encapsulado em `function() { }`
3. Encapsula se necessário: `script` → `function() { script }`
4. Roteia para o comando CDP apropriado

**Por que a palavra-chave `argument`?** Caminho de migração para usuários do Selenium, familiaridade da API.

!!! info "Uso Prático"
    Veja [Interações Humanizadas](../features/automation/human-interactions.md) para padrões de execução de script do mundo real.

## Integração com o Sistema de Eventos

A Aba (Tab) atua como um **wrapper (invólucro) fino** sobre o sistema de eventos do ConnectionHandler, mas adiciona uma camada importante: **execução de callback não-bloqueante**.

```python
async def on(self, event_name: str, callback: Callable, temporary: bool = False) -> int:
    # Encapsula callbacks assíncronos para executar em background
    async def callback_wrapper(event):
        asyncio.create_task(callback(event))
    
    if asyncio.iscoroutinefunction(callback):
        function_to_register = callback_wrapper  # Wrapper não-bloqueante
    else:
        function_to_register = callback  # Callbacks síncronos executam diretamente
    
    # Delega o registro ao ConnectionHandler
    return await self._connection_handler.register_callback(
        event_name, function_to_register, temporary
    )
```

**Papel arquitetural:** A Aba fornece registro de eventos com escopo de aba e semântica de execução não-bloqueante, enquanto o ConnectionHandler lida com os mecanismos internos do WebSocket e a invocação sequencial de callbacks.

**Principais características:**

- **Execução em background** via `asyncio.create_task()` para callbacks assíncronos (disparar e esquecer)
- **Autodetecção de callback síncrono/assíncrono**
- **Callbacks temporários** para manipuladores de uso único
- **ID de Callback** para remoção explícita

**Modelo de execução:**

| Camada | Comportamento | Propósito |
|-------|----------|---------|
| **Callback do usuário** | Executa em tarefa de background | Nunca bloqueia outros callbacks ou comandos CDP |
| **Wrapper da Aba** | `create_task(callback())` | Inicia tarefa de background, retorna imediatamente |
| **EventsManager** | `await wrapper()` | Invoca wrappers sequencialmente para o mesmo evento |

**Por que o wrapper?** Sem ele, um callback assíncrono lento bloquearia outros callbacks para o mesmo evento. O wrapper `create_task` garante que todos os callbacks iniciem "simultaneamente" (em tarefas separadas), impedindo que um callback lento atrase os outros.

!!! info "Arquitetura Detalhada"
    Veja a [Análise Profunda da Arquitetura de Eventos](./event-architecture.md) para mecanismos internos de roteamento de eventos e o padrão de invocação sequencial do EventsManager.
    
    **Uso prático:** [Guia do Sistema de Eventos](../features/advanced/event-system.md)

## Estado da Sessão: Gerenciamento de Cookies

**Separação arquitetural:** Cookies são roteados para o **domínio Storage** (manipulação), não para o domínio Network (observação).

```python
async def set_cookies(self, cookies: list[CookieParam]):
    return await self._execute_command(
        StorageCommands.set_cookies(cookies, self._browser_context_id)
    )
```

**Design consciente de contexto:** O parâmetro `browser_context_id` garante o isolamento de cookies, permitindo automação multi-conta.

!!! info "Gerenciamento Prático de Cookies"
    Veja o [Guia de Cookies & Sessões](../features/browser-management/cookies-sessions.md) para padrões de uso e estratégias anti-detecção.

## Captura de Conteúdo: Restrições de Alvo (Target) CDP

**Limitação crítica:** `Page.captureScreenshot` só funciona em **alvos (targets) de nível superior**. Abas de Iframe falham silenciosamente (sem campo `data` na resposta).

```python
try:
    screenshot_data = response['result']['data']
except KeyError:
    raise TopLevelTargetRequired(...)  # Guia os usuários para WebElement.take_screenshot()
```

**Implicação de design:** Antes, o Pydoll criava instâncias de Tab dedicadas para iframes. Com o novo modelo, toda interação acontece no próprio `WebElement`, então capturas e outros utilitários devem ser executados nos elementos internos (por exemplo, `await (await iframe_element.find(...)).take_screenshot()`).

**Geração de PDF:** `Page.printToPDF` retorna dados codificados em base64. O Pydoll abstrai a E/S (I/O) de arquivo, mas os dados subjacentes são sempre base64 (especificação CDP).

!!! info "Uso Prático"
    Veja o [Guia de Screenshots & PDFs](../features/automation/screenshots-and-pdfs.md) para parâmetros, formatos e exemplos do mundo real.

## Monitoramento de Rede: Design com Estado (Stateful)

**Princípio arquitetural:** Métodos de rede exigem **estado habilitado** - verificações em tempo de execução impedem o acesso a dados inexistentes.

**Separação de armazenamento:**

- **Logs**: Armazenados em buffer no `ConnectionHandler` (recebe todos os eventos CDP)
- **Aba (Tab)**: Consulta o manipulador, sem armazenamento duplicado
- **Corpos de resposta (Response bodies)**: Recuperados sob demanda via `Network.getResponseBody(requestId)`

**Restrição de tempo crítica:** Corpos de resposta devem ser buscados **dentro de ~30s** após a resposta (coleta de lixo do navegador).

!!! info "Monitoramento de Rede na Prática"
    Veja o [Guia de Monitoramento de Rede](../features/network/monitoring.md) para rastreamento abrangente de eventos e padrões de análise.
    
    **Interceptação de requisições:** [Guia de Interceptação de Requisições](../features/network/interception.md)

## Gerenciamento de Diálogos: Padrão de Captura de Evento

**Comportamento crítico do CDP:** Diálogos JavaScript **bloqueiam todos os comandos CDP** até serem tratados.

**Solução arquitetural:** O `ConnectionHandler` captura eventos `Page.javascriptDialogOpening` imediatamente, evitando que a automação trave.

```python
# O Manipulador (Handler) armazena o evento de diálogo antes que o código do usuário rode
self._connection_handler.dialog  # Capturado pelo manipulador
# A Aba (Tab) consulta o evento armazenado
async def has_dialog(self) -> bool:
    return bool(self._connection_handler.dialog)
```

**Por que esse design?** O evento dispara antes que os callbacks do usuário sejam executados. Sem captura imediata, a automação entraria em impasse (deadlock) aguardando respostas CDP bloqueadas.

## Arquitetura de IFrame: Padrão de Reutilização de Aba

**Insight chave:** IFrames são **alvos (targets) CDP de primeira classe** → Representados como instâncias de `Tab`.

**Algoritmo de resolução de alvo:**

1. Extrai o atributo `src` do elemento iframe
2. Consulta todos os alvos CDP via `Target.getTargets()`
3. Corresponde a URL do iframe ao `targetId` do alvo
4. Verifica o registro singleton (`Browser._tabs_opened`)
5. Retorna a instância existente ou cria + registra uma nova Aba (Tab)

**Tradeoff (compromisso) de design:** Abas de Iframe herdam todos os métodos da Aba (Tab), mas alguns falham (ex: `take_screenshot()`). A alternativa (classe `IFrame` dedicada) duplicaria 90% da API para um benefício mínimo.

!!! info "Trabalhando com IFrames"
    Veja o [Guia de Interação com IFrame](../features/automation/iframes.md) para padrões práticos, frames aninhados e armadilhas comuns.

## Gerenciadores de Contexto: Limpeza Automática de Recursos

**Padrão arquitetural:** Restauração de estado + aquisição otimista de recursos.

### Principais Gerenciadores de Contexto

| Gerenciador | Padrão | Característica Chave |
|---------|---------|-------------|
| `expect_file_chooser()` | Restauração de estado | Restaura a habilitação do domínio ao sair |
| `expect_download()` | Recursos temporários | Limpeza automática de diretórios temporários |

**Design do Seletor de Arquivo (File Chooser):**

- Habilita domínios necessários (`Page`, interceptação de seletor de arquivo)
- Registra **callback temporário** (auto-remove após o primeiro disparo)
- Restaura o estado original ao sair (se os domínios estavam desabilitados antes, desabilita novamente)

**Design do Manipulador de Download:**

- Cria diretório temporário (ou usa o caminho fornecido)
- Usa `asyncio.Future` para coordenação (`will_begin_future`, `done_future`)
- Configuração em nível de navegador (downloads são por contexto, não por aba)
- Limpeza garantida via bloco `finally`

!!! info "Operações Práticas de Arquivo"
    Veja o [Guia de Operações de Arquivo](../features/automation/file-operations.md) para padrões de upload, uso do seletor de arquivos e manipulação de downloads.

## Ciclo de Vida: Fechamento e Invalidação da Aba

**Cascata de fechamento da aba:**

1. CDP fecha a aba do navegador (`Page.close`)
2. A Aba (Tab) desregistra-se de `Browser._tabs_opened`
3. O WebSocket fecha automaticamente (alvo CDP destruído)
4. Callbacks de evento sofrem coleta de lixo (garbage-collected)

**Comportamento pós-fechamento:** A instância da Aba se torna **inválida** - operações futuras falharão (WebSocket fechado).

**Decisão de design:** Sem flag `_closed` explícita. Os usuários gerenciam o ciclo de vida. A alternativa (rastreamento de estado) adiciona sobrecarga (overhead) para um benefício marginal de segurança.

## Principais Decisões Arquiteturais

### Estratégia de WebSocket por Aba

**Design escolhido:** Cada Aba (Tab) cria seu próprio ConnectionHandler com uma conexão WebSocket dedicada para `ws://localhost:port/devtools/page/{targetId}`.

**Justificativa:**

O CDP suporta **dois modelos de conexão**:

1. **Nível de Navegador**: Conexão única para `ws://localhost:port/devtools/browser/...` (usada pela instância do Navegador)
2. **Nível de Aba**: Conexões por aba para `ws://localhost:port/devtools/page/{targetId}` (usadas pelas instâncias de Aba)

O Pydoll usa **ambos**:

- O **Navegador (Browser)** tem seu próprio ConnectionHandler para operações em todo o navegador (contextos, downloads, eventos em nível de navegador)
- **Cada Aba (Tab)** tem seu próprio ConnectionHandler para operações específicas da aba (navegação, localização de elementos, eventos de aba)

**Benefícios de WebSockets por aba:**

- **Paralelismo verdadeiro**: Múltiplas abas podem executar comandos CDP simultaneamente sem esperar
- **Fluxos de eventos independentes**: Cada aba recebe apenas seus próprios eventos (sem necessidade de filtragem)
- **Falhas isoladas**: Problemas de conexão em uma aba não afetam outras
- **Roteamento simplificado**: Sem necessidade de demultiplexar mensagens por targetId

**Tradeoff (Compromisso):** Mais conexões abertas (uma por aba), mas o CDP e os navegadores lidam com isso eficientemente. Para 10 abas, são 11 conexões no total (1 navegador + 10 abas), o que é insignificante comparado às conexões HTTP que as próprias abas criam.

!!! info "Comunicação Navegador vs. Aba"
    Veja a [Arquitetura do Domínio do Navegador](./browser-domain.md) para detalhes sobre o ConnectionHandler em nível de navegador e como funciona a coordenação Navegador/Aba.

### Necessidade da Referência ao Navegador

**Por que a Aba armazena a referência `_browser`:**

- Consultas de contexto (`browser_context_id` para cookies)
- Operações em nível de navegador (comportamento de download, registro de iframe)
- Acesso à configuração (`browser.options.page_load_state`)

### Escolhas de Design da API

| Escolha | Justificativa |
|--------|-----------|
| **Propriedades Assíncronas** (`current_url`, `page_source`) | Sinaliza dados ao vivo + custo CDP |
| **Métodos `enable`/`disable` separados** | Explícito sobre implícito, corresponde à nomenclatura CDP |
| **Sem flag `_closed`** | Usuários gerenciam ciclo de vida, reduz sobrecarga |
| **Palavra-chave `argument` em scripts** | Compatibilidade com Selenium, caminho de migração |

## Relacionamento com Outros Domínios

O domínio da Aba (Tab) fica no **centro** da arquitetura do Pydoll:

```mermaid
graph TD
    Browser[Domínio do Navegador<br/>Ciclo de Vida & Processo] -->|cria| Tab[Domínio da Aba<br/>Interface de Automação]
    Tab -->|usa| ConnectionHandler[ConnectionHandler<br/>Comunicação CDP]
    Tab -->|cria| WebElement[Domínio do WebElement<br/>Interação com Elemento]
    Tab -->|herda| FindMixin[FindElementsMixin<br/>Estratégias de Localização]
    Tab -->|usa| Commands[Comandos CDP<br/>Protocolo Tipado]
    
    ConnectionHandler -->|despacha| Events[Sistema de Eventos]
    Tab -.->|referencia| Browser
    WebElement -.->|referencia| ConnectionHandler
```

**Relacionamentos chave:**

1. **Navegador → Aba**: Pai-filho. O Navegador gerencia o ciclo de vida da Aba e o estado compartilhado.
2. **Aba → ConnectionHandler**: Composição. A Aba delega a comunicação CDP.
3. **Aba → WebElement**: Fábrica. A Aba cria elementos a partir de strings `objectId`.
4. **Aba ← FindElementsMixin**: Herança. A Aba ganha métodos de localização de elementos.
5. **Aba ↔ Navegador**: Referência bidirecional. A Aba consulta o navegador para informações de contexto.

## Resumo: Filosofia de Design

O domínio da Aba (Tab) prioriza a **ergonomia da API** e a **correção (correctness)** sobre micro-otimizações:

- **Padrão Façade** abstrai a complexidade do CDP
- **Gerenciamento de estado** via flags explícitas previne habilitação dupla
- **Gerenciamento de recursos** através de gerenciadores de contexto
- **Coordenação de eventos** com execução em background (não-bloqueante)

**Principais tradeoffs (compromissos):**

| Decisão | Benefício | Custo | Veredito |
|----------|---------|------|---------|
| WebSocket por aba | Paralelismo verdadeiro | Mais conexões | Justificado |
| Herdar FindElementsMixin | API limpa | Acoplamento forte | Justificado |
| Inicialização preguiçosa (lazy) de Request | Eficiência de memória | Sobrecarga (overhead) de propriedade | Justificado |

## Leitura Adicional

**Guias práticos:**

- [Gerenciamento de Abas](../features/automation/tabs.md) - Padrões multi-aba, ciclo de vida, concorrência
- [Localização de Elementos](../features/element-finding.md) - Seletores e travessia do DOM
- [Sistema de Eventos](../features/advanced/event-system.md) - Monitoramento de navegador em tempo real

**Análises profundas de arquitetura:**

- [Arquitetura de Eventos](./event-architecture.md) - Mecanismos internos de WebSocket e roteamento de eventos
- [FindElements Mixin](./find-elements-mixin.md) - Algoritmos de resolução de seletores
- [Domínio do Navegador](./browser-domain.md) - Gerenciamento de processos e contextos

================================================
FILE: docs/pt/deep-dive/architecture/webelement-domain.md
================================================
# Arquitetura do Domínio WebElement

O domínio WebElement faz a ponte entre o código de automação de alto nível e a interação DOM de baixo nível através do Chrome DevTools Protocol. Este documento explora sua arquitetura interna, padrões de design e decisões de engenharia.

!!! info "Uso Prático"
    Para exemplos de uso e padrões de interação, veja:
    
    - [Guia de Localização de Elementos](../features/element-finding.md)
    - [Interações Humanizadas](../features/automation/human-interactions.md)
    - [Operações com Arquivos](../features/automation/file-operations.md)

## Visão Geral da Arquitetura

O WebElement representa uma **referência de objeto remoto** para um elemento DOM através do mecanismo `objectId` do CDP:

```
Código do Usuário → WebElement → ConnectionHandler → CDP Runtime → DOM do Navegador
```

**Principais características:**

- **Assíncrono por design**: Todas as operações seguem o padrão async/await do Python
- **Referência remota**: Mantém o `objectId` do CDP para o elemento no lado do navegador
- **Herança de Mixin**: Herda `FindElementsMixin` para buscas de elementos filhos
- **Estado híbrido**: Combina atributos em cache com consultas DOM em tempo real

### Estado Principal (Core)

```python
class WebElement(FindElementsMixin):
    def __init__(self, object_id: str, connection_handler: ConnectionHandler, ...):
        self._object_id = object_id              # Referência de objeto remoto CDP
        self._connection_handler = connection_handler  # Comunicação WebSocket
        self._attributes: dict[str, str] = {}    # Atributos HTML em cache
        self._search_method = method             # Como o elemento foi encontrado (debug)
        self._selector = selector                # Seletor original (debug)
```

**Por que atributos em cache?** A localização inicial do elemento retorna atributos HTML. O cache fornece acesso síncrono rápido a propriedades comuns (`id`, `class`, `tag_name`) sem chamadas CDP adicionais.

## Padrões de Design

### 1. Padrão de Comando (Command Pattern)

Todas as interações de elementos são traduzidas para comandos CDP:

| Operação do Usuário | Domínio CDP | Comando |
|----------------|-----------|---------|
| `element.click()` | Input | `Input.dispatchMouseEvent` |
| `element.text` | Runtime | `Runtime.callFunctionOn` |
| `element.bounds` | DOM | `DOM.getBoxModel` |
| `element.take_screenshot()` | Page | `Page.captureScreenshot` |

### 2. Padrão de Ponte (Bridge Pattern)

O WebElement abstrai a complexidade do protocolo CDP:

```python
async def click(self, x_offset=0, y_offset=0, hold_time=0.1):
    # API de alto nível
    
    # → Traduz para comandos CDP de baixo nível:
    # 1. DOM.getBoxModel (obter posição)
    # 2. Input.dispatchMouseEvent (pressionar)
    # 3. Input.dispatchMouseEvent (soltar)
```

### 3. Herança de Mixin para Buscas de Filhos

**Por que herdar FindElementsMixin?** Permite buscas relativas ao elemento:

```python
form = await tab.find(id='login-form')
username = await form.find(name='username')  # Busca dentro do formulário
```

**Decisão de design:** Composição (`form.finder.find()`) seria mais flexível, mas menos ergonômica. A herança foi escolhida pela simplicidade da API.

## Sistema de Propriedades Híbrido

**Inovação arquitetural:** O WebElement combina acesso a propriedades síncronas e assíncronas.

### Propriedades Síncronas (Atributos em Cache)

```python
@property
def id(self) -> str:
    return self._attributes.get('id')  # Dos atributos HTML em cache

@property  
def class_name(self) -> str:
    return self._attributes.get('class_name')  # 'class' → 'class_name' (palavra-chave do Python)
```

**Fonte:** Lista plana da resposta de localização do elemento CDP, analisada durante o `__init__`.

### Propriedades Assíncronas (Estado DOM em Tempo Real)

```python
@property
async def text(self) -> str:
    outer_html = await self.inner_html  # Chamada CDP
    soup = BeautifulSoup(outer_html, 'html.parser')
    return soup.get_text(strip=True)

@property
async def bounds(self) -> dict:
    response = await self._execute_command(DomCommands.get_box_model(self._object_id))
    # Analisar e retornar limites (bounds)
```

**Justificativa:** Texto e limites (bounds) são **dinâmicos** - eles mudam conforme a página é atualizada. Atributos são **estáticos** - capturados no momento da localização.

| Tipo de Propriedade | Acesso | Fonte | Caso de Uso |
|--------------|--------|--------|----------|
| Síncrona | `element.id` | Atributos em cache | Acesso rápido, dados estáticos |
| Assíncrona | `await element.text` | Consulta CDP ao vivo | Estado atual, dados dinâmicos |

## Implementação do Clique: Pipeline Multi-Estágio

Operações de clique seguem um pipeline sofisticado para garantir confiabilidade:

### 1. Detecção de Elemento Especial

```python
async def click(self, x_offset=0, y_offset=0, hold_time=0.1):
    # Estágio 1: Lidar com elementos especiais
    if self._is_option_tag():
        return await self.click_option_tag()  # <option> precisa de JavaScript para selecionar
```

**Por que tratamento especial?** Elementos `<option>` dentro de `<select>` não respondem a eventos de mouse. Requer JavaScript `selected = true`.

### 2. Verificação de Visibilidade

```python
    # Estágio 2: Verificar se o elemento está visível
    if not await self.is_visible():
        raise ElementNotVisible()
```

**Por que verificar?** Eventos de mouse do CDP miram coordenadas. Elementos ocultos receberiam cliques em posições erradas ou falhariam silenciosamente.

### 3. Cálculo de Posição

```python
    # Estágio 3: Rolar para visualização e obter posição
    await self.scroll_into_view()
    bounds = await self.bounds
    
    # Estágio 4: Calcular coordenadas do clique
    position_to_click = (
        bounds['x'] + bounds['width'] / 2 + x_offset,
        bounds['y'] + bounds['height'] / 2 + y_offset,
    )
```

**Suporte a offset (deslocamento):** Permite posições de clique variadas para comportamento semelhante ao humano (anti-detecção).

### 4. Despacho de Evento de Mouse

```python
    # Estágio 5: Enviar eventos de mouse CDP
    await self._execute_command(InputCommands.mouse_press(*position_to_click))
    await asyncio.sleep(hold_time)  # Espera configurável (padrão 0.1s)
    await self._execute_command(InputCommands.mouse_release(*position_to_click))
```

**Por que dois comandos?** Simula o comportamento real do mouse (pressionar → segurar → soltar). Alguns sites detectam cliques instantâneos como bots.

### Alternativa de Clique (Fallback): JavaScript

```python
async def click_using_js(self):
    """Fallback para elementos que não podem ser clicados via eventos de mouse."""
    await self.execute_script('this.click()')
```

**Quando usar:**

- Elementos ocultos (ex: inputs de arquivo estilizados com CSS)
- Elementos atrás de sobreposições (overlays)
- Cenários críticos de performance (pula verificações de visibilidade/posição)

!!! info "Cliques de Mouse vs. JavaScript"
    Veja [Interações Humanizadas](../features/automation/human-interactions.md) para saber quando usar cada abordagem e as implicações de detecção.

## Arquitetura de Screenshot: Regiões de Corte (Clip)

**Mecanismo chave:** `Page.captureScreenshot` com parâmetro `clip`.

```python
async def take_screenshot(self, path: str, quality: int = 100):
    # 1. Obter limites (bounds) do elemento (posição + dimensões)
    bounds = await self.get_bounds_using_js()
    
    # 2. Criar região de corte (clip)
    clip = Viewport(x=bounds['x'], y=bounds['y'], 
                    width=bounds['width'], height=bounds['height'], scale=1)
    
    # 3. Capturar apenas a região cortada
    screenshot = await self._execute_command(
        PageCommands.capture_screenshot(format=ScreenshotFormat.JPEG, clip=clip, quality=quality)
    )
```

**Por que limites (bounds) com JavaScript?** `DOM.getBoxModel` pode falhar para certos elementos. `getBoundingClientRect()` do JavaScript é uma alternativa (fallback) mais confiável.

**Limitação de formato:** Screenshots de elementos sempre usam JPEG (restrição do CDP com regiões de corte).

!!! info "Capacidades de Screenshot"
    Veja [Screenshots & PDFs](../features/automation/screenshots-and-pdfs.md) para comparação entre screenshots de página inteira vs. elementos.

## Contexto de Execução JavaScript

**Recurso crítico do CDP:** `Runtime.callFunctionOn(objectId, ...)` executa JavaScript **no contexto do elemento** (`this` = elemento).

```python
async def execute_script(self, script: str, return_by_value=False):
    return await self._execute_command(
        RuntimeCommands.call_function_on(self._object_id, script, return_by_value)
    )
```

**Casos de uso:**

- Verificações de visibilidade: `await element.is_visible()` → JavaScript verifica estilos computados
- Manipulação de estilo: `await element.execute_script("this.style.border = '2px solid red'")`
- Acesso a atributos: Algumas propriedades exigem JavaScript (ex: `value` para inputs)

**Alternativa (não usada):** Executar script global com seletor de elemento → Mais lento, arrisca referências obsoletas.

## Pipeline de Verificação de Estado

**Estratégia de confiabilidade:** Pré-verificar o estado do elemento antes de interações para prevenir falhas.

| Verificação | Propósito | Implementação |
|-------|---------|----------------|
| `is_visible()` | Elemento na viewport, não oculto | JavaScript: `offsetWidth > 0 && offsetHeight > 0` |
| `is_on_top()` | Sem sobreposições (overlays) bloqueando o elemento | JavaScript: `document.elementFromPoint(x, y) === this` |
| `is_interactable()` | Visível + no topo | Combina ambas as verificações |

**Por que JavaScript para visibilidade?** CSS `display: none`, `visibility: hidden`, `opacity: 0` todos afetam a visibilidade de formas diferentes. JavaScript fornece uma verificação unificada.

## Estratégias de Performance

### 1. Otimização Específica da Operação

**Princípio:** Escolher a abordagem mais rápida para cada tipo de operação.

| Operação | Abordagem Primária | Justificativa |
|-----------|-----------------|-----------|
| Extração de texto | Análise (parsing) com BeautifulSoup | Mais preciso que o `innerText` do JavaScript |
| Verificação de visibilidade | JavaScript | Chamada CDP única vs. múltiplas consultas DOM |
| Clique | Eventos de mouse CDP | Mais realista, necessário para anti-detecção |
| Limites (Bounds) | `DOM.getBoxModel` | Mais rápido que JavaScript, com JS como fallback |

### 2. Computação Local

**Minimizar viagens de ida e volta ao CDP (round-trips)** computando localmente quando possível:

```python
# Bom: Consulta única de limites (bounds), cálculo local
bounds = await element.bounds
click_x = bounds['x'] + bounds['width'] / 2 + offset_x
click_y = bounds['y'] + bounds['height'] / 2 + offset_y

# Ruim: Múltiplas chamadas CDP para matemática simples
click_x = await element.execute_script('return this.offsetLeft + this.offsetWidth / 2')
click_y = await element.execute_script('return this.offsetTop + this.offsetHeight / 2')
```

### 3. Atributos em Cache

**Decisão de design:** Armazenar atributos estáticos em cache no momento da criação:

```python
# Acesso síncrono rápido (sem chamada CDP)
element_id = element.id
element_class = element.class_name
```

**Tradeoff (Compromisso):** Atributos não refletirão mudanças em tempo de execução. Para propriedades dinâmicas, use assíncrono: `await element.text`.

## Principais Decisões Arquiteturais

| Decisão | Justificativa |
|----------|-----------|
| **Herdar FindElementsMixin** | Permite buscas de filhos, mantém consistência da API |
| **Propriedades híbridas síncronas/assíncronas** | Equilibra performance (síncrono) com dados atualizados (assíncrono) |
| **Alternativas (fallbacks) com JavaScript** | Confiabilidade acima da performance para operações críticas |
| **Detecção de elementos especiais** | `<option>`, `<input type="file">` exigem tratamento único |
| **Verificações de visibilidade pré-clique** | Falhar rápido (fail fast) com erros claros vs. falhas silenciosas |

## Resumo

O domínio WebElement faz a ponte entre o código de automação Python e o DOM do navegador através de:

- **Referências de objetos remotos** via `objectId` do CDP
- **Sistema de propriedades híbrido** equilibrando atributos síncronos e estado assíncrono
- **Pipelines de interação multi-estágio** garantindo confiabilidade
- **Tratamento especializado** para variações de tipos de elementos

**Principais tradeoffs (compromissos):**

| Decisão | Benefício | Custo | Veredito |
|----------|---------|------|---------|
| Herança de Mixin | API limpa | Acoplamento forte | Justificado |
| Atributos em cache | Acesso síncrono rápido | Risco de dados obsoletos | Justificado |
| Alternativas (fallbacks) com JavaScript | Confiabilidade | Perda de performance | Justificado |
| Pré-verificações de visibilidade | Erros claros | Chamadas CDP extras | Justificado |

## Leitura Adicional

**Guias práticos:**

- [Localização de Elementos](../features/element-finding.md) - Localizando elementos, seletores
- [Interações Humanizadas](../features/automation/human-interactions.md) - Clicar, digitar, realismo
- [Operações com Arquivos](../features/automation/file-operations.md) - Uploads e downloads de arquivos

**Análises profundas de arquitetura:**

- [FindElements Mixin](./find-elements-mixin.md) - Pipeline de resolução de seletores
- [Domínio da Aba (Tab)](./tab-domain.md) - A Aba como fábrica de elementos
- [Camada de Conexão](./connection-layer.md) - Comunicação WebSocket

================================================
FILE: docs/pt/deep-dive/fingerprinting/behavioral-fingerprinting.md
================================================
# Fingerprinting Comportamental

O fingerprinting comportamental analisa como os usuários interagem com aplicações web, em vez de quais ferramentas eles usam. Enquanto fingerprints de rede e navegador podem ser falsificados definindo os valores corretos, o comportamento humano segue padrões biomecânicos difíceis de replicar de forma convincente. Sistemas de detecção coletam movimentos de mouse, tempos de digitação, comportamento de scroll e sequências de interação, e então usam modelos estatísticos para distinguir humanos de automação.

Este documento cobre as técnicas de detecção, a ciência por trás delas, e como os recursos de humanização do Pydoll abordam cada vetor.

!!! info "Navegação do Módulo"
    - [Network Fingerprinting](./network-fingerprinting.md): Fingerprinting de protocolo TCP/IP, TLS, HTTP/2
    - [Browser Fingerprinting](./browser-fingerprinting.md): Canvas, WebGL, propriedades do navigator
    - [Técnicas de Evasão](./evasion-techniques.md): Contramedidas práticas

## Análise de Movimento do Mouse

O movimento do mouse é um dos indicadores comportamentais mais poderosos porque o controle motor humano segue leis biomecânicas que automação simples não consegue replicar. Sistemas de detecção coletam eventos `mousemove` (cada um contendo coordenadas x, y e um timestamp) e analisam a trajetória em busca de propriedades que distinguem movimento orgânico de teleporte programático do cursor.

### Lei de Fitts

A Lei de Fitts descreve o tempo necessário para mover um ponteiro até um alvo. A formulação de Shannon (MacKenzie, 1992), que é a versão mais amplamente utilizada, estabelece:

```
T = a + b * log2(D/W + 1)
```

Onde `T` é o tempo de movimento, `a` é uma constante representando tempo de reação/início, `b` é uma constante representando a velocidade inerente do dispositivo de entrada, `D` é a distância até o alvo, e `W` é a largura (tamanho) do alvo. A relação logarítmica significa que dobrar a distância adiciona uma quantidade fixa de tempo, enquanto reduzir pela metade o tamanho do alvo adiciona a mesma quantidade fixa.

As implicações para detecção de bots são significativas. Humanos levam mais tempo para alcançar alvos pequenos e distantes e alcançam alvos grandes e próximos rapidamente. Eles aceleram no início de um movimento, atingem velocidade máxima aproximadamente no meio do caminho e desaceleram ao se aproximar do alvo. Bots que movem o cursor em tempo constante independentemente da distância e tamanho do alvo violam a Lei de Fitts e são trivialmente detectáveis.

Sistemas de detecção medem o tempo de movimento para cada evento de clique, calculam o tempo esperado a partir da distância e tamanho do alvo, e sinalizam movimentos significativamente mais rápidos do que a Lei de Fitts prevê ou que não mostram correlação entre distância/tamanho e tempo de movimento.

### Forma da Trajetória

Movimentos humanos da mão entre dois pontos não são linhas retas. A pesquisa de Abend, Bizzi e Morasso (1982) mostrou que os caminhos das mãos são tipicamente curvados devido a restrições biomecânicas das articulações e músculos do braço. Flash e Hogan (1985) demonstraram que movimentos de alcance humanos seguem trajetórias de jerk mínimo, onde a trajetória minimiza a integral do jerk (a derivada da aceleração) ao longo da duração do movimento. O perfil de velocidade resultante tem forma de sino, e a posição ao longo da trajetória é descrita por um polinômio quíntico (grau 5):

```
x(t) = x0 + (xf - x0) * (10t^3 - 15t^4 + 6t^5)
```

onde `t` é o tempo normalizado de 0 a 1, e `x0`/`xf` são as posições inicial e final. Isso produz aceleração suave a partir do repouso, velocidade máxima aproximadamente no meio do caminho e desaceleração suave de volta ao repouso.

Sistemas de detecção analisam curvatura da trajetória, perfis de velocidade e padrões de aceleração. Os sinais específicos que procuram incluem:

**Detecção de linha reta.** Um caminho perfeitamente reto entre dois pontos (curvatura zero em cada amostra) é o sinal de bot mais óbvio. Caminhos humanos sempre têm alguma curvatura devido às articulações rotacionais do braço.

**Velocidade constante.** Humanos mostram um perfil de velocidade em forma de sino (acelerar, pico, desacelerar). Uma velocidade constante durante todo o movimento indica interpolação linear, que é o comportamento padrão da maioria das ferramentas de automação.

**Ausência de sub-movimentos.** Movimentos longos são compostos por múltiplos sub-movimentos sobrepostos (Meyer et al., 1988), cada um com seu próprio pico de velocidade. Um movimento cobrindo 500+ pixels com um único pico de velocidade suave é suspeito; movimentos reais dessa distância tipicamente mostram 2-4 picos de velocidade.

**Sem overshoot.** Humanos frequentemente ultrapassam o alvo ligeiramente (por 5-15 pixels) e fazem uma pequena correção de volta. Movimentos perfeitamente precisos que acertam exatamente no alvo toda vez são estatisticamente improváveis.

### Entropia de Movimento

Entropia, neste contexto, mede a imprevisibilidade do caminho do mouse. Sistemas de detecção dividem a trajetória em segmentos, medem a mudança de direção em cada ponto e calculam a entropia de Shannon sobre a distribuição de mudanças de direção. Uma linha reta tem entropia zero (cada segmento aponta na mesma direção). Uma caminhada aleatória tem entropia máxima. O movimento humano tem entropia moderada a alta, refletindo a combinação de direção intencional e variabilidade involuntária.

Entropia baixa em muitos movimentos de mouse em uma sessão é um sinal forte de bot, mesmo que movimentos individuais tenham curvatura plausível.

### Humanização de Mouse do Pydoll

O Pydoll implementa humanização abrangente do mouse através do parâmetro `humanize=True` em operações de clique. Quando habilitado, o módulo de mouse gera movimentos que abordam cada um dos vetores de detecção descritos acima:

O caminho segue uma curva Bezier cúbica com pontos de controle aleatorizados, produzindo curvatura natural em vez de linhas retas. A velocidade ao longo do caminho segue um perfil de jerk mínimo (`10t^3 - 15t^4 + 6t^5`), produzindo a curva de velocidade em forma de sino característica do movimento humano. A duração do movimento é calculada usando a Lei de Fitts com constantes configuráveis (`a=0.070`, `b=0.150` por padrão).

Tremor fisiológico é simulado adicionando ruído Gaussiano às posições do cursor, com amplitude inversamente proporcional à velocidade (tremor é mais visível quando a mão se move lentamente, o que corresponde à fisiologia real). Overshoot ocorre com 70% de probabilidade, ultrapassando o alvo em 3-12% da distância total antes de fazer um movimento de correção. Micro-pausas (15-40ms) ocorrem com 3% de probabilidade durante o movimento, simulando hesitações breves.

```python
# Clique humanizado básico
await element.click(humanize=True)

# A classe Mouse também pode ser usada diretamente para mais controle
from pydoll.interactions.mouse import Mouse

mouse = Mouse(connection_handler)
await mouse.click(500, 300, humanize=True)
```

!!! note "O que o Pydoll Não Faz"
    A humanização de mouse do Pydoll atualmente não modela sub-movimentos para distâncias muito longas (o caminho é um único segmento Bezier). Para a maioria das interações web, onde distâncias são menores que 500 pixels, isso é suficiente. Movimentos extremamente longos (travessias diagonais de tela inteira) podem se beneficiar de suporte futuro a múltiplos segmentos.

## Dinâmica de Digitação

A dinâmica de digitação analisa os padrões de tempo da entrada do teclado. A técnica remonta aos operadores de telégrafo na década de 1850, que podiam identificar uns aos outros pelo "punho" do código Morse (padrão de tempo característico). Sistemas modernos medem o tempo com precisão de milissegundos através de eventos `keydown` e `keyup`.

### Características de Tempo

As duas medições fundamentais são tempo de permanência (a duração entre `keydown` e `keyup` para uma única tecla, tipicamente 50-200ms para humanos) e tempo de voo (a duração entre soltar uma tecla e pressionar a próxima, tipicamente 80-400ms). A combinação de tempos de permanência e voo para pares de teclas consecutivas é chamada de latência de dígrafo.

Latências de dígrafo não são uniformes. Elas dependem do par de teclas específico (bigrama) sendo digitado, porque digitação é uma habilidade motora onde sequências comuns são armazenadas como memória procedural. Os fatores biomecânicos chave são:

**Alternância de mãos.** Bigramas digitados com mãos alternadas (como "th", onde "t" é mão esquerda e "h" é mão direita no QWERTY) são geralmente mais rápidos que bigramas da mesma mão (como "de", onde ambas as teclas são na mão esquerda). A mão alternada pode começar seu movimento enquanto a primeira mão ainda está completando sua tecla.

**Distância dos dedos.** Transições entre teclas da fileira inicial (home row) são as mais rápidas. Alcançar a fileira superior ou inferior adiciona tempo proporcional à distância física que o dedo deve percorrer.

**Independência dos dedos.** Combinações de dedo anelar e mínimo na mesma mão são mais lentas que combinações de indicador e médio, porque o anelar e o mínimo compartilham tendões e têm menos controle motor independente.

**Efeitos de frequência.** Bigramas frequentemente digitados (como "th", "er", "in" em inglês) são executados mais rapidamente devido à memória motora, independentemente de seu layout físico.

### Sinais de Detecção

Sistemas de detecção procuram vários sinais que distinguem digitação humana de automação:

**Tempo de permanência zero ou constante.** Muitas ferramentas de automação despacham eventos `keydown` e `keyup` com atraso zero ou quase zero entre eles (menos de 5ms). Pressionamentos reais de teclas têm tempos de permanência mensuráveis. Tempo de permanência constante em todas as teclas é igualmente suspeito.

**Tempo de voo uniforme.** Definir um intervalo fixo entre teclas (como `type_text("hello", interval=0.1)`) produz tempo perfeitamente regular que é trivialmente detectável. Tempos de voo humanos variam por bigrama, fadiga e carga cognitiva.

**Sem erros de digitação.** Em entrada de texto extensa (50+ caracteres), a ausência completa de pressionamentos de backspace ou delete é incomum. Humanos cometem erros a uma taxa de aproximadamente 1-5% dependendo da proficiência de digitação e complexidade do texto.

**Velocidade sobre-humana.** Digitação sustentada acima de 150 WPM está além da capacidade de todos exceto digitadores competitivos de elite. Ferramentas de automação que despacham caracteres mais rápido que isso são imediatamente sinalizadas.

### Humanização de Teclado do Pydoll

O `type_text(humanize=True)` do Pydoll aborda cada vetor de detecção com parâmetros configuráveis:

Atrasos entre teclas são extraídos de uma distribuição uniforme (30-120ms por padrão) em vez de um intervalo fixo. Caracteres de pontuação (`.!?;:,`) recebem atraso adicional (80-180ms), simulando a pausa que ocorre quando um digitador considera a estrutura da frase. Pausas de pensamento (300-700ms) ocorrem com 2% de probabilidade, simulando breves momentos de reflexão. Pausas de distração (500-1200ms) ocorrem com 0.5% de probabilidade, simulando o digitador desviando o olhar ou sendo brevemente interrompido.

Erros de digitação realistas ocorrem com aproximadamente 2% de probabilidade por caractere, com cinco tipos de erro distintos ponderados por sua frequência no mundo real: erros de tecla adjacente (55%, pressionar uma tecla vizinha no QWERTY), transposições (20%, trocar dois caracteres consecutivos), pressionamentos duplos (12%, pressionar uma tecla duas vezes), caracteres pulados (8%, hesitar antes de digitar corretamente) e espaços esquecidos (5%, esquecer um espaço entre palavras). Cada tipo de erro inclui uma sequência de recuperação realista (pausa, backspace, correção) com tempo apropriado.

```python
# Digitação humanizada
await element.type_text("Hello, world!", humanize=True)

# Com configuração de tempo personalizada
from pydoll.interactions.keyboard import Keyboard, TimingConfig, TypoConfig

config = TimingConfig(
    keystroke_min=0.04,
    keystroke_max=0.15,
    thinking_probability=0.03,
)
keyboard = Keyboard(connection_handler, timing_config=config)
await keyboard.type_text("Custom timing example", humanize=True)
```

!!! note "O que o Pydoll Não Faz"
    A humanização de teclado do Pydoll usa atrasos aleatórios uniformes em vez de temporização ciente de bigramas. Não modela variação de tempo de permanência por tecla ou diferenças de velocidade de alternância de mãos. Para a maioria dos cenários de automação (preenchimento de formulários, consultas de busca), variação uniforme é suficiente para passar na detecção comportamental. Aplicações que requerem evasão de biometria de digitação em nível de autenticação precisariam de modelos de tempo personalizados.

## Análise de Comportamento de Scroll

O fingerprinting de scroll analisa como os usuários navegam verticalmente (e horizontalmente) pelo conteúdo da página. A distinção entre scroll humano e automatizado é marcante: chamadas programáticas `window.scrollTo()` produzem saltos instantâneos e discretos, enquanto scroll humano via roda do mouse, trackpad ou toque produz um fluxo de pequenos eventos incrementais com momentum e desaceleração.

### Características Físicas do Scroll

Scroll por roda do mouse produz eventos `wheel` discretos com valores de delta consistentes (tipicamente 100 ou 120 pixels por notch, dependendo do SO e navegador). Os eventos chegam em intervalos irregulares refletindo quão rapidamente o usuário gira a roda. Scroll por trackpad produz muitos eventos pequenos com deltas decrescentes, simulando momentum físico. Scroll por toque é similar ao trackpad mas com deltas iniciais maiores e caudas de desaceleração mais longas.

Sistemas de detecção analisam a distribuição de delta, timing entre eventos e curva de desaceleração. Uma chamada `scrollTo(0, 5000)` produz um único salto sem eventos intermediários, que é fundamentalmente diferente das centenas de eventos incrementais que um scroll humano gera.

### Sinais de Detecção

**Scroll instantâneo.** Usar `window.scrollTo()` ou `window.scrollBy()` com valores grandes produz zero eventos de scroll intermediários. Sistemas de detecção que escutam eventos `scroll` veem a posição de scroll mudar em um único frame.

**Deltas uniformes.** Simulação programática de scroll que despacha eventos wheel com valores de delta constantes (ex: sempre 100 pixels) carece da variação natural no scroll humano, onde valores de delta flutuam em 10-30% devido à pressão inconsistente dos dedos.

**Sem desaceleração.** Scroll humano, especialmente em trackpads, tem uma fase de momentum onde o scroll continua após o usuário levantar o dedo, com velocidade exponencialmente decrescente. Scroll automatizado que para abruptamente carece dessa cauda de desaceleração.

**Ausência de mudanças de direção.** Humanos frequentemente scrollam demais e scrollam de volta ligeiramente, ou pausam no meio de uma página para ler conteúdo. Scroll automatizado que se move em uma direção com velocidade constante sem pausas ou reversões é suspeito.

### Humanização de Scroll do Pydoll

O módulo de scroll do Pydoll implementa scroll humanizado através de `scroll.by(position, distance, humanize=True)`:

O scroll segue uma curva de easing Bezier cúbica (pontos de controle `0.645, 0.045, 0.355, 1.0` por padrão), produzindo aceleração e desaceleração naturais. Jitter por frame de ±3 pixels adiciona variação aos valores de delta. Micro-pausas (20-50ms) ocorrem com 5% de probabilidade, simulando paradas breves de leitura. Overshoot ocorre com 15% de probabilidade, scrollando 2-8% além do alvo e corrigindo de volta. Para grandes distâncias, o scroll é dividido em múltiplos gestos de "flick" (100-1200 pixels cada), simulando como um usuário real scrolla por uma página longa com deslizes repetidos em vez de um único movimento contínuo.

```python
from pydoll.interactions.scroll import Scroll, ScrollPosition

scroll = Scroll(connection_handler)

# Scroll humanizado para baixo 800 pixels
await scroll.by(ScrollPosition.Y, 800, humanize=True)

# Scroll até o topo/fundo usa múltiplos flicks semelhantes a humanos
await scroll.to_bottom(humanize=True)
```

## Vetores de Detecção Adicionais

Além da análise de mouse, teclado e scroll, sistemas de detecção sofisticados monitoram vários outros sinais comportamentais.

### Foco e Visibilidade

A API de Visibilidade de Página (`document.visibilityState`) e eventos de foco (`window.onfocus`, `window.onblur`) revelam se o usuário está ativamente visualizando a página. Uma sessão de usuário real inclui trocas de aba, minimizações de janela e períodos de inatividade. Um script de automação que mantém foco contínuo por horas sem um único evento blur é comportamentalmente anômalo. Da mesma forma, `document.hasFocus()` retornando `true` continuamente por períodos prolongados é incomum.

### Padrões de Inatividade

Usuários reais têm períodos naturais de inatividade: lendo conteúdo, pensando antes de agir, sendo distraídos. Sistemas de detecção medem a distribuição de tempos de inatividade entre interações. Uma sessão onde cada ação segue a anterior dentro de 100-500ms sem pausas mais longas segue um padrão que é estatisticamente distinto da navegação humana, onde períodos de inatividade de 2-30 segundos entre ações são normais.

### Integridade de Sequência de Eventos

Navegadores geram sequências de eventos específicas para interações do usuário. Um clique de mouse produz `pointerdown`, `mousedown`, `pointerup`, `mouseup`, `click` nessa ordem, precedido por eventos `pointermove`/`mousemove` mostrando o cursor se aproximando do alvo do clique. Ferramentas de automação que despacham um evento `click` sem o movimento precedente e eventos de ponteiro são detectáveis através de análise de sequência de eventos.

O despacho de eventos baseado em CDP do Pydoll gera sequências completas de eventos porque usa a simulação de entrada do Chrome, que produz a mesma cadeia de eventos que entrada real do usuário.

## Detecção por Machine Learning

Sistemas anti-bot modernos (DataDome, Akamai Bot Manager, Cloudflare Bot Management, PerimeterX/HUMAN Security) não usam regras de limiar simples. Eles treinam modelos de machine learning em milhões de sessões de usuários reais e milhões de sessões de bots conhecidos, aprendendo a distinguir humanos de automação com base em 50+ características simultaneamente.

Esses modelos capturam propriedades estatísticas difíceis de enumerar como regras individuais: a distribuição conjunta de velocidade de movimento e curvatura, a correlação entre velocidade de digitação e taxa de erro, a relação entre profundidade de scroll e tempo de leitura, e o "ritmo" geral de uma sessão de navegação. Um sistema que passa em cada verificação individual mas tem correlações sutilmente erradas entre características ainda pode ser sinalizado por um modelo bem treinado.

A implicação prática é que a evasão comportamental deve ser consistente em todos os tipos de interação, não apenas individualmente plausível. O parâmetro `humanize=True` do Pydoll fornece uma camada de humanização coerente entre interações de mouse, teclado e scroll, mas o desenvolvedor ainda é responsável pela plausibilidade comportamental de nível mais alto: adicionar atrasos de leitura entre carregamentos de página, variar o ritmo de workflows de múltiplas páginas e incluir períodos naturais de inatividade.

## Referências

- Fitts, P. M. (1954). The Information Capacity of the Human Motor System in Controlling the Amplitude of Movement. Journal of Experimental Psychology.
- MacKenzie, I. S. (1992). Fitts' Law as a Research and Design Tool in Human-Computer Interaction. Human-Computer Interaction.
- Flash, T., & Hogan, N. (1985). The Coordination of Arm Movements: An Experimentally Confirmed Mathematical Model. Journal of Neuroscience.
- Abend, W., Bizzi, E., & Morasso, P. (1982). Human Arm Trajectory Formation. Brain.
- Meyer, D. E., Abrams, R. A., Kornblum, S., Wright, C. E., & Smith, J. E. K. (1988). Optimality in Human Motor Performance. Psychological Review.
- Ahmed, A. A. E., & Traore, I. (2007). A New Biometric Technology Based on Mouse Dynamics. IEEE TDSC.


================================================
FILE: docs/pt/deep-dive/fingerprinting/browser-fingerprinting.md
================================================
# Browser Fingerprinting

O browser fingerprinting identifica clientes analisando propriedades expostas através de APIs JavaScript, cabeçalhos HTTP e motores de renderização. Diferentemente do network fingerprinting, que examina sinais de nível de protocolo do kernel do SO e biblioteca TLS, o browser fingerprinting tem como alvo a camada de aplicação: o navegador específico, sua versão, sua configuração e o hardware em que roda. Esses sinais são acessíveis a qualquer site através de APIs web padrão, e a combinação de propriedades suficientes cria um fingerprint que é frequentemente único entre milhões de visitantes.

!!! info "Navegação do Módulo"
    - [Network Fingerprinting](./network-fingerprinting.md): Fingerprinting de protocolo TCP/IP, TLS, HTTP/2
    - [Behavioral Fingerprinting](./behavioral-fingerprinting.md): Análise de mouse, teclado, scroll
    - [Técnicas de Evasão](./evasion-techniques.md): Contramedidas práticas

## Propriedades JavaScript do Navigator

O objeto `navigator` é a fonte mais rica de dados de fingerprinting de navegador. Ele expõe dezenas de propriedades que revelam o navegador, suas capacidades e o sistema em que roda. Sistemas de detecção coletam essas propriedades, fazem referência cruzada entre elas e contra cabeçalhos HTTP, e sinalizam inconsistências.

O seguinte JavaScript coleta o conjunto central de propriedades que sistemas de fingerprinting tipicamente examinam:

```javascript
const fingerprint = {
    // Identidade
    userAgent: navigator.userAgent,
    platform: navigator.platform,
    vendor: navigator.vendor,

    // Idioma e locale
    language: navigator.language,
    languages: navigator.languages,

    // Hardware
    hardwareConcurrency: navigator.hardwareConcurrency,
    deviceMemory: navigator.deviceMemory,
    maxTouchPoints: navigator.maxTouchPoints,

    // Recursos
    cookieEnabled: navigator.cookieEnabled,
    doNotTrack: navigator.doNotTrack,
    webdriver: navigator.webdriver,

    // Tela
    screenWidth: screen.width,
    screenHeight: screen.height,
    colorDepth: screen.colorDepth,
    devicePixelRatio: window.devicePixelRatio,

    // Chrome do navegador (barra de ferramentas, dimensões da scrollbar)
    chromeHeight: window.outerHeight - window.innerHeight,
    chromeWidth: window.outerWidth - window.innerWidth,

    // Timezone
    timezone: Intl.DateTimeFormat().resolvedOptions().timeZone,
    timezoneOffset: new Date().getTimezoneOffset(),
};
```

Várias dessas propriedades merecem atenção individual porque carregam mais peso de fingerprinting ou são mais comumente mal configuradas por ferramentas de automação.

### Consistência de Platform e User-Agent

A propriedade `navigator.platform` retorna uma string como `Win32`, `MacIntel` ou `Linux x86_64`. Sistemas de detecção comparam isso com o cabeçalho User-Agent. Se o User-Agent HTTP afirma `Windows NT 10.0` mas `navigator.platform` retorna `Linux x86_64`, a inconsistência é um sinal forte. Este é um dos erros mais comuns em automação: definir um User-Agent personalizado via `--user-agent=` sem também sobrescrever a plataforma.

### Propriedades de Hardware

`navigator.hardwareConcurrency` retorna o número de núcleos lógicos de CPU. Um valor de 1 ou 2 sugere uma VM ou container mínimo em vez de uma máquina real de usuário. `navigator.deviceMemory` reporta RAM aproximada em gigabytes (0.25, 0.5, 1, 2, 4, 8). Esta propriedade só está disponível em navegadores Chromium; Firefox e Safari retornam `undefined`. Ambos os valores devem ser consistentes com o dispositivo declarado: um User-Agent alegando um desktop moderno mas reportando 1 núcleo e 0.5 GB de RAM é suspeito.

### Propriedade WebDriver

A propriedade `navigator.webdriver` é `true` quando o navegador é controlado por automação baseada em WebDriver (Selenium, Playwright em modo WebDriver). Este é o indicador de automação mais óbvio. O Pydoll usa CDP (Chrome DevTools Protocol) diretamente, que não define esta flag. Em um navegador controlado pelo Pydoll, `navigator.webdriver` é `false`, correspondendo ao comportamento de uma sessão normal de usuário.

### Plugins

A propriedade `navigator.plugins` foi historicamente um forte vetor de fingerprinting porque diferentes navegadores e configurações de SO expunham diferentes listas de plugins. Navegadores Chromium modernos (Chrome 90+) retornam uma lista fixa de cinco plugins relacionados a PDF independentemente do estado real dos plugins:

```javascript
// Chrome moderno sempre retorna estes 5 plugins:
// 1. PDF Viewer
// 2. Chrome PDF Viewer
// 3. Chromium PDF Viewer
// 4. Microsoft Edge PDF Viewer
// 5. WebKit built-in PDF
console.log(navigator.plugins.length); // 5
```

Um equívoco comum alega que navegadores modernos retornam arrays vazios para `navigator.plugins`. Isto é incorreto. Retornar um array vazio é em si um sinal de detecção que sugere modo headless ou um cliente HTTP não-navegador.

### Dimensões de Tela e Janela

A diferença entre `window.outerWidth`/`outerHeight` e `window.innerWidth`/`innerHeight` representa o chrome do navegador (barras de ferramentas, scrollbars, moldura da janela). Navegadores headless frequentemente reportam diferença zero porque não têm UI visível. Sistemas de detecção sinalizam clientes onde `outerWidth` é igual a `innerWidth` como potencialmente headless. Da mesma forma, `screen.width` correspondendo a `innerWidth` exatamente sugere uma janela headless maximizada em vez de uma sessão desktop normal.

O `devicePixelRatio` varia por display: monitores padrão reportam `1.0`, displays Retina de MacBook reportam `2.0`, e smartphones reportam `2.0` a `3.0`. Este valor deve ser consistente com o dispositivo declarado no User-Agent.

## User-Agent Client Hints

Navegadores Chromium modernos (Chrome, Edge, Opera) complementam a string User-Agent tradicional com cabeçalhos Client Hints: `Sec-CH-UA`, `Sec-CH-UA-Platform`, `Sec-CH-UA-Mobile`, e (sob demanda) valores de maior entropia como `Sec-CH-UA-Full-Version-List`, `Sec-CH-UA-Arch` e `Sec-CH-UA-Bitness`.

```http
Sec-CH-UA: "Chromium";v="120", "Google Chrome";v="120", "Not:A-Brand";v="99"
Sec-CH-UA-Mobile: ?0
Sec-CH-UA-Platform: "Windows"
```

Client Hints fornecem dados estruturados e legíveis por máquina que são mais difíceis de falsificar de forma inconsistente. Um servidor pode comparar o cabeçalho `Sec-CH-UA-Platform` com `navigator.platform`, a string User-Agent e o fingerprint TCP/IP. Qualquer inconsistência entre essas camadas é um sinal de detecção.

O equivalente no lado JavaScript é `navigator.userAgentData`, que expõe `brands`, `mobile` e `platform` como valores de baixa entropia, e `getHighEntropyValues()` para informações detalhadas de versão, arquitetura e bitness:

```javascript
// Baixa entropia (sempre disponível, sem necessidade de permissão)
console.log(navigator.userAgentData.brands);
// [{brand: "Chromium", version: "120"}, {brand: "Google Chrome", version: "120"}, ...]
console.log(navigator.userAgentData.platform); // "Windows"
console.log(navigator.userAgentData.mobile);   // false

// Alta entropia (requer promise, pode requerer permissão)
const highEntropy = await navigator.userAgentData.getHighEntropyValues([
    'architecture', 'bitness', 'platformVersion', 'uaFullVersion'
]);
// {architecture: "x86", bitness: "64", platformVersion: "15.0.0", ...}
```

!!! warning "Suporte de Navegador"
    Client Hints são um recurso exclusivo do Chromium. Firefox e Safari não enviam cabeçalhos `Sec-CH-UA` e não expõem `navigator.userAgentData`. Se o User-Agent alega Firefox mas o servidor recebe cabeçalhos Client Hints, o cliente não é Firefox.

## Canvas Fingerprinting

O canvas fingerprinting explora o fato de que a API Canvas do HTML5 produz saída de pixels sutilmente diferente em diferentes combinações de GPU, driver gráfico, SO e navegador. A variação vem de diferenças na rasterização de fontes (renderização sub-pixel, hinting, anti-aliasing), execução de shader específica da GPU, precisão de ponto flutuante no pipeline gráfico e bibliotecas de renderização de texto no nível do SO (DirectWrite no Windows, Core Text no macOS, FreeType no Linux).

A técnica desenha texto, formas e gradientes em um canvas oculto, extrai os dados de pixel e faz hash:

```javascript
function generateCanvasFingerprint() {
    const canvas = document.createElement('canvas');
    canvas.width = 220;
    canvas.height = 30;
    const ctx = canvas.getContext('2d');

    // Retângulo colorido (expõe diferenças de blending)
    ctx.fillStyle = '#f60';
    ctx.fillRect(125, 1, 62, 20);

    // Texto com emoji (maximiza variação de renderização)
    ctx.font = '14px Arial';
    ctx.textBaseline = 'alphabetic';
    ctx.fillStyle = '#069';
    ctx.fillText('Cwm fjordbank glyphs vext quiz, 😃', 2, 15);

    // Sobreposição semi-transparente (expõe diferenças de composição alfa)
    ctx.fillStyle = 'rgba(102, 204, 0, 0.7)';
    ctx.fillText('Cwm fjordbank glyphs vext quiz, 😃', 4, 17);

    return canvas.toDataURL();
}
```

O pangrama "Cwm fjordbank glyphs vext quiz" é escolhido porque usa combinações incomuns de caracteres que estressam a renderização de fontes. O emoji adiciona outra dimensão porque a renderização de emoji varia significativamente entre sistemas operacionais. A sobreposição semi-transparente testa composição alfa, que difere entre implementações de GPU.

O canvas fingerprinting é eficaz para distinguir categorias amplas de dispositivos, mas sua unicidade é às vezes exagerada. A pesquisa de Laperdrix et al. (2016) encontrou que fingerprints de canvas sozinhos fornecem poder de distinção moderado, e seu verdadeiro valor vem da combinação com outros sinais (WebGL, propriedades do navigator, timezone) para alcançar alta unicidade.

!!! note "Injeção de Ruído no Canvas"
    Algumas ferramentas de privacidade injetam ruído aleatório na saída do canvas para quebrar o fingerprinting. Sistemas de detecção contra-atacam solicitando o fingerprint do canvas múltiplas vezes na mesma sessão. Se o hash muda entre requisições, injeção de ruído está presente, o que é em si um sinal de detecção. Randomizar a saída do canvas é, portanto, contraproducente: não previne a identificação e revela o uso de ferramentas anti-fingerprinting.

Como o Pydoll controla uma instância real do Chrome com renderização GPU real, o fingerprint de canvas é autêntico e consistente entre leituras repetidas. Nenhuma injeção ou falsificação é necessária.

## WebGL Fingerprinting

O WebGL fingerprinting estende o canvas fingerprinting para o pipeline de renderização 3D. É mais poderoso porque expõe diretamente identificadores de hardware que são difíceis de falsificar.

Os dados mais distintivos vêm da extensão `WEBGL_debug_renderer_info`, que revela o fabricante e modelo da GPU:

```javascript
function getWebGLFingerprint() {
    const canvas = document.createElement('canvas');
    const gl = canvas.getContext('webgl');
    if (!gl) return null;

    // Identificação da GPU (mais distintivo)
    const debugInfo = gl.getExtension('WEBGL_debug_renderer_info');
    const vendor = debugInfo
        ? gl.getParameter(debugInfo.UNMASKED_VENDOR_WEBGL)
        : gl.getParameter(gl.VENDOR);
    const renderer = debugInfo
        ? gl.getParameter(debugInfo.UNMASKED_RENDERER_WEBGL)
        : gl.getParameter(gl.RENDERER);

    return {
        vendor,    // ex: "Google Inc. (NVIDIA)"
        renderer,  // ex: "ANGLE (NVIDIA, NVIDIA GeForce RTX 3080 Direct3D11 vs_5_0 ps_5_0)"
        version: gl.getParameter(gl.VERSION),
        shadingLanguageVersion: gl.getParameter(gl.SHADING_LANGUAGE_VERSION),
        maxTextureSize: gl.getParameter(gl.MAX_TEXTURE_SIZE),
        extensions: gl.getSupportedExtensions(),
    };
}
```

A string do renderer nomeia diretamente o hardware da GPU. Um cliente alegando ser um dispositivo móvel mas reportando uma GPU desktop é obviamente inconsistente. Máquinas virtuais frequentemente reportam renderizadores de software como "SwiftShader" ou "llvmpipe", que usuários reais quase nunca têm.

Além de metadados, o WebGL pode renderizar uma cena 3D (um triângulo gradiente, por exemplo) e fazer hash da saída de pixels, produzindo um fingerprint de renderização análogo ao canvas fingerprinting mas no pipeline 3D. A combinação de identificadores de GPU, extensões suportadas, limites de parâmetros (`MAX_TEXTURE_SIZE`, `MAX_VIEWPORT_DIMS`) e formatos de precisão de shader cria um fingerprint detalhado da pilha gráfica.

## AudioContext Fingerprinting

A Web Audio API gera fingerprints processando áudio e medindo a saída. A técnica padrão cria um `OscillatorNode`, roteia através de um `DynamicsCompressorNode`, e lê as amostras de áudio resultantes de um `AnalyserNode` ou `OfflineAudioContext`. Diferenças nas implementações de processamento de áudio entre navegadores e pilhas de áudio do SO produzem saída distinta.

```javascript
function getAudioFingerprint() {
    const ctx = new OfflineAudioContext(1, 44100, 44100);
    const oscillator = ctx.createOscillator();
    oscillator.type = 'triangle';
    oscillator.frequency.setValueAtTime(10000, ctx.currentTime);

    const compressor = ctx.createDynamicsCompressor();
    compressor.threshold.setValueAtTime(-50, ctx.currentTime);
    compressor.knee.setValueAtTime(40, ctx.currentTime);
    compressor.ratio.setValueAtTime(12, ctx.currentTime);
    compressor.attack.setValueAtTime(0, ctx.currentTime);
    compressor.release.setValueAtTime(0.25, ctx.currentTime);

    oscillator.connect(compressor);
    compressor.connect(ctx.destination);
    oscillator.start(0);

    return ctx.startRendering().then(buffer => {
        const data = buffer.getChannelData(0);
        // Hash de um subconjunto das amostras de áudio
        let hash = 0;
        for (let i = 4500; i < 5000; i++) {
            hash += Math.abs(data[i]);
        }
        return hash;
    });
}
```

O AudioContext fingerprinting é menos amplamente implantado que canvas ou WebGL fingerprinting, mas adiciona outra dimensão ao fingerprint geral. O sinal é particularmente útil para distinguir navegadores no mesmo SO, já que o processamento de áudio varia mais entre motores de navegador do que entre versões de SO.

## Battery Status API

A Battery Status API (`navigator.getBattery()`) expõe o nível de bateria do dispositivo, status de carregamento e tempos estimados de carga/descarga. Esses valores criam um fingerprint de curta duração mas único para a duração de uma sessão.

Esta API só está disponível em navegadores Chromium. O Firefox a removeu na versão 52 (2017) citando preocupações de privacidade, e o Safari nunca a implementou. Sistemas de detecção que veem resultados da Battery API de um cliente alegando ser Firefox ou Safari sabem que o cliente está representando falsamente sua identidade.

## Fingerprinting de Cabeçalhos HTTP

Além de APIs JavaScript, cabeçalhos HTTP fornecem sinais de fingerprinting visíveis ao servidor antes de qualquer JavaScript executar.

### Ordem dos Cabeçalhos

Navegadores enviam cabeçalhos HTTP em uma ordem consistente e específica por versão. O Chrome coloca cabeçalhos `Sec-CH-UA` cedo, antes de `User-Agent`. O Firefox lidera com `User-Agent` seguido por `Accept` e `Accept-Language`. Bibliotecas HTTP automatizadas como `requests` ou `httpx` do Python enviam cabeçalhos em outra ordem, tipicamente começando com `Host` e `Connection`.

Sistemas de detecção registram a ordem dos primeiros 10-15 cabeçalhos e comparam contra assinaturas de navegadores conhecidos. Mesmo que todos os valores de cabeçalho individuais estejam corretos, enviá-los na ordem errada revela que a requisição não foi gerada pelo navegador declarado. Como o Pydoll controla uma instância real do Chrome, a ordem dos cabeçalhos é autêntica.

### Accept-Encoding

Navegadores modernos suportam compressão Brotli (`br`) além de `gzip` e `deflate`. O Chrome também suporta `zstd`. O `Accept-Encoding` do Chrome moderno se parece com `gzip, deflate, br, zstd`. Um cliente alegando ser Chrome mas sem Brotli é desatualizado ou automatizado.

### Consistência de Accept-Language

O cabeçalho `Accept-Language` deve ser consistente com `navigator.language`, `navigator.languages`, o timezone e a geolocalização do IP. Uma requisição com `Accept-Language: en-US` de um IP em Tóquio com timezone `Asia/Tokyo` é plausível para um viajante mas suspeita em combinação com outros sinais. Uma requisição com `Accept-Language: zh-CN` e timezone `America/New_York` de um IP de datacenter chinês é um forte indicador de proxy.

## Implicações para o Pydoll

Porque o Pydoll controla um navegador Chromium real através do CDP, todos os fingerprints de nível de navegador são autênticos por padrão. Os fingerprints de canvas, WebGL e AudioContext vêm de hardware real de GPU e áudio. As propriedades do navigator, plugins e dimensões de tela refletem o estado real do navegador. Cabeçalhos HTTP, incluindo sua ordem, são gerados pela pilha de rede do Chrome.

O principal risco na automação é inconsistência entre camadas. Definir um User-Agent personalizado sem sincronizar propriedades relacionadas cria incompatibilidades trivialmente detectáveis. O Pydoll lida com isso automaticamente: quando detecta `--user-agent=` nos argumentos do navegador, usa `Emulation.setUserAgentOverride` para sincronizar a string User-Agent, plataforma e metadados completos de Client Hints em todas as camadas. Também injeta sobrescritas de `navigator.vendor` e `navigator.appVersion` via `Page.addScriptToEvaluateOnNewDocument` para garantir consistência em abas recém-abertas.

Para consistência de timezone e geolocalização (para corresponder à localização do IP do proxy), sobrescritas JavaScript podem definir `Intl.DateTimeFormat().resolvedOptions().timeZone` e `Date.prototype.getTimezoneOffset`. A flag `--lang` e `set_accept_languages()` configuram cabeçalhos de idioma. A opção `webrtc_leak_protection` previne que o WebRTC exponha o IP real por trás de um proxy.

O princípio geral é que o Pydoll fornece o fingerprint autêntico do navegador como linha de base, e o desenvolvedor só precisa garantir que as camadas configuráveis (User-Agent, timezone, idioma, geolocalização) sejam consistentes entre si e com as características do proxy.

## Referências

- Laperdrix, P., Rudametkin, W., & Baudry, B. (2016). Beauty and the Beast: Diverting Modern Web Browsers to Build Unique Browser Fingerprints. IEEE S&P.
- Mowery, K., & Shacham, H. (2012). Pixel Perfect: Fingerprinting Canvas in HTML5. Web 2.0 Security & Privacy (W2SP).
- Eckersley, P. (2010). How Unique Is Your Web Browser? Privacy Enhancing Technologies Symposium.
- W3C Client Hints Infrastructure: https://wicg.github.io/client-hints-infrastructure/
- BrowserLeaks: https://browserleaks.com/
- CreepJS: https://abrahamjuliot.github.io/creepjs/


================================================
FILE: docs/pt/deep-dive/fingerprinting/evasion-techniques.md
================================================
# Técnicas de Evasão

Este documento cobre técnicas práticas para evadir detecção de fingerprinting usando o Pydoll. As seções anteriores descreveram como a detecção funciona em cada camada: [network fingerprinting](./network-fingerprinting.md) (TCP/IP, TLS, HTTP/2), [browser fingerprinting](./browser-fingerprinting.md) (Canvas, WebGL, propriedades do navigator) e [behavioral fingerprinting](./behavioral-fingerprinting.md) (mouse, teclado, scroll). Esta seção foca em contramedidas.

O princípio central é consistência entre camadas. Passar em uma camada de detecção enquanto falha em outra ainda resulta em sinalização. Um IP residencial com um fingerprint TCP incompatível, ou um fingerprint de navegador perfeito com movimentos de mouse robóticos, será detectado por qualquer sistema que correlacione sinais.

!!! info "Navegação do Módulo"
    - [Network Fingerprinting](./network-fingerprinting.md): Identificação em nível de protocolo
    - [Browser Fingerprinting](./browser-fingerprinting.md): Detecção na camada de aplicação
    - [Behavioral Fingerprinting](./behavioral-fingerprinting.md): Análise de comportamento humano

## O que o Pydoll Fornece por Padrão

Antes de configurar qualquer coisa, é útil entender o que o Pydoll te dá gratuitamente ao usar uma instância real do Chrome via CDP.

**Fingerprints de rede autênticos.** A pilha TCP/IP do sistema operacional, a implementação TLS do Chrome (BoringSSL) e sua pilha HTTP/2 produzem fingerprints genuínos. O TLS ClientHello, frame HTTP/2 SETTINGS, ordem de pseudo-cabeçalhos e prioridades de stream correspondem a um navegador Chrome real. Ferramentas que constroem requisições HTTP programaticamente (requests, httpx, curl) produzem fingerprints não-navegador nessas camadas. Com o Pydoll, eles são autênticos por padrão.

**Fingerprints de navegador autênticos.** Fingerprints de Canvas, WebGL e AudioContext vêm de hardware real de GPU e áudio. Propriedades do navigator, plugins (os 5 plugins PDF padrão) e tipos MIME refletem estado genuíno do navegador. Não há nada para configurar aqui.

**Sem `navigator.webdriver`.** Selenium, Playwright e Puppeteer definem `navigator.webdriver` como `true`. O Pydoll usa CDP diretamente, que não define esta flag. A propriedade permanece `false`, correspondendo a uma sessão normal de usuário.

**Sequências de eventos completas.** Quando o Pydoll despacha eventos de entrada através do domínio Input do CDP, o Chrome gera a cadeia completa de eventos (pointermove, pointerdown, mousedown, pointerup, mouseup, click) exatamente como faria para entrada real do usuário.

## Consistência de User-Agent

A inconsistência de fingerprinting mais comum em automação é uma incompatibilidade entre o cabeçalho HTTP `User-Agent`, `navigator.userAgent` no JavaScript, `navigator.platform` e cabeçalhos Client Hints (`Sec-CH-UA`, `Sec-CH-UA-Platform`). Definir `--user-agent=` como flag do Chrome altera apenas a string User-Agent (cabeçalho HTTP e `navigator.userAgent`), deixando `navigator.platform`, `navigator.userAgentData` e os cabeçalhos Client Hints inalterados.

O Pydoll resolve isso automaticamente. Quando detecta `--user-agent=` nos argumentos do navegador, ele:

1. Analisa a string UA para extrair nome do navegador, versão e SO.
2. Chama `Emulation.setUserAgentOverride` via CDP com o `userAgent` completo, o valor correto de `platform` (ex: `Win32` para Windows) e `userAgentMetadata` completo (dados de Client Hints incluindo `Sec-CH-UA`, `Sec-CH-UA-Platform`, `Sec-CH-UA-Full-Version-List`).
3. Injeta sobrescritas de `navigator.vendor` e `navigator.appVersion` via `Page.addScriptToEvaluateOnNewDocument`, garantindo consistência mesmo em abas recém-abertas.

```python
from pydoll.browser.chromium import Chrome
from pydoll.browser.options import ChromiumOptions

options = ChromiumOptions()
options.add_argument(
    '--user-agent=Mozilla/5.0 (Windows NT 10.0; Win64; x64) '
    'AppleWebKit/537.36 (KHTML, like Gecko) '
    'Chrome/120.0.6099.109 Safari/537.36'
)

async with Chrome(options=options) as browser:
    tab = await browser.start()
    # Todas as camadas agora são consistentes:
    # - Cabeçalho HTTP User-Agent
    # - navigator.userAgent / navigator.platform / navigator.appVersion
    # - Sec-CH-UA / Sec-CH-UA-Platform / Sec-CH-UA-Full-Version-List
    # - navigator.userAgentData.brands / .platform
    await tab.go_to('https://example.com')
```

Essa sobrescrita é aplicada automaticamente à aba inicial, novas abas de `browser.new_tab()`, e quaisquer abas descobertas via `browser.get_opened_tabs()`.

!!! note "Plataformas Suportadas"
    O parser de UA lida com Chrome, Edge, Windows (NT 6.1 até 10.0), macOS, Linux, Android, iOS e Chrome OS. Ele gera valores de marca GREASE adequados seguindo a especificação do Chromium.

## Consistência de Timezone e Locale

Ao usar um proxy, o timezone e idioma do navegador devem corresponder à localização geográfica do IP do proxy. Um IP geolocalizado em Tóquio com timezone `America/New_York` e `Accept-Language: en-US` é uma inconsistência detectável.

### Configuração de Idioma

O idioma é configurado através de flags do Chrome e da API de opções do Pydoll:

```python
options = ChromiumOptions()
options.add_argument('--lang=ja-JP')
options.set_accept_languages('ja-JP,ja;q=0.9,en;q=0.8')
```

Isso define tanto o cabeçalho HTTP `Accept-Language` quanto `navigator.language` / `navigator.languages`.

### Sobrescrita de Timezone

O Pydoll atualmente não encapsula o comando `Emulation.setTimezoneOverride` do CDP, então a sobrescrita de timezone requer injeção de JavaScript. As APIs críticas para sobrescrever são `Intl.DateTimeFormat().resolvedOptions().timeZone` e `Date.prototype.getTimezoneOffset()`:

```python
async def set_timezone(tab, timezone_id: str, offset_minutes: int):
    """
    Override the page timezone via JavaScript.

    Replaces ``Intl.DateTimeFormat`` with a wrapper that defaults the
    ``timeZone`` option to ``timezone_id`` and makes
    ``Date.prototype.getTimezoneOffset()`` return ``offset_minutes``.

    Args:
        tab: Object exposing an awaitable ``execute_script(script)``.
        timezone_id: IANA timezone name (e.g. 'Asia/Tokyo')
        offset_minutes: UTC offset in minutes as reported by
            ``getTimezoneOffset()`` (e.g. -540 for JST)
    """
    import json

    # json.dumps produces valid JavaScript literals, so quotes or backslashes
    # in the arguments cannot terminate the string and inject code.
    tz_literal = json.dumps(timezone_id)
    offset_literal = json.dumps(int(offset_minutes))

    # The IIFE keeps the helper bindings out of the page's global scope, which
    # also makes the script safe to inject more than once.
    script = f'''
        (() => {{
            const origDTF = Intl.DateTimeFormat;
            const patchedDTF = function(...args) {{
                // Copy the options: the caller's object stays untouched and
                // an explicitly requested timeZone is respected.
                const opts = Object.assign({{}}, args[1]);
                if (opts.timeZone === undefined) {{
                    opts.timeZone = {tz_literal};
                }}
                return new origDTF(args[0], opts);
            }};
            Object.defineProperty(patchedDTF, 'prototype', {{
                value: origDTF.prototype
            }});
            // Keep the static API available on the replacement constructor.
            patchedDTF.supportedLocalesOf = origDTF.supportedLocalesOf.bind(origDTF);
            Intl.DateTimeFormat = patchedDTF;
            Date.prototype.getTimezoneOffset = function() {{ return {offset_literal}; }};
        }})();
    '''
    await tab.execute_script(script)
```

!!! warning "`execute_script` vs `addScriptToEvaluateOnNewDocument`"
    `tab.execute_script()` executa JavaScript no contexto da página atual. Se a página navegar, a sobrescrita é perdida. Para sobrescritas que devem persistir entre navegações, use `Page.addScriptToEvaluateOnNewDocument` do CDP, que injeta o script antes de qualquer JavaScript da página executar em cada novo carregamento de documento. O Pydoll usa isso internamente para sobrescritas de User-Agent. Para timezone, você pode enviar o comando CDP diretamente:

    ```python
    await tab._connection_handler.execute_command(
        'Page.addScriptToEvaluateOnNewDocument',
        {'source': script}
    )
    ```

### Sobrescrita de Geolocalização

Para sites que solicitam permissão de geolocalização, a API de Geolocation pode ser sobrescrita via JavaScript:

```python
async def set_geolocation(tab, latitude: float, longitude: float):
    """
    Override the Geolocation API of the current page via JavaScript.

    ``getCurrentPosition`` and ``watchPosition`` are replaced so that they
    report the given coordinates to the success callback.

    Args:
        tab: Object exposing an awaitable ``execute_script(script)``.
        latitude: Latitude to report, in decimal degrees.
        longitude: Longitude to report, in decimal degrees.
    """
    script = f'''
        navigator.geolocation.getCurrentPosition = function(success) {{
            success({{
                coords: {{
                    latitude: {latitude}, longitude: {longitude},
                    accuracy: 1, altitude: null, altitudeAccuracy: null,
                    heading: null, speed: null
                }},
                timestamp: Date.now()
            }});
        }};
        navigator.geolocation.watchPosition = function(success) {{
            navigator.geolocation.getCurrentPosition(success);
            // The real API returns a numeric watch id for clearWatch().
            return 1;
        }};
    '''
    await tab.execute_script(script)
```

## Proteção contra Vazamento WebRTC

O WebRTC pode expor o endereço IP real do cliente mesmo ao usar um proxy, através de requisições a servidores STUN/TURN que ignoram o túnel do proxy. O Pydoll fornece uma opção integrada para prevenir isso:

```python
options = ChromiumOptions()
options.webrtc_leak_protection = True
# Adiciona: --force-webrtc-ip-handling-policy=disable_non_proxied_udp
```

Isso força o Chrome a rotear todo o tráfego WebRTC através do proxy, prevenindo vazamento de IP. Deve ser habilitado sempre que usar um proxy para automação stealth.

## Humanização Comportamental

O Pydoll implementa interações humanizadas para mouse, teclado e scroll através do parâmetro `humanize=True`. Estes não são recursos futuros ou soluções manuais; estão integrados ao framework.

### Mouse

```python
# Clique humanizado: caminho com curva Bezier, tempo pela Lei de Fitts,
# velocidade de jerk mínimo, tremor, overshoot + correção
await element.click(humanize=True)
```

Quando `humanize=True` é passado para o `click()` de um WebElement, o Pydoll gera um movimento completo do mouse da posição atual do cursor até o elemento usando uma curva Bezier cúbica com pontos de controle aleatorizados. A velocidade segue um perfil de jerk mínimo. Tremor fisiológico, overshoot (70% de probabilidade) e micro-pausas são adicionados. A duração do movimento é calculada pela Lei de Fitts baseada na distância e tamanho do alvo. Veja [Behavioral Fingerprinting](./behavioral-fingerprinting.md#humanização-de-mouse-do-pydoll) para descrições detalhadas dos parâmetros.

### Teclado

```python
# Digitação humanizada: atrasos variáveis, erros realistas (~2%),
# pausas de pontuação, pausas de pensamento, pausas de distração
await element.type_text("Hello, world!", humanize=True)
```

A digitação humanizada usa atrasos inter-tecla variáveis (distribuição uniforme de 30-120ms), pausas de pontuação, pausas de pensamento (2% de probabilidade), pausas de distração (0.5% de probabilidade) e erros de digitação realistas com cinco tipos de erro distintos e sequências de correção naturais. Veja [Behavioral Fingerprinting](./behavioral-fingerprinting.md#humanização-de-teclado-do-pydoll) para o detalhamento completo dos parâmetros.

### Scroll

```python
from pydoll.interactions.scroll import Scroll, ScrollPosition

scroll = Scroll(connection_handler)
# Scroll humanizado: easing Bezier, jitter, micro-pausas, overshoot
await scroll.by(ScrollPosition.Y, 800, humanize=True)
```

O scroll humanizado usa curvas de easing Bezier, jitter por frame (±3px), micro-pausas (5% de probabilidade) e correção de overshoot (15% de probabilidade). Grandes distâncias são divididas em múltiplos gestos de "flick". Veja [Behavioral Fingerprinting](./behavioral-fingerprinting.md#humanização-de-scroll-do-pydoll) para detalhes.

## Interceptação de Requisições

O Pydoll suporta interceptação de requisições via domínio Fetch do CDP, permitindo modificar cabeçalhos, bloquear requisições ou fornecer respostas personalizadas antes que cheguem ao servidor:

```python
from pydoll.protocol.fetch.events import FetchEvent

async def handle_request(event):
    """
    Resume a paused request, advertising Brotli support when it is missing.

    The request id and headers are read from ``event['params']``. If an
    ``Accept-Encoding`` header is present without ``br``, it is rewritten;
    the request is then continued through ``tab.continue_request`` with the
    headers converted to a list of name/value entries.
    """
    params = event['params']
    request_id = params['requestId']
    headers = params['request'].get('headers', {})

    # Example: make sure Brotli support is advertised
    if 'Accept-Encoding' in headers:
        if 'br' not in headers['Accept-Encoding']:
            headers['Accept-Encoding'] = 'gzip, deflate, br, zstd'

    header_list = []
    for name, value in headers.items():
        header_list.append({'name': name, 'value': value})
    await tab.continue_request(request_id=request_id, headers=header_list)

await tab.enable_fetch_events()
await tab.on(FetchEvent.REQUEST_PAUSED, handle_request)
```

Na prática, modificação de cabeçalhos é raramente necessária com o Pydoll porque o Chrome gera cabeçalhos corretos nativamente. A interceptação de requisições é mais útil para bloquear scripts de rastreamento, modificar conteúdo de resposta ou depuração.

## Preferências do Navegador para Realismo

O Chrome armazena preferências do usuário que sistemas de fingerprinting podem inspecionar. Um perfil de navegador novo sem histórico, sem preferências salvas e tudo padrão parece diferente de um perfil que foi usado por semanas. A opção `browser_preferences` do Pydoll permite pré-popular estas:

```python
import time

options = ChromiumOptions()
options.browser_preferences = {
    'profile': {
        'created_by_version': '120.0.6099.130',
        'creation_time': str(time.time() - 90 * 86400),  # 90 dias atrás
        'exit_type': 'Normal',
    },
    'profile.default_content_setting_values': {
        'cookies': 1,
        'images': 1,
        'javascript': 1,
        'notifications': 2,  # "Perguntar" (padrão realista)
    },
}
```

## Erros Comuns

### Randomizar Tudo

Gerar um fingerprint aleatório do zero (hardwareConcurrency aleatório, deviceMemory aleatório, tamanho de tela aleatório) cria combinações impossíveis. Dispositivos reais têm configurações restritas: uma máquina de 4 núcleos com 8 GB de RAM, tela 1920x1080 e Windows 10 é um perfil plausível. Uma máquina de 17 núcleos com 0.5 GB de RAM, tela 3840x2160 e `navigator.platform: Linux armv7l` não é. Use perfis capturados de navegadores reais em vez de geração aleatória.

### Injeção de Ruído no Canvas

Adicionar ruído aleatório à saída do canvas para prevenir fingerprinting é contraproducente. Sistemas de detecção solicitam o fingerprint múltiplas vezes. Se o hash muda entre requisições, injeção de ruído é detectada, o que é em si um sinal forte de automação. Com o Pydoll, o fingerprint de canvas é autêntico e consistente. Deixe-o como está.

### User-Agents Desatualizados

Usar um User-Agent de uma versão de navegador com 6+ meses é detectável porque a versão carece de recursos e valores de Client Hints que a versão atual teria. Mantenha strings de User-Agent atuais dentro das últimas 2-3 versões principais do Chrome.

### Ignorar Comportamento em Nível de Sessão

Mesmo com fingerprints perfeitos e interações humanizadas, o comportamento em nível de sessão importa. Carregar 100 páginas em 60 segundos, nunca scrollar, clicar apenas em botões (nunca links) e manter foco constante por horas sem uma única troca de aba ou período ocioso são todas anomalias comportamentais. Adicione atrasos de leitura entre navegações, varie o ritmo de workflows de múltiplas páginas e inclua períodos naturais de inatividade.

## Verificação

Antes de implantar automação em escala, verifique seu fingerprint usando estas ferramentas:

| Ferramenta | URL | Testes |
|------|-----|-------|
| BrowserLeaks | https://browserleaks.com/ | Canvas, WebGL, fontes, IP, WebRTC, HTTP/2 |
| CreepJS | https://abrahamjuliot.github.io/creepjs/ | Detecção de mentiras, verificações de consistência |
| Fingerprint.com | https://fingerprint.com/demo/ | Identificação de nível comercial |
| PixelScan | https://pixelscan.net/ | Análise de detecção de bots |
| IPLeak | https://ipleak.net/ | WebRTC, DNS, vazamentos de IP |

Um script básico de verificação com o Pydoll:

```python
async def verify_fingerprint(tab):
    """
    Collect basic fingerprint properties from the page and sanity-check them.

    Args:
        tab: Object exposing an awaitable ``execute_script(script)`` whose
            response holds the evaluated value under
            ``['result']['result']['value']``.

    Returns:
        The dict of collected fingerprint properties.

    Raises:
        AssertionError: If an obvious automation signal is found.
    """
    result = await tab.execute_script('''
        return {
            userAgent: navigator.userAgent,
            platform: navigator.platform,
            webdriver: navigator.webdriver,
            languages: navigator.languages,
            plugins: navigator.plugins.length,
            timezone: Intl.DateTimeFormat().resolvedOptions().timeZone,
            colorDepth: screen.colorDepth,
            deviceMemory: navigator.deviceMemory,
            hardwareConcurrency: navigator.hardwareConcurrency,
        };
    ''')
    fp = result['result']['result']['value']

    # Check for obvious problems.
    # A regular Chrome session reports `false`, and a property that evaluates
    # to `undefined` may be absent from the serialized value, so accept any
    # falsy or missing value instead of requiring None.
    assert not fp.get('webdriver'), 'navigator.webdriver deveria ser false ou undefined'
    assert fp['plugins'] == 5, f'Esperados 5 plugins, obtidos {fp["plugins"]}'
    assert 'HeadlessChrome' not in fp['userAgent'], 'Headless detectado no UA'
    return fp
```

## Referências

- Chrome DevTools Protocol, Emulation Domain: https://chromedevtools.github.io/devtools-protocol/tot/Emulation/
- Chrome DevTools Protocol, Fetch Domain: https://chromedevtools.github.io/devtools-protocol/tot/Fetch/
- Chromium Source, Inspector Emulation Agent: https://source.chromium.org/chromium/chromium/src/+/main:third_party/blink/renderer/core/inspector/inspector_emulation_agent.cc


================================================
FILE: docs/pt/deep-dive/fingerprinting/index.md
================================================
# Análise Profunda de Fingerprinting de Navegador e Rede

Este módulo cobre fingerprinting de navegador e rede, um aspecto crítico dos sistemas modernos de automação web e detecção.

O fingerprinting situa-se na interseção de protocolos de rede, criptografia, componentes internos do navegador e análise comportamental. Ele engloba as técnicas usadas para identificar e rastrear dispositivos, navegadores e usuários através de sessões sem depender de identificadores tradicionais como cookies ou endereços IP.

## Por que Isso Importa

Cada conexão de navegador a um site expõe múltiplas características, desde a ordem precisa das opções TCP em pacotes de rede, até a renderização de canvas específica da GPU, e padrões de tempo de execução de JavaScript. Individualmente, essas características podem parecer inócuas. Combinadas, elas criam um fingerprint (impressão digital) que pode identificar unicamente um dispositivo ou instância de navegador.

Para engenheiros de automação, desenvolvedores de bots e usuários conscientes da privacidade, entender o fingerprinting é essencial para construir sistemas eficazes de evasão de detecção e para compreender como os mecanismos de rastreamento operam em um nível técnico.

!!! danger "Sistemas de Detecção Multi-Camada"
    Sistemas anti-bot modernos empregam análise abrangente em múltiplas camadas:
    
    - **Nível de Rede**: Comportamento da pilha TCP/IP, padrões de handshake TLS, configurações HTTP/2
    - **Nível de Navegador**: Renderização de Canvas, strings de fornecedor WebGL, enumeração de propriedades JavaScript
    - **Comportamental**: Entropia de movimento do mouse, tempo de digitação, padrões de rolagem
    
    Uma única inconsistência (como um User-Agent do Chrome com um fingerprint TLS do Firefox) pode disparar um bloqueio imediato.

## Escopo e Metodologia do Módulo

Técnicas de fingerprinting estão documentadas em múltiplas fontes com níveis variados de acessibilidade e confiabilidade:

- Artigos acadêmicos (frequentemente com acesso pago e teóricos)
- Código-fonte de navegadores (milhões de linhas para analisar)
- Blogs de pesquisadores de segurança (técnicos, mas fragmentados)
- Whitepapers de fornecedores anti-bot (focados em marketing, detalhes omitidos)
- Fóruns underground (práticos, mas não confiáveis)

Este módulo centraliza, valida e organiza esse conhecimento em um guia técnico coeso. Cada técnica descrita aqui foi:

- **Verificada** contra código-fonte de navegadores e RFCs
- **Testada** em cenários reais de automação
- **Citada** com referências de autoridade
- **Explicada** desde os primeiros princípios até a implementação

## Estrutura do Módulo

Este módulo é organizado em quatro seções progressivas, desde fundamentos de rede até técnicas práticas de evasão:

### 1. Fingerprinting em Nível de Rede
**[Network Fingerprinting (Fingerprinting de Rede)](./network-fingerprinting.md)**

Cobre a identificação de dispositivos através do comportamento de rede nas camadas de transporte e sessão, antes que a renderização do navegador comece.

- **Fingerprinting de TCP/IP**: TTL, tamanho da janela, ordenação de opções
- **Fingerprinting de TLS**: JA3/JA4, suítes de cifras, negociação ALPN
- **Fingerprinting de HTTP/2**: Frames SETTINGS, padrões de prioridade
- **Ferramentas e técnicas**: p0f, Nmap, Scapy, análise tshark

**Significância técnica**: Fingerprints de rede são os mais desafiadores de falsificar (spoof) porque exigem modificações em nível de SO. Inconsistências nesta camada são detectadas antes que a execução de JavaScript comece.

### 2. Fingerprinting em Nível de Navegador
**[Browser Fingerprinting (Fingerprinting de Navegador)](./browser-fingerprinting.md)**

Examina a identificação do navegador através de APIs JavaScript, motores de renderização e ecossistemas de plugins na camada de aplicação.

- **Fingerprinting de Canvas e WebGL**: Artefatos de renderização específicos da GPU
- **Fingerprinting de Áudio**: Diferenças sutis na saída da API de áudio
- **Enumeração de Fontes**: Fontes instaladas revelam SO e localidade
- **Propriedades JavaScript**: Objeto Navigator, dimensões da tela, fuso horário
- **Análise de Cabeçalhos**: Consistência de Accept-Language, User-Agent

**Significância técnica**: Esta camada é responsável pela maioria dos eventos de detecção. Mesmo com fingerprints de nível de rede corretos, propriedades de automação expostas (ex: `navigator.webdriver`) podem disparar o bloqueio.

### 3. Fingerprinting Comportamental
**[Behavioral Fingerprinting (Fingerprinting Comportamental)](./behavioral-fingerprinting.md)**

Analisa padrões de interação do usuário para distinguir comportamento humano de sistemas automatizados.

- **Análise de movimento do mouse**: Curvatura da trajetória, perfis de velocidade, conformidade com a Lei de Fitts
- **Dinâmica de teclado**: Ritmo de digitação, tempo de permanência (dwell time), tempo de voo (flight time), padrões de bigramas
- **Padrões de rolagem**: Momentum, inércia, curvas de desaceleração
- **Sequências de eventos**: Ordem natural de interação (mousemove → click), análise de tempo
- **Machine learning**: Modelos de ML treinados em bilhões de sinais comportamentais

**Significância técnica**: A análise comportamental pode detectar automação mesmo quando os fingerprints de rede e navegador estão corretamente falsificados. Esta camada é particularmente desafiadora porque requer a replicação de padrões de comportamento biomecânico humano.

### 4. Técnicas de Evasão
**[Evasion Techniques (Técnicas de Evasão)](./evasion-techniques.md)**

Implementação prática de evasão de fingerprinting usando a integração CDP do Pydoll, sobrescritas de JavaScript e recursos arquitetônicos.

- **Falsificação (Spoofing) baseada em CDP**: Fuso horário, geolocalização, métricas do dispositivo
- **Sobrescrita de propriedades JavaScript**: Redefinindo objetos navigator, envenenamento de canvas (canvas poisoning)
- **Interceptação de requisições**: Forçando consistência de cabeçalhos
- **Imitação comportamental**: Tempo semelhante ao humano, injeção de entropia
- **Testes de detecção**: Ferramentas para validar sua configuração de evasão

**Significância técnica**: Esta seção demonstra a aplicação prática de conceitos de fingerprinting em cenários reais de automação, integrando técnicas de todas as camadas anteriores.

## Quem Deve Ler Isto

### **Você DEVE ler isto se você está:**
- Construindo automação que interage com sites protegidos por anti-bots
- Desenvolvendo infraestrutura de scraping em escala
- Implementando automação de navegador que preserva a privacidade
- Pesquisando detecção de bots para fins ofensivos ou defensivos

### **Isto é material avançado se você:**
- É novo em protocolos de rede (comece com [Fundamentos de Rede](../network/network-fundamentals.md))
- Não está familiarizado com CDP (leia [Chrome DevTools Protocol](../fundamentals/cdp.md) primeiro)
- Está apenas aprendendo tipagem em Python (veja [Sistema de Tipos](../fundamentals/typing-system.md))

### **Isto NÃO é:**
- Uma "bala de prata" como solução anti-detecção (tal coisa não existe)
- Aconselhamento jurídico sobre web scraping (consulte [Legal e Ético](../network/proxy-legal.md))
- Um substituto para respeitar o robots.txt e limites de taxa (rate limits)

## A Filosofia Técnica

A defesa contra fingerprinting **não é sobre se tornar invisível** — é sobre se tornar **indistinguível do tráfego legítimo**. Isso significa:

1.  **Consistência acima da perfeição**: Um fingerprint de Firefox perfeitamente configurado é melhor que um fingerprint "perfeito" mas inconsistente do Chrome
2.  **Abordagem holística**: Você deve alinhar as camadas de rede, navegador e comportamental
3.  **Adaptação contínua**: Técnicas de fingerprinting evoluem mensalmente; este é um documento vivo

!!! tip "A Regra de Ouro"
    **Cada camada deve contar a mesma história.** Se seu fingerprint TLS diz "Chrome 120", suas configurações HTTP/2 devem corresponder ao Chrome 120, seu User-Agent deve dizer Chrome 120, e sua renderização de canvas deve produzir artefatos do Chrome 120. Um desencontro = detecção.

## Considerações Éticas

O conhecimento sobre fingerprinting é **tecnologia de uso dual**:

- **Defensivo**: Proteger sua privacidade de rastreamento invasivo
- **Ofensivo**: Evadir sistemas de detecção para automação

Confiamos que você usará este conhecimento de forma **responsável e ética**:

**Práticas recomendadas:**
- Respeitar os termos de serviço dos sites
- Implementar limitação de taxa (rate limiting) e padrões de rastreamento respeitosos
- Avaliar se a automação é necessária
- Ser transparente quando apropriado

**Usos proibidos:**
- Fraude, abuso de contas ou atividades ilegais
- Sobrecarregar servidores com scraping agressivo
- Usar este conhecimento como arma sem entender as consequências

## Pronto para Mergulhar Fundo?

Fingerprinting é um domínio complexo e técnico que requer estudo sistemático. Entender essas técnicas é essencial para automação web eficaz em ambientes com sistemas de detecção.

Comece com **[Network Fingerprinting (Fingerprinting de Rede)](./network-fingerprinting.md)** para estabelecer conhecimento fundamental, continue com **[Browser Fingerprinting (Fingerprinting de Navegador)](./browser-fingerprinting.md)** para entendimento da camada de aplicação, siga para **[Behavioral Fingerprinting (Fingerprinting Comportamental)](./behavioral-fingerprinting.md)** para a análise de padrões de interação, e conclua com **[Evasion Techniques (Técnicas de Evasão)](./evasion-techniques.md)** para implementação prática.

---

!!! info "Status da Documentação"
    Este módulo representa **pesquisa extensiva** combinando artigos acadêmicos, código-fonte de navegadores, testes do mundo real e conhecimento da comunidade. Cada alegação é citada e validada. Se você encontrar imprecisões ou tiver atualizações, contribuições são bem-vindas.

## Leitura Adicional

Antes de mergulhar, considere estes tópicos complementares:

- **[Arquitetura de Proxy](../network/http-proxies.md)**: Fundamentos de anonimato em nível de rede
- **[Preferências do Navegador](../../features/configuration/browser-preferences.md)**: Configuração prática de fingerprint
- **[Contorno de Captcha Comportamental](../../features/advanced/behavioral-captcha-bypass.md)**: Análise e evasão comportamental

================================================
FILE: docs/pt/deep-dive/fingerprinting/network-fingerprinting.md
================================================
# Network Fingerprinting

O network fingerprinting identifica clientes analisando características da pilha TCP/IP, handshake TLS e conexão HTTP/2. Esses sinais são definidos pelo kernel do sistema operacional e pela biblioteca TLS, não pelo ambiente JavaScript do navegador, o que os torna mais difíceis de falsificar que fingerprints de nível de navegador. Um proxy ou VPN muda seu endereço IP mas não altera seu tamanho de janela TCP, sua lista de cipher suites TLS ou seu frame HTTP/2 SETTINGS. Sistemas de detecção exploram essa lacuna.

!!! info "Navegação do Módulo"
    - [Browser Fingerprinting](./browser-fingerprinting.md): Canvas, WebGL, AudioContext
    - [Técnicas de Evasão](./evasion-techniques.md): Contramedidas multi-camada

    Para fundamentos de protocolo, veja [Fundamentos de Rede](../network/network-fundamentals.md). Para contexto de detecção de proxy, veja [Detecção de Proxy](../network/proxy-detection.md).

## TCP/IP Fingerprinting

Cada sistema operacional implementa a pilha TCP/IP de forma diferente. O pacote SYN que inicia uma conexão TCP carrega informação suficiente para identificar o SO com alta confiança: o TTL inicial, o tamanho da janela TCP, o Maximum Segment Size e a ordem e seleção de opções TCP. Nenhum desses valores é controlado pelo navegador. Eles vêm do kernel.

### TTL (Time To Live)

O TTL inicial é um dos identificadores de SO mais simples. Linux e macOS definem como 64, Windows define como 128, e dispositivos de rede (roteadores, firewalls) tipicamente usam 255. Cada salto de roteador decrementa o TTL em um, então um pacote chegando com TTL 118 provavelmente começou em 128 (Windows) e cruzou 10 saltos.

O valor de fingerprinting do TTL vem da referência cruzada com o User-Agent. Se o navegador alega ser Chrome no Windows mas o pacote chega com TTL próximo de 64, ou a conexão está passando por um proxy em um servidor Linux, ou o User-Agent está falsificado. Sistemas de detecção arredondam o TTL observado para cima até o valor inicial conhecido mais próximo (64, 128, 255) e comparam contra o SO declarado.

Quando o tráfego flui através de um proxy, o TTL reinicia porque o kernel do proxy gera uma nova conexão TCP para o destino. O destino vê o TTL do proxy, não o seu. É por isso que incompatibilidades de TTL são um sinal de detecção de proxy: o User-Agent diz Windows (TTL 128) mas o fingerprint TCP mostra Linux (TTL 64).

### Tamanho da Janela TCP e Escalonamento

O tamanho inicial da janela TCP no pacote SYN varia por SO e versão do kernel. Kernels Linux modernos (3.x e posteriores) tipicamente enviam uma janela inicial de 29200 bytes, que é `20 * MSS` onde MSS é 1460 para Ethernet padrão. Alguns kernels mais novos (5.x, 6.x) podem usar 64240 dependendo da configuração e ajustes de `initcwnd`. Windows 10 e 11 tipicamente enviam 65535 com escalonamento de janela habilitado, embora o valor exato dependa da configuração de auto-tuning e nível de patch. macOS também usa 65535 como padrão.

O fator de escala de janela (uma opção TCP) multiplica o campo de tamanho de janela de 16 bits para suportar janelas de recebimento maiores. Linux comumente usa fator de escala 7 (permitindo janelas de até 8MB), enquanto Windows frequentemente usa 8. Combinado com o tamanho base da janela, o fator de escala cria um fingerprint mais granular do que qualquer valor isolado.

### Ordem de Opções TCP

A seleção e ordenação de opções TCP no pacote SYN é altamente distintiva. Cada SO organiza as opções em uma ordem fixa e específica por versão que o kernel não expõe como parâmetro configurável. Linux envia `MSS, SACK_PERM, TIMESTAMP, NOP, WSCALE`. Windows envia `MSS, NOP, WSCALE, NOP, NOP, SACK_PERM` e notavelmente omite a opção TIMESTAMP nas configurações padrão. macOS envia `MSS, NOP, WSCALE, NOP, NOP, TIMESTAMP, SACK_PERM`.

A presença ou ausência de opções específicas importa tanto quanto a ordem. Windows historicamente omitiu timestamps TCP, que Linux e macOS incluem por padrão. SACK (Selective Acknowledgment) é suportado por todos os sistemas modernos, mas sistemas mais antigos ou embarcados podem não anunciá-lo. A combinação de quais opções aparecem e em que ordem cria uma assinatura que ferramentas como p0f comparam contra um banco de dados de fingerprints de SO conhecidos.

### p0f

[p0f](https://lcamtuf.coredump.cx/p0f3/) é a ferramenta padrão para fingerprinting TCP/IP passivo. Ele observa tráfego sem gerar nenhum pacote, analisando pacotes SYN e SYN+ACK contra um banco de dados de assinaturas. Seu formato de assinatura codifica os campos chave de fingerprinting:

```
version:ittl:olen:mss:wsize,scale:olayout:quirks:pclass
```

O `ittl` é o TTL inicial inferido, `mss` é o Maximum Segment Size, `wsize,scale` é o tamanho da janela (que pode ser absoluto, ou relativo ao MSS como `mss*20`), e `olayout` é o layout de opções TCP usando nomes abreviados (`mss`, `nop`, `ws`, `sok`, `sack`, `ts`, `eol+N`). O campo `quirks` captura comportamentos incomuns como a flag Don't Fragment (`df`) ou IP ID não-zero em pacotes DF (`id+`).

Uma assinatura típica de Linux 4.x+ no p0f se parece com `4:64:0:*:mss*20,7:mss,sok,ts,nop,ws:df,id+:0`. Uma assinatura de Windows 10 pode parecer `4:128:0:*:65535,8:mss,nop,ws,nop,nop,sok:df,id+:0`. Serviços anti-bot mantêm bancos de dados similares internamente, comparando conexões de entrada contra perfis de SO conhecidos e sinalizando incompatibilidades com o User-Agent declarado.

## TLS Fingerprinting

A mensagem TLS ClientHello é transmitida antes da criptografia ser estabelecida, então é visível para qualquer observador no caminho de rede. Ela contém a versão TLS, cipher suites suportadas, extensões TLS, curvas elípticas suportadas (named groups) e formatos de ponto EC. Cada navegador e biblioteca TLS produz uma combinação característica desses campos.

### JA3

JA3, desenvolvido na Salesforce por John Althouse, Jeff Atkinson e Josh Atkins, foi o primeiro método de fingerprinting TLS amplamente adotado. Ele concatena cinco campos do ClientHello (versão TLS, cipher suites, extensões, curvas elípticas, formatos de ponto EC), junta valores dentro de cada campo com hífens, separa os cinco campos com vírgulas e tira o hash MD5 da string resultante.

```
String JA3: 771,4865-4866-4867-49195-49199-49196-49200-52393-52392,0-23-65281-10-11-35-16-5-13-18-51-45-43-27-17513,29-23-24,0
Hash JA3:   cd08e31494b9531f560d64c695473da9
```

Uma sutileza: o campo "versão TLS" no JA3 usa `ClientHello.legacy_version`, não a extensão `supported_versions`. Como TLS 1.3 (RFC 8446) requer que clientes definam `legacy_version` como `0x0303` (TLS 1.2) para compatibilidade retroativa, o campo de versão JA3 é quase sempre `771` para clientes modernos, mesmo quando suportam TLS 1.3. A negociação real de TLS 1.3 acontece através da extensão 43 (`supported_versions`), mas o JA3 usa o campo do cabeçalho.

O JA3 deve filtrar valores GREASE antes do hashing. GREASE (RFC 8701) é um mecanismo onde navegadores inserem valores reservados selecionados aleatoriamente em cipher suites, extensões e outros campos para prevenir ossificação de protocolo. Os valores GREASE válidos são `0x0a0a`, `0x1a1a`, `0x2a2a` e assim por diante até `0xfafa`. Cada valor tem dois bytes idênticos onde o nibble inferior de cada byte é `0x0a`. Um filtro GREASE correto verifica ambas as condições:

```python
def is_grease(value: int) -> bool:
    return (value & 0x0f0f) == 0x0a0a and (value >> 8) == (value & 0xff)
```

!!! warning "Limitações do JA3 com Navegadores Modernos"
    Desde o Chrome 110 (janeiro 2023) e Firefox 114, navegadores randomizam a ordem das extensões TLS em cada conexão. Isso significa que o mesmo navegador produz hashes JA3 diferentes em cada conexão, tornando o JA3 efetivamente inútil para identificar navegadores modernos. O JA3 permanece útil para fingerprinting de clientes não-navegador (Python `requests`, `curl`, bots personalizados) que não implementam randomização de extensões.

### JA4

JA4 é o sucessor do JA3, desenvolvido pelo mesmo autor principal (John Althouse) na FoxIO. Foi projetado especificamente para sobreviver à randomização de extensões TLS ordenando extensões e cipher suites antes do hashing. O formato consiste em três seções separadas por underscores: `a_b_c`.

A seção `a` é uma string legível de metadados: o protocolo (`t` para TCP, `q` para QUIC), a versão TLS (`12` ou `13`), se SNI está presente (`d` para domínio, `i` para IP), o número de cipher suites (dois dígitos), o número de extensões (dois dígitos) e o primeiro e o último caractere do primeiro valor ALPN (`h2` para HTTP/2, `00` se nenhum). Por exemplo, `t13d1516h2` significa TCP, TLS 1.3, com SNI, 15 cipher suites, 16 extensões e ALPN HTTP/2.

Seção `b` é um hash SHA-256 truncado das cipher suites ordenadas. Seção `c` é um hash SHA-256 truncado das extensões ordenadas concatenadas com os algoritmos de assinatura. Como ambas as listas são ordenadas antes do hashing, a randomização de extensões não afeta a saída.

Cloudflare, AWS e outras plataformas principais adotaram o JA4. A suíte completa JA4+ também inclui JA4S (fingerprinting de servidor), JA4H (fingerprinting de cliente HTTP), JA4X (fingerprinting de certificado X.509) e JA4SSH (fingerprinting SSH). A especificação e ferramentas estão disponíveis em [github.com/FoxIO-LLC/ja4](https://github.com/FoxIO-LLC/ja4).

### JA3S (Fingerprinting de Servidor)

JA3S aplica o mesmo conceito à mensagem ServerHello, mas o formato é mais simples porque o servidor seleciona uma única cipher suite em vez de oferecer uma lista. A string JA3S é `version,cipher,extensions` e seu hash MD5 identifica a implementação TLS do servidor. Parear JA3 (ou JA4) com JA3S cria um fingerprint bidirecional: um cliente específico conversando com um servidor específico produz um par JA3+JA3S previsível, que é mais distintivo do que qualquer fingerprint isolado.

### Como Proxies Interagem com Fingerprints TLS

O tipo de proxy determina se o fingerprint TLS é preservado. Proxies SOCKS5 e túneis HTTP CONNECT retransmitem o stream TCP sem encerrar o TLS, então o servidor destino vê o fingerprint TLS original do cliente inalterado. Esta é a principal vantagem desses tipos de proxy para consistência de fingerprint.

Proxies MITM (que encerram o TLS e reestabelecem uma nova conexão para o destino) substituem o fingerprint TLS do cliente pelo seu próprio. O destino vê as cipher suites e extensões do software proxy, não as do navegador. Se o proxy usa uma biblioteca TLS padrão como OpenSSL ou BoringSSL com configurações padrão, o fingerprint não corresponderá a nenhum navegador conhecido, o que é em si um sinal de detecção.

É por isso que a abordagem do Pydoll de usar `--proxy-server` (que cria um túnel CONNECT, preservando o fingerprint TLS do navegador) é preferível a configurações de proxy MITM externo para automação stealth.

## HTTP/2 Fingerprinting

Conexões HTTP/2 expõem um conjunto separado de sinais de fingerprinting distintos do TLS. O primeiro frame enviado pelo cliente é um frame SETTINGS contendo parâmetros como `HEADER_TABLE_SIZE`, `ENABLE_PUSH`, `MAX_CONCURRENT_STREAMS`, `INITIAL_WINDOW_SIZE`, `MAX_FRAME_SIZE` e `MAX_HEADER_LIST_SIZE`. Cada navegador usa valores padrão diferentes e inclui subconjuntos diferentes desses parâmetros.

Além do SETTINGS, o tamanho do frame WINDOW_UPDATE, a prioridade/peso do stream inicial e a ordem dos pseudo-cabeçalhos HTTP/2 (`:method`, `:authority`, `:scheme`, `:path`) variam entre implementações. Chrome, Firefox e Safari cada um produz uma combinação distintiva desses valores.

A Akamai publicou a pesquisa fundamental sobre fingerprinting HTTP/2 no Black Hat Europe 2017. Seu formato de fingerprint concatena os valores SETTINGS, tamanho do WINDOW_UPDATE, frames PRIORITY e ordem dos pseudo-cabeçalhos. A suíte JA4+ inclui `JA4H` para fingerprinting em nível HTTP, cobrindo ordem e valores de cabeçalhos.

O fingerprinting HTTP/2 é particularmente eficaz contra ferramentas de automação porque muitos frameworks de bot e bibliotecas HTTP implementam suas próprias pilhas HTTP/2 com parâmetros padrão que não correspondem a nenhum navegador real. Mesmo quando uma ferramenta falsifica corretamente o fingerprint TLS (usando curl-impersonate ou similar), seu frame HTTP/2 SETTINGS pode traí-la.

Você pode verificar seu fingerprint HTTP/2 em [browserleaks.com/http2](https://browserleaks.com/http2). Como o Pydoll controla uma instância real do Chrome via CDP, o fingerprint HTTP/2 é sempre autêntico, o que é uma vantagem inerente sobre ferramentas que constroem requisições HTTP programaticamente.

## Implicações para Automação de Navegador

A conclusão prática para automação com o Pydoll é que o network fingerprinting é uma área onde controlar um navegador real fornece uma vantagem significativa. A pilha TCP/IP do Chrome, implementação TLS (BoringSSL) e pilha HTTP/2 produzem fingerprints autênticos por padrão. O principal risco é incompatibilidade ambiental: executar o Chrome em um servidor Linux enquanto o User-Agent alega Windows cria uma inconsistência de fingerprint TCP/IP (TTL 64 ao invés de 128, ordem de opções TCP do Linux ao invés do Windows).

Para configurações baseadas em proxy, o fluxo de fingerprint é: a pilha TCP/IP da sua máquina gera a conexão para o proxy (que o operador do proxy pode ver mas o destino não), e a pilha TCP/IP do proxy gera a conexão para o destino. O destino vê o TTL e opções TCP do servidor proxy. Se o proxy roda Linux (como a maioria faz), o fingerprint TCP indicará Linux independentemente do User-Agent. Este é um sinal de detecção bem conhecido que proxies residenciais mitigam parcialmente (o endpoint do proxy é a máquina de um usuário real, então seu fingerprint TCP é plausível) mas proxies de datacenter não podem.

Os fingerprints TLS e HTTP/2, por outro lado, passam por túneis SOCKS5 e CONNECT sem modificação. Estes são os fingerprints do navegador, não do proxy. Então com o Pydoll através de um túnel CONNECT, o destino vê fingerprints TLS e HTTP/2 autênticos do Chrome pareados com o fingerprint TCP/IP do proxy. Esta combinação é consistente com um usuário real navegando através de uma VPN ou proxy corporativo, que é um padrão comum e legítimo.

## Referências

- Salesforce Engineering: TLS Fingerprinting with JA3 and JA3S - https://engineering.salesforce.com/tls-fingerprinting-with-ja3-and-ja3s-247362855967/
- FoxIO JA4+ Network Fingerprinting - https://github.com/FoxIO-LLC/ja4
- Cloudflare: JA4 Signals - https://blog.cloudflare.com/ja4-signals/
- Akamai: Passive Fingerprinting of HTTP/2 Clients (Black Hat EU 2017) - https://blackhat.com/docs/eu-17/materials/eu-17-Shuster-Passive-Fingerprinting-Of-HTTP2-Clients-wp.pdf
- p0f v3: Passive OS Fingerprinting - https://lcamtuf.coredump.cx/p0f3/
- RFC 8446: TLS 1.3 - https://datatracker.ietf.org/doc/html/rfc8446
- RFC 8701: GREASE for TLS - https://datatracker.ietf.org/doc/html/rfc8701
- RFC 6528: Defending against Sequence Number Attacks - https://datatracker.ietf.org/doc/html/rfc6528
- BrowserLeaks HTTP/2 Fingerprint - https://browserleaks.com/http2
- Stamus Networks: JA3 Fingerprints Fade as Browsers Embrace Extension Randomization - https://www.stamus-networks.com/blog/ja3-fingerprints-fade-browsers-embrace-tls-extension-randomization


================================================
FILE: docs/pt/deep-dive/fundamentals/cdp.md
================================================
# Chrome DevTools Protocol (CDP)

O Chrome DevTools Protocol (CDP) é a fundação que permite ao Pydoll controlar navegadores sem os webdrivers tradicionais. Entender como o CDP funciona fornece insights valiosos sobre as capacidades e a arquitetura interna do Pydoll.


## O que é o CDP?

O Chrome DevTools Protocol é uma interface poderosa desenvolvida pela equipe do Chromium que permite a interação programática com navegadores baseados no Chromium. É o mesmo protocolo usado pelo Chrome DevTools quando você inspeciona uma página web, mas exposto como uma API programável que pode ser aproveitada por ferramentas de automação.

Em sua essência, o CDP fornece um conjunto abrangente de métodos e eventos para interagir com os componentes internos do navegador. Isso permite um controle refinado sobre todos os aspectos do navegador, desde navegar entre páginas até manipular o DOM, interceptar requisições de rede e monitorar métricas de desempenho.

!!! info "Evolução do CDP"
    O Chrome DevTools Protocol tem evoluído continuamente desde sua introdução. O Google mantém e atualiza o protocolo a cada lançamento do Chrome, adicionando regularmente novas funcionalidades e melhorando recursos existentes.
    
    Embora o protocolo tenha sido inicialmente projetado para o DevTools do Chrome, suas capacidades abrangentes o tornaram a fundação para ferramentas de automação de navegador de próxima geração como Puppeteer, Playwright e, claro, o Pydoll.

## Comunicação via WebSocket

Uma das principais decisões arquitetônicas no CDP é o uso de WebSockets para comunicação. Quando um navegador baseado no Chromium é iniciado com a flag de depuração remota habilitada, ele abre um servidor WebSocket em uma porta especificada:

```
chrome --remote-debugging-port=9222
```

O Pydoll se conecta a este endpoint WebSocket para estabelecer um canal de comunicação bidirecional com o navegador. Esta conexão:

1.  **Permanece persistente** durante toda a sessão de automação
2.  **Habilita eventos em tempo real**, permitindo que o navegador os envie (push) ao cliente
3.  **Permite que comandos** sejam enviados ao navegador
4.  **Suporta dados binários** para transferência eficiente de capturas de tela, PDFs e outros ativos

O protocolo WebSocket é particularmente adequado para automação de navegador porque fornece:

- **Comunicação de baixa latência** - Necessária para automação responsiva
- **Mensagens bidirecionais** - Essencial para arquitetura orientada a eventos
- **Conexões persistentes** - Eliminando a sobrecarga de configuração de conexão para cada operação

Aqui está uma visão simplificada de como funciona a comunicação do Pydoll com o navegador:

```mermaid
sequenceDiagram
    participant App as Aplicação Pydoll
    participant WS as Conexão WebSocket
    participant Browser as Navegador Chrome

    App ->> WS: Comando: navegar para URL
    WS ->> Browser: Executar navegação

    Browser -->> WS: Enviar evento de carregamento de página
    WS -->> App: Receber evento de carregamento de página
```

!!! info "WebSocket vs HTTP"
    Protocolos de automação de navegador anteriores frequentemente dependiam de endpoints HTTP para comunicação. A mudança do CDP para WebSockets representa uma melhoria arquitetônica significativa que permite automação mais responsiva e monitoramento de eventos em tempo real.
    
    Protocolos baseados em HTTP exigem "polling" (consultas periódicas) contínuo para detectar mudanças, criando sobrecarga e atrasos. WebSockets permitem que o navegador envie notificações (push) para seu script de automação exatamente quando os eventos ocorrem, com latência mínima.

## Domínios Chave do CDP

O CDP é organizado em domínios lógicos, cada um responsável por um aspecto específico da funcionalidade do navegador. Alguns dos domínios mais importantes incluem:


| Domínio | Responsabilidade | Exemplos de Casos de Uso |
|---|---|---|
| **Browser** | Controle da própria aplicação do navegador | Gerenciamento de janelas, criação de contexto de navegador |
| **Page** | Interação com o ciclo de vida da página | Navegação, execução de JavaScript, gerenciamento de frames |
| **DOM** | Acesso à estrutura da página | Seletores de consulta, modificação de atributos, ouvintes de eventos |
| **Network** | Monitoramento e controle de tráfego de rede | Interceptação de requisições, exame de respostas, cache |
| **Runtime** | Ambiente de execução JavaScript | Avaliar expressões, chamar funções, lidar com exceções |
| **Input** | Simulação de interações do usuário | Movimentos do mouse, entrada de teclado, eventos de toque |
| **Target** | Gerenciamento de contextos e alvos do navegador | Criar abas, acessar iframes, lidar com popups |
| **Fetch** | Interceptação de rede de baixo nível | Modificar requisições, simular respostas, autenticação |

O Pydoll mapeia esses domínios CDP para uma estrutura de API mais intuitiva, preservando ao mesmo tempo todas as capacidades do protocolo subjacente.

## Arquitetura Orientada a Eventos

Uma das funcionalidades mais poderosas do CDP é seu sistema de eventos. O protocolo permite que clientes se inscrevam em vários eventos que o navegador emite durante a operação normal. Esses eventos cobrem virtualmente todos os aspectos do comportamento do navegador:

- **Eventos de ciclo de vida**: Carregamentos de página, navegação de frames, criação de alvos
- **Eventos DOM**: Mudanças de elementos, modificações de atributos
- **Eventos de rede**: Ciclos de requisição/resposta, mensagens WebSocket
- **Eventos de execução**: Exceções JavaScript, mensagens do console
- **Eventos de desempenho**: Métricas de renderização, script e mais


Quando você habilita o monitoramento de eventos no Pydoll (ex: com `page.enable_network_events()`), a biblioteca configura as inscrições necessárias com o navegador e fornece "ganchos" (hooks) para seu código reagir a esses eventos.

```python
from pydoll.events.network import NetworkEvents
from functools import partial

async def on_request(page, event):
    url = event['params']['request']['url']
    print(f"Requisição para: {url}")

# Inscrever-se em eventos de requisição de rede
await page.enable_network_events()
await page.on(NetworkEvents.REQUEST_WILL_BE_SENT, partial(on_request, page))
```

Essa abordagem orientada a eventos permite que scripts de automação reajam imediatamente a mudanças de estado do navegador, sem depender de polling ineficiente ou atrasos arbitrários.

## Vantagens de Desempenho da Integração Direta com CDP

Usar o CDP diretamente, como o Pydoll faz, oferece várias vantagens de desempenho em relação à automação tradicional baseada em webdriver:

### 1. Eliminação da Camada de Tradução de Protocolo

Ferramentas tradicionais baseadas em webdriver, como o Selenium, usam uma abordagem multicamada:

```mermaid
graph LR
    AS[Script de Automação] --> WC[Cliente WebDriver]
    WC --> WS[Servidor WebDriver]
    WS --> B[Navegador]
```

Cada camada adiciona sobrecarga, especialmente o servidor WebDriver, que atua como uma camada de tradução entre o protocolo WebDriver e as APIs nativas do navegador.

A abordagem do Pydoll simplifica isso para:

```mermaid
graph LR
    AS[Script de Automação] --> P[Pydoll]
    P --> B[Navegador via CDP]
```

Essa comunicação direta elimina a sobrecarga computacional e de rede do servidor intermediário, resultando em operações mais rápidas.

### 2. Agrupamento Eficiente de Comandos (Batching)

O CDP permite o agrupamento de múltiplos comandos em uma única mensagem, reduzindo o número de viagens de ida e volta (round trips) necessárias para operações complexas. Isso é particularmente valioso para operações que exigem várias etapas, como encontrar um elemento e depois interagir com ele.

### 3. Operação Assíncrona

A arquitetura orientada a eventos e baseada em WebSocket do CDP alinha-se perfeitamente com o framework asyncio do Python, permitindo uma verdadeira operação assíncrona. Isso permite ao Pydoll:

- Executar múltiplas operações concorrentemente
- Processar eventos à medida que ocorrem
- Evitar o bloqueio da thread principal durante operações de I/O

```mermaid
graph TD
    subgraph "Arquitetura Assíncrona Pydoll"
        EL[Loop de Eventos]
        
        subgraph "Tarefas Concorrentes"
            T1[Tarefa 1: Navegar]
            T2[Tarefa 2: Esperar por Elemento]
            T3[Tarefa 3: Lidar com Eventos de Rede]
        end
        
        EL --> T1
        EL --> T2
        EL --> T3
        
        T1 --> WS[Conexão WebSocket]
        T2 --> WS
        T3 --> WS
        
        WS --> B[Navegador]
    end
```

!!! info "Ganhos de Desempenho Assíncrono"
    A combinação de asyncio e CDP cria um efeito multiplicador no desempenho. Em testes de benchmark, a abordagem assíncrona do Pydoll pode processar múltiplas páginas em paralelo com escalabilidade quase linear, enquanto ferramentas síncronas tradicionais veem retornos decrescentes à medida que a concorrência aumenta.
    
    Por exemplo, raspar 10 páginas que levam 2 segundos cada para carregar pode levar mais de 20 segundos com uma ferramenta síncrona, mas pouco mais de 2 segundos com a arquitetura assíncrona do Pydoll (mais uma sobrecarga mínima).

### 4. Controle Refinado (Fine-Grained)

O CDP fornece controle mais granular sobre o comportamento do navegador do que o protocolo WebDriver. Isso permite ao Pydoll implementar estratégias otimizadas para operações comuns:

- Condições de espera mais precisas (vs. timeouts arbitrários)
- Acesso direto a caches e armazenamento do navegador
- Execução direcionada de JavaScript em contextos específicos
- Controle detalhado da rede para otimização de requisições


## Conclusão

O Chrome DevTools Protocol forma a base da abordagem "zero-webdriver" do Pydoll para automação de navegador. Ao alavancar a comunicação WebSocket do CDP, a cobertura abrangente de domínios, a arquitetura orientada a eventos e a integração direta com o navegador, o Pydoll alcança desempenho e confiabilidade superiores em comparação com as ferramentas de automação tradicionais.

Nas seções seguintes, mergulharemos mais fundo em como o Pydoll implementa domínios CDP específicos e transforma o protocolo de baixo nível em uma API intuitiva e amigável ao desenvolvedor.


================================================
FILE: docs/pt/deep-dive/fundamentals/connection-layer.md
================================================
# Connection Handler (Gerenciador de Conexão)

O Connection Handler é a camada fundamental da arquitetura do Pydoll, servindo como a ponte entre seu código Python e o Chrome DevTools Protocol (CDP) do navegador. Este componente gerencia a conexão WebSocket com o navegador, lida com a execução de comandos e processa eventos de maneira assíncrona e não bloqueante.

```mermaid
graph TD
    A[Código Python] --> B[Connection Handler]
    B <--> C[WebSocket]
    C <--> D[Endpoint CDP do Navegador]

    subgraph "Connection Handler"
        E[Gerenciador de Comandos]
        F[Gerenciador de Eventos]
        G[Cliente WebSocket]
    end

    B --> E
    B --> F
    B --> G
```

## Modelo de Programação Assíncrona

O Pydoll é construído sobre o framework `asyncio` do Python, que permite operações de I/O (Entrada/Saída) não bloqueantes. Essa escolha de design é crítica para a automação de navegador de alto desempenho, pois permite que múltiplas operações ocorram concorrentemente sem esperar que cada uma seja concluída.

### Entendendo Async/Await


Para entender como async/await funciona na prática, vamos examinar um exemplo mais detalhado com duas operações concorrentes:

```python
import asyncio
from pydoll.browser.chrome import Chrome

async def fetch_page_data(url):
    print(f"Iniciando busca por {url}")
    browser = Chrome()
    await browser.start()
    page = await browser.get_page()
    
    # Navegação leva tempo - é aqui que cedemos o controle
    await page.go_to(url)
    
    # Obter título da página
    title = await page.execute_script("return document.title")
    
    # Extrair alguns dados
    description = await page.execute_script(
        "return document.querySelector('meta[name=\"description\"]')?.content || ''"
    )
    
    await browser.stop()
    print(f"Busca por {url} concluída")
    return {"url": url, "title": title, "description": description}

async def main():
    # Iniciar duas operações de página concorrentemente
    task1 = asyncio.create_task(fetch_page_data("https://example.com"))
    task2 = asyncio.create_task(fetch_page_data("https://github.com"))
    
    # Esperar que ambas terminem e obter resultados
    result1 = await task1
    result2 = await task2
    
    return [result1, result2]

# Rodar a função assíncrona
results = asyncio.run(main())
```

Este exemplo demonstra como podemos buscar dados de dois sites diferentes concorrentemente, potencialmente cortando o tempo total de execução quase pela metade em comparação com a execução sequencial.

#### Diagrama de Fluxo de Execução Assíncrona

Aqui está o que acontece no loop de eventos ao executar o código acima:

```mermaid
sequenceDiagram
    participant A as Código Principal
    participant B as Tarefa 1<br/> (example.com)
    participant C as Tarefa 2<br/> (github.com)
    participant D as Loop de Eventos
    
    A->>B: Criar tarefa1
    B->>D: Registrar no loop
    A->>C: Criar tarefa2
    C->>D: Registrar no loop
    D->>B: Executar até browser.start()
    D->>C: Executar até browser.start()
    D-->>B: Retomar após WebSocket conectado
    D-->>C: Retomar após WebSocket conectado
    D->>B: Executar até page.go_to()
    D->>C: Executar até page.go_to()
    D-->>B: Retomar após página carregada
    D-->>C: Retomar após página carregada
    B-->>A: Retornar resultado
    C-->>A: Retornar resultado
```

Este diagrama de sequência ilustra como o asyncio do Python gerencia as duas tarefas concorrentes em nosso código de exemplo:

1.  A função principal cria duas tarefas para buscar dados de sites diferentes
2.  Ambas as tarefas são registradas no loop de eventos
3.  O loop de eventos executa cada tarefa até encontrar uma expressão `await` (como em `browser.start()`)
4.  Quando as operações assíncronas terminam (como uma conexão WebSocket sendo estabelecida), as tarefas retomam
5.  O loop continua a alternar entre as tarefas em cada ponto `await`
6.  Quando cada tarefa termina, ela retorna seu resultado para a função principal

No exemplo `fetch_page_data`, isso permite que ambas as instâncias do navegador trabalhem concorrentemente - enquanto uma está esperando uma página carregar, a outra pode estar progredindo. Isso é significativamente mais eficiente do que processar sequencialmente cada site, já que os tempos de espera de I/O não bloqueiam a execução de outras tarefas.

!!! info "Multitarefa Cooperativa"
    O asyncio usa multitarefa cooperativa, onde as tarefas voluntariamente cedem o controle nos pontos `await`. Isso difere da multitarefa preemptiva (threads), onde as tarefas podem ser interrompidas a qualquer momento. A multitarefa cooperativa pode fornecer melhor desempenho para operações ligadas a I/O, mas requer codificação cuidadosa para evitar bloquear o loop de eventos.

## Implementação do Connection Handler

A classe `ConnectionHandler` é projetada para gerenciar tanto a execução de comandos quanto o processamento de eventos, fornecendo uma interface robusta para a conexão WebSocket do CDP.

### Inicialização da Classe

```python
def __init__(
    self,
    connection_port: int,
    page_id: str = 'browser',
    ws_address_resolver: Callable[[int], str] = get_browser_ws_address,
    ws_connector: Callable = websockets.connect,
):
    # Inicializar componentes...
```

O ConnectionHandler aceita vários parâmetros:

| Parâmetro | Tipo | Descrição |
|---|---|---|
| `connection_port` | `int` | Número da porta onde o endpoint CDP do navegador está escutando |
| `page_id` | `str` | Identificador para a página/alvo específico (use 'browser' para conexões em nível de navegador) |
| `ws_address_resolver` | `Callable` | Função para resolver a URL do WebSocket a partir do número da porta |
| `ws_connector` | `Callable` | Função para estabelecer a conexão WebSocket |

### Componentes Internos

O ConnectionHandler orquestra três componentes primários:

1.  **Conexão WebSocket**: Gerencia a comunicação WebSocket real com o navegador
2.  **Gerenciador de Comandos**: Lida com o envio de comandos e recebimento de respostas
3.  **Gerenciador de Eventos**: Processa eventos do navegador e dispara callbacks apropriados

```mermaid
classDiagram
    class ConnectionHandler {
        -_connection_port: int
        -_page_id: str
        -_ws_connection
        -_command_manager: CommandManager
        -_events_handler: EventsHandler
        +execute_command(command, timeout) async
        +register_callback(event_name, callback) async
        +remove_callback(callback_id) async
        +ping() async
        +close() async
        -_receive_events() async
    }

    class CommandManager {
        -_pending_commands: dict
        +create_command_future(command)
        +resolve_command(id, response)
        +remove_pending_command(id)
    }

    class EventsHandler {
        -_callbacks: dict
        -_network_logs: list
        -_dialog: dict
        +register_callback(event_name, callback, temporary)
        +remove_callback(callback_id)
        +clear_callbacks()
        +process_event(event) async
    }

    ConnectionHandler *-- CommandManager
    ConnectionHandler *-- EventsHandler
```

## Fluxo de Execução de Comando

Ao executar um comando através do CDP, o ConnectionHandler segue um padrão específico:

1.  Garantir que uma conexão WebSocket ativa exista
2.  Criar um objeto Future para representar a resposta pendente
3.  Enviar o comando pelo WebSocket
4.  Aguardar (await) o Future ser resolvido com a resposta
5.  Retornar a resposta ao chamador

```python
async def execute_command(self, command: dict, timeout: int = 10) -> dict:
    # Validar comando
    if not isinstance(command, dict):
        logger.error('Comando deve ser um dicionário.')
        raise exceptions.InvalidCommand('Comando deve ser um dicionário')

    # Garantir que a conexão está ativa
    await self._ensure_active_connection()
    
    # Criar future para este comando
    future = self._command_manager.create_command_future(command)
    command_str = json.dumps(command)

    # Enviar comando e aguardar resposta
    try:
        await self._ws_connection.send(command_str)
        response: str = await asyncio.wait_for(future, timeout)
        return json.loads(response)
    except asyncio.TimeoutError as exc:
        self._command_manager.remove_pending_command(command['id'])
        raise exc
    except websockets.ConnectionClosed as exc:
        await self._handle_connection_loss()
        raise exc
```

!!! warning "Timeout de Comando"
    Comandos que não recebem uma resposta dentro do período de timeout especificado lançarão um `TimeoutError`. Isso impede que scripts de automação fiquem travados indefinidamente devido a respostas ausentes. O timeout padrão é de 10 segundos, mas pode ser ajustado com base nos tempos de resposta esperados para operações complexas.

## Sistema de Processamento de Eventos

O sistema de eventos é um componente arquitetônico chave que permite padrões de programação reativa no Pydoll. Ele permite que você registre callbacks para eventos específicos do navegador e os execute automaticamente quando esses eventos ocorrem.

### Fluxo de Eventos

O fluxo de processamento de eventos segue estas etapas:

1.  O método `_receive_events` roda como uma tarefa em segundo plano, recebendo continuamente mensagens do WebSocket
2.  Cada mensagem é analisada e classificada como uma resposta de comando ou um evento
3.  Eventos são passados para o EventsHandler para processamento
4.  O EventsHandler identifica callbacks registrados para o evento e os invoca

```mermaid
flowchart TD
    A[Mensagem WebSocket] --> B{É Resposta de Comando?}
    B -->|Sim| C[Resolver Future do Comando]
    B -->|Não| D[Processar como Evento]
    D --> E[Encontrar Callbacks Correspondentes]
    E --> F[Executar Callbacks]
    F --> G{É Temporário?}
    G -->|Sim| H[Remover Callback]
    G -->|Não| I[Manter Callback]
```

### Registro de Callback

O ConnectionHandler fornece métodos para registrar, remover e gerenciar callbacks de eventos:

```python
# Registrar um callback para um evento específico
callback_id = await connection.register_callback(
    'Page.loadEventFired', 
    handle_page_load
)

# Remover um callback específico
await connection.remove_callback(callback_id)

# Remover todos os callbacks
await connection.clear_callbacks()
```

!!! tip "Callbacks Temporários"
    Você pode registrar um callback como temporário, o que significa que ele será automaticamente removido após ser acionado uma vez. Isso é útil para eventos únicos, como o manuseio de diálogos:
    
    ```python
    await connection.register_callback(
        'Page.javascriptDialogOpening',
        handle_dialog,
        temporary=True
    )
    ```

### Execução Assíncrona de Callback

Callbacks podem ser funções síncronas ou corrotinas assíncronas. O EventsHandler (gerenciado pelo ConnectionHandler) lida com ambos os tipos adequadamente:

```python
# Callback síncrono
def synchronous_callback(event):
    print(f"Evento recebido: {event['method']}")

# Callback assíncrono
async def asynchronous_callback(event):
    await asyncio.sleep(0.1)  # Realizar alguma operação assíncrona
    print(f"Evento processado assincronamente: {event['method']}")

# Ambos podem ser registrados da mesma forma
await connection.register_callback('Network.requestWillBeSent', synchronous_callback)
await connection.register_callback('Network.responseReceived', asynchronous_callback)
```

**Modelo de Execução Sequencial:**

Callbacks assíncronos são **aguardados (awaited) sequencialmente** pelo EventsManager. Isso garante que, para um único evento, os callbacks sejam executados na ordem em que foram registrados, prevenindo condições de corrida (race conditions) quando múltiplos callbacks modificam estado compartilhado.

```python
# Dentro de EventsManager.process_event()
for callback_data in callbacks:
    if asyncio.iscoroutinefunction(callback_data['callback']):
        await callback_data['callback'](event_data)  # Await sequencial
    else:
        callback_data['callback'](event_data)  # Execução síncrona
```

A **execução não bloqueante** (para callbacks de UI que não devem bloquear outras operações) é alcançada em um **nível mais alto**, como no método `Tab.on()`, que envolve o callback do usuário em um `asyncio.create_task()` antes de registrá-lo aqui. Esta arquitetura fornece:

- **Camada inferior** (ConnectionHandler/EventsManager): Garante execução sequencial e ordem previsível
- **Camada superior** (Tab.on()): Fornece semântica não bloqueante quando necessário

!!! info "Detalhes da Arquitetura de Eventos"
    Veja [Análise Profunda da Arquitetura de Eventos](../architecture/event-architecture.md) para detalhes completos sobre o sistema de eventos multicamada e a lógica por trás da execução sequencial de callbacks.

## Gerenciamento de Conexão

O ConnectionHandler implementa várias estratégias para garantir conexões robustas:

### Estabelecimento Lento de Conexão (Lazy)

Conexões são estabelecidas apenas quando necessário, tipicamente quando o primeiro comando é executado ou quando explicitamente solicitado. Esta abordagem de inicialização sob demanda (lazy) economiza recursos e permite um gerenciamento de conexão mais flexível.

### Reconexão Automática

Se a conexão WebSocket for perdida ou fechada inesperadamente, o ConnectionHandler tentará reestabelecê-la automaticamente quando o próximo comando for executado. Isso fornece resiliência contra problemas transitórios de rede.

```python
async def _ensure_active_connection(self):
    """
    Garante que uma conexão ativa exista antes de prosseguir.
    """
    if self._ws_connection is None or self._ws_connection.closed:
        await self._establish_new_connection()
```

### Limpeza de Recursos

O ConnectionHandler implementa tanto métodos de limpeza explícitos quanto o protocolo de gerenciador de contexto assíncrono do Python (`__aenter__` e `__aexit__`), garantindo que os recursos sejam devidamente liberados quando não mais necessários:

```python
async def close(self):
    """
    Fecha a conexão WebSocket e limpa todos os callbacks.
    """
    await self.clear_callbacks()
    if self._ws_connection is not None:
        try:
            await self._ws_connection.close()
        except websockets.ConnectionClosed as e:
            logger.info(f'Conexão WebSocket foi fechada: {e}')
        logger.info('Conexão WebSocket fechada.')
```

!!! info "Uso do Gerenciador de Contexto"
    Usar o ConnectionHandler como um gerenciador de contexto é o padrão recomendado para garantir a limpeza adequada dos recursos:
    
    ```python
    async with ConnectionHandler(9222, 'browser') as connection:
        # Trabalhar com a conexão...
        await connection.execute_command(...)
    # Conexão é automaticamente fechada ao sair do contexto
    ```

## Pipeline de Processamento de Mensagens

O ConnectionHandler implementa um pipeline sofisticado de processamento de mensagens que lida com o fluxo contínuo de mensagens da conexão WebSocket:

```mermaid
sequenceDiagram
    participant WS as WebSocket
    participant RCV as _receive_events
    participant MSG as _process_single_message
    participant PARSE as _parse_message
    participant CMD as _handle_command_message
    participant EVT as _handle_event_message
    
    loop Enquanto conectado
        WS->>RCV: mensagem
        RCV->>MSG: raw_message
        MSG->>PARSE: raw_message
        PARSE-->>MSG: JSON parseado ou None
        
        alt É resposta de comando
            MSG->>CMD: mensagem
            CMD->>CMD: resolve future do comando
        else É notificação de evento
            MSG->>EVT: mensagem
            EVT->>EVT: processa evento & dispara callbacks
        end
    end
```

Este pipeline garante o processamento eficiente tanto de respostas de comandos quanto de eventos assíncronos, permitindo ao Pydoll manter uma operação responsiva mesmo sob alto volume de mensagens.

## Uso Avançado

O ConnectionHandler é geralmente usado indiretamente através das classes Browser e Page, mas também pode ser usado diretamente para cenários avançados:

### Monitoramento Direto de Eventos

Para casos de uso especializados, você pode querer contornar as APIs de nível superior e monitorar diretamente eventos CDP específicos:

```python
from pydoll.connection.connection import ConnectionHandler

async def monitor_network():
    connection = ConnectionHandler(9222)
    
    async def log_request(event):
        url = event['params']['request']['url']
        print(f"Requisição: {url}")
    
    await connection.register_callback(
        'Network.requestWillBeSent', 
        log_request
    )
    
    # Habilitar eventos de rede via comando CDP
    await connection.execute_command({
        "id": 1,
        "method": "Network.enable"
    })
    
    # Manter rodando até ser interrompido
    try:
        while True:
            await asyncio.sleep(1)
    finally:
        await connection.close()
```

### Execução de Comando Personalizado

Você pode executar comandos CDP arbitrários diretamente:

```python
async def custom_cdp_command(connection, method, params=None):
    command = {
        "id": random.randint(1, 10000),
        "method": method,
        "params": params or {}
    }
    return await connection.execute_command(command)

# Exemplo: Obter HTML do documento sem usar a classe Page
async def get_html(connection):
    result = await custom_cdp_command(
        connection,
        "Runtime.evaluate",
        {"expression": "document.documentElement.outerHTML"}
    )
    return result['result']['result']['value']
```

!!! warning "Interface Avançada"
    O uso direto do ConnectionHandler requer um entendimento profundo do Chrome DevTools Protocol. Para a maioria dos casos de uso, as APIs de nível superior Browser e Page fornecem uma interface mais intuitiva e segura.


## Padrões Avançados de Concorrência

O design assíncrono do ConnectionHandler permite padrões sofisticados de concorrência:

### Execução Paralela de Comandos

Execute múltiplos comandos concorrentemente e espere por todos os resultados:

```python
async def get_page_metrics(connection):
    commands = [
        {"id": 1, "method": "Performance.getMetrics"},
        {"id": 2, "method": "Network.getResponseBody", "params": {"requestId": "..."}},
        {"id": 3, "method": "DOM.getDocument"}
    ]
    
    results = await asyncio.gather(
        *(connection.execute_command(cmd) for cmd in commands)
    )
    
    return results
```

## Conclusão

O ConnectionHandler serve como a fundação da arquitetura do Pydoll, fornecendo uma interface robusta e eficiente para o Chrome DevTools Protocol. Ao alavancar o framework asyncio do Python e a comunicação WebSocket, ele permite automação de navegador de alto desempenho com padrões de programação elegantes e orientados a eventos.

Entender o design e a operação do ConnectionHandler fornece insights valiosos sobre o funcionamento interno do Pydoll e oferece oportunidades para personalização avançada e otimização em cenários especializados.

Para a maioria dos casos de uso, você interagirá com o ConnectionHandler indiretamente através das APIs de nível superior Browser e Page, que fornecem uma interface mais intuitiva enquanto aproveitam as poderosas capacidades do ConnectionHandler.

================================================
FILE: docs/pt/deep-dive/fundamentals/iframes-and-contexts.md
================================================
# Iframes, OOPIFs e Contextos de Execução (Análise Aprofundada)

Entender como a automação de navegador lida com iframes é crucial para construir ferramentas de automação robustas. Este guia abrangente explora os fundamentos técnicos do manuseio de iframes no Pydoll, cobrindo o Document Object Model (DOM), mecânicas do Chrome DevTools Protocol (CDP), contextos de execução, mundos isolados e o sofisticado pipeline de resolução que torna a interação com iframes fluida.

!!! info "Primeiro o uso prático"
    Se você só precisa usar iframes em seus scripts de automação, comece com o guia de funcionalidades: **Funcionalidades → Automação → IFrames**.
    Esta análise aprofundada explica as decisões de arquitetura, nuances do protocolo e detalhes de implementação interna.

---

## Tabela de Conteúdos

1. [Fundação: O Modelo de Objeto de Documento (DOM)](#fundação-o-modelo-de-objeto-de-documento-dom)
2. [O que são Iframes e Por que Eles Importam](#o-que-são-iframes-e-por-que-eles-importam)
3. [O Desafio: Iframes Fora de Processo (OOPIFs)](#o-desafio-iframes-fora-de-processo-oopifs)
4. [Protocolo Chrome DevTools e Gerenciamento de Frames](#protocolo-chrome-devtools-e-gerenciamento-de-frames)
5. [Contextos de Execução e Mundos Isolados](#contextos-de-execução-e-mundos-isolados)
6. [Referência de Identificadores CDP](#referência-de-identificadores-cdp)
7. [Pipeline de Resolução do Pydoll](#pipeline-de-resolução-do-pydoll)
8. [Roteamento de Sessão e Modo "Flattened"](#roteamento-de-sessão-e-modo-flattened)
9. [Análise Aprofundada da Implementação](#análise-aprofundada-da-implementação)
10. [Considerações de Performance](#considerações-de-performance)
11. [Modos de Falha e Depuração](#modos-de-falha-e-depuração)

---

## Fundação: O Modelo de Objeto de Documento (DOM)

Antes de mergulhar nos iframes, precisamos entender o DOM — a estrutura em árvore que representa um documento HTML na memória.

### O que é o DOM?

O **Modelo de Objeto de Documento** (Document Object Model) é uma interface de programação para documentos HTML e XML. Ele representa a estrutura da página como uma árvore de nós, onde cada nó corresponde a uma parte do documento:

- **Nós de elemento**: Tags HTML como `<div>`, `<iframe>`, `<button>`
- **Nós de texto**: O conteúdo de texto real
- **Nós de atributo**: Atributos de elemento como `id`, `class`, `src`
- **Nó do documento**: A raiz da árvore

```mermaid
graph TD
    Document[Documento] --> HTML[elemento html]
    HTML --> Head[elemento head]
    HTML --> Body[elemento body]
    Body --> Div1[elemento div]
    Body --> Div2[elemento div]
    Div1 --> Text1[nó de texto: 'Olá']
    Div2 --> Iframe[elemento iframe]
    Iframe --> IframeDoc[documento do iframe]
    IframeDoc --> IframeBody[body do iframe]
    IframeBody --> IframeContent[conteúdo do iframe...]
```

### Propriedades da Árvore DOM

1. **Estrutura hierárquica**: Todo nó tem um pai (exceto o Documento) e pode ter filhos
2. **Identificação de nós**: Nós podem ser identificados por:
   - `nodeId`: Identificador interno dentro de um contexto de documento (domínio DOM)
   - `backendNodeId`: Identificador estável que pode referenciar nós através de diferentes documentos
3. **Representação viva**: Mudanças no DOM são refletidas imediatamente na árvore

### Por que Isso Importa para Iframes

Cada elemento `<iframe>` cria uma **árvore DOM nova e independente**. O próprio elemento iframe existe no DOM do pai, mas o conteúdo carregado no iframe tem seu próprio nó Documento completo e estrutura de árvore. Essa separação é a base de toda a complexidade dos iframes.

---

## O que são Iframes e Por que Eles Importam

### Definição

Um **iframe** (quadro em linha) é um elemento HTML (`<iframe>`) que incorpora outro documento HTML dentro da página atual. O documento incorporado mantém seu próprio contexto, incluindo:

- Estrutura HTML e árvore DOM independentes
- Ambiente de execução JavaScript separado
- Estilização CSS própria (a menos que explicitamente compartilhada)
- Histórico de navegação distinto

```html
<body>
  <h1>Página Pai</h1>
  <iframe src="https://example.com/embedded.html" id="content-frame"></iframe>
  <p>Mais conteúdo do pai</p>
</body>
```

### Casos de Uso Comuns

| Caso de Uso | Descrição | Exemplo |
|----------|-------------|---------|
| **Widgets de terceiros** | Incorpora conteúdo externo com segurança | Formulários de pagamento, feeds de mídia social, widgets de chat |
| **Isolamento de conteúdo** | Coloca conteúdo não confiável em sandbox | HTML gerado por usuário, anúncios |
| **Arquitetura modular** | Componentes reutilizáveis | Widgets de dashboard, sistemas de plugins |
| **Conteúdo de origem cruzada** | Carrega recursos de domínios diferentes | Mapas, players de vídeo, dashboards de analytics |

### Modelo de Segurança: Política de Mesma Origem (Same-Origin Policy)

O navegador impõe uma **Política de Mesma Origem** para iframes:

- **Iframes de mesma origem**: O pai pode acessar o DOM do iframe via JavaScript (`iframe.contentDocument`)
- **Iframes de origem cruzada**: O pai não pode acessar o DOM do iframe diretamente (restrição de segurança)

Essa barreira de segurança é o motivo pelo qual ferramentas de automação precisam de mecanismos especiais (como o CDP) para interagir com o conteúdo do iframe.

!!! warning "Importante para automação"
    Automação tradicional baseada em JavaScript (como as primeiras abordagens do Selenium) não pode acessar diretamente o conteúdo de iframes de origem cruzada devido à segurança do navegador. O CDP opera em um nível mais baixo, contornando essa limitação para fins de depuração.

---

## O Desafio: Iframes Fora de Processo (OOPIFs)

### O que são OOPIFs?

O Chromium moderno usa **isolamento de site** (site isolation) para segurança e estabilidade. Isso significa que origens diferentes podem ser renderizadas em processos separados do SO. Um iframe de uma origem diferente torna-se um **Iframe Fora de Processo (OOPIF)**.

```mermaid
graph LR
    subgraph "Processo 1: example.com"
        MainPage[DOM da Página Principal]
    end
    
    subgraph "Processo 2: widget.com"
        IframeDOM[DOM do Iframe]
    end
    
    MainPage -.Fronteira do Processo.-> IframeDOM
```

### Por que OOPIFs Complicam a Automação

| Aspecto | Iframe no Mesmo Processo | Iframe Fora de Processo (OOPIF) |
|--------|-------------------|-------------------------------|
| **Acesso ao DOM** | Árvore de documento compartilhada na memória | Alvo (target) separado com seu próprio documento |
| **Roteamento de comandos** | Conexão única | Requer anexação ao alvo e roteamento de sessão |
| **Árvore de frames** | Todos os frames em uma árvore | Frame raiz + alvos separados para OOPIFs |
| **Contexto JavaScript** | Mesmo contexto de execução | Contexto de execução diferente por processo |
| **Comunicação CDP** | Comandos diretos | Comandos devem incluir `sessionId` |

### A Abordagem Tradicional (Troca Manual de Contexto)

Sem um manuseio sofisticado, automatizar OOPIFs requer:

```python
# Abordagem tradicional (manual) com outras ferramentas
main_page = browser.get_page()
iframe_element = main_page.find_element_by_id("iframe-id")

# Deve trocar manualmente o contexto
driver.switch_to.frame(iframe_element)

# Agora os comandos miram o iframe
button = driver.find_element_by_id("button-in-iframe")
button.click()

# Deve trocar manualmente de volta
driver.switch_to.default_content()
```

**Problemas com esta abordagem:**

1. **Carga para o desenvolvedor**: Todo iframe requer gerenciamento explícito de contexto
2. **Iframes aninhados**: Cada nível precisa de outra troca
3. **Detecção de OOPIF**: Difícil saber quando a anexação manual é necessária
4. **Propenso a erros**: Esquecer de trocar de volta → comandos subsequentes falham
5. **Não componentizável**: Funções auxiliares precisam saber seu contexto de iframe

### A Solução do Pydoll: Resolução Transparente de Contexto

O Pydoll elimina a troca manual de contexto resolvendo os contextos de iframe automaticamente:

```python
# Abordagem Pydoll (sem troca manual)
iframe = await tab.find(id="iframe-id")
button = await iframe.find(id="button-in-iframe")
await button.click()

# Iframes aninhados? Mesmo padrão
outer = await tab.find(id="outer-iframe")
inner = await outer.find(tag_name="iframe")
button = await inner.find(text="Submit")
await button.click()
```

A complexidade é tratada internamente. Vamos explorar como.

---

## Protocolo Chrome DevTools e Gerenciamento de Frames

Como discutido em [Análise Aprofundada → Fundamentos → Protocolo Chrome DevTools](./cdp.md), o CDP fornece controle abrangente do navegador via comunicação WebSocket. O gerenciamento de frames é distribuído por múltiplos domínios do CDP.

### Domínios CDP Relevantes

#### 1. **Domínio Page**

Gerencia o ciclo de vida da página, frames e navegação.

**Métodos principais:**

- `Page.getFrameTree()`: Retorna a estrutura hierárquica de todos os frames em uma página
  ```json
  {
    "frameTree": {
      "frame": {
        "id": "main-frame-id",
        "url": "https://example.com",
        "securityOrigin": "https://example.com",
        "mimeType": "text/html"
      },
      "childFrames": [
        {
          "frame": {
            "id": "child-frame-id",
            "parentId": "main-frame-id",
            "url": "https://widget.com/embed"
          }
        }
      ]
    }
  }
  ```

- `Page.createIsolatedWorld(frameId, worldName)`: Cria um novo contexto de execução JavaScript em um frame específico
  ```json
  {
    "executionContextId": 42
  }
  ```

**Uso no Pydoll:**

```python
# De pydoll/elements/web_element.py
@staticmethod
async def _get_frame_tree_for(
    handler: ConnectionHandler, session_id: Optional[str]
) -> FrameTree:
    """Pega a árvore de frames da Página para a conexão/alvo dados."""
    command = PageCommands.get_frame_tree()
    if session_id:
        command['sessionId'] = session_id
    response: GetFrameTreeResponse = await handler.execute_command(command)
    return response['result']['frameTree']
```

#### 2. **Domínio DOM**

Fornece acesso à estrutura do DOM.

**Métodos principais:**

- `DOM.describeNode(objectId)`: Retorna informação detalhada sobre um nó DOM
  ```json
  {
    "node": {
      "nodeId": 123,
      "backendNodeId": 456,
      "nodeName": "IFRAME",
      "frameId": "parent-frame-id",
      "contentDocument": {
        "frameId": "iframe-frame-id",
        "documentURL": "https://embedded.com/page.html"
      }
    }
  }
  ```

- `DOM.getFrameOwner(frameId)`: Retorna o `backendNodeId` do elemento `<iframe>` que possui um frame
  ```json
  {
    "backendNodeId": 456
  }
  ```

**Uso no Pydoll:**

```python
# De pydoll/elements/web_element.py
@staticmethod
async def _owner_backend_for(
    handler: ConnectionHandler, session_id: Optional[str], frame_id: str
) -> Optional[int]:
    """Pega o backendNodeId do elemento DOM que possui o frame dado."""
    command = DomCommands.get_frame_owner(frame_id=frame_id)
    if session_id:
        command['sessionId'] = session_id
    response: GetFrameOwnerResponse = await handler.execute_command(command)
    return response.get('result', {}).get('backendNodeId')
```

#### 3. **Domínio Target**

Gerencia alvos (targets) do navegador (páginas, iframes, workers, etc.).

**Métodos principais:**

- `Target.getTargets()`: Lista todos os alvos disponíveis
  ```json
  {
    "targetInfos": [
      {
        "targetId": "page-target-id",
        "type": "page",
        "title": "Main Page",
        "url": "https://example.com"
      },
      {
        "targetId": "iframe-target-id",
        "type": "iframe",
        "title": "",
        "url": "https://widget.com/embed",
        "parentFrameId": "main-frame-id"
      }
    ]
  }
  ```

- `Target.attachToTarget(targetId, flatten)`: Anexa a um alvo para depuração
  - Quando `flatten=true`: Retorna um `sessionId` para rotear comandos no modo "flattened"
  - Toda comunicação acontece sobre o mesmo WebSocket, diferenciada por `sessionId`

**Uso no Pydoll:**

```python
# De pydoll/interactions/iframe.py (simplificado)
async def _resolve_oopif_by_parent(self, content_frame_id: str, ...):
    """Resolve um OOPIF usando o content frame id."""
    browser_handler = ConnectionHandler(...)
    targets_response: GetTargetsResponse = await browser_handler.execute_command(
        TargetCommands.get_targets()
    )
    target_infos = targets_response.get('result', {}).get('targetInfos', [])

    # Encontra alvos cujo parentFrameId bate
    direct_children = [
        target_info for target_info in target_infos
        if target_info.get('parentFrameId') == content_frame_id
    ]
    
    if direct_children:
        attach_response: AttachToTargetResponse = await browser_handler.execute_command(
            TargetCommands.attach_to_target(
                target_id=direct_children[0]['targetId'], 
                flatten=True
            )
        )
        attached_session_id = attach_response.get('result', {}).get('sessionId')
        # ... usa session_id para comandos subsequentes
```

#### 4. **Domínio Runtime**

Executa JavaScript e gerencia contextos de execução.

**Métodos principais:**

- `Runtime.evaluate(expression, contextId)`: Avalia JavaScript em um contexto de execução específico
- `Runtime.callFunctionOn(functionDeclaration, objectId)`: Chama uma função com um objeto específico como `this`

**Uso no Pydoll para acesso ao documento do iframe:**

```python
# De pydoll/elements/web_element.py
async def _set_iframe_document_object_id(self, execution_context_id: int):
    """Avalia document.documentElement no contexto do iframe e cacheia seu object id."""
    evaluate_command = RuntimeCommands.evaluate(
        expression='document.documentElement',
        context_id=execution_context_id,
    )
    if self._iframe_context and self._iframe_context.session_id:
        evaluate_command['sessionId'] = self._iframe_context.session_id
    
    evaluate_response: EvaluateResponse = await (
        (self._iframe_context.session_handler if self._iframe_context else None)
        or self._connection_handler
    ).execute_command(evaluate_command)
    
    document_object_id = evaluate_response.get('result', {}).get('result', {}).get('objectId')
    if self._iframe_context:
        self._iframe_context.document_object_id = document_object_id
```

---

## Contextos de Execução e Mundos Isolados

### O que é um Contexto de Execução?

Um **contexto de execução** é um ambiente onde o código JavaScript é executado. Todo frame em um navegador tem pelo menos um contexto de execução. O contexto inclui:

- **Objeto global** (`window` em navegadores)
- **Cadeia de escopo**: Como variáveis são resolvidas
- **Vínculo 'this'**: A que `this` se refere
- **Ambiente de variáveis**: Todas as variáveis e funções declaradas

### Múltiplos Contextos por Frame

Um único frame pode ter múltiplos contextos de execução:

1. **Mundo principal (contexto padrão)**: Onde o JavaScript da própria página roda
2. **Mundos isolados**: Contextos separados que compartilham o mesmo DOM mas têm escopos globais JavaScript diferentes

```mermaid
graph TB
    Frame[Frame: example.com/page]
    Frame --> MainWorld[Mundo Principal<br/>JavaScript da Página]
    Frame --> IsolatedWorld1[Mundo Isolado 1<br/>Script de conteúdo de extensão]
    Frame --> IsolatedWorld2[Mundo Isolado 2<br/>Automação Pydoll]
    
    DOM[Árvore DOM Compartilhada]
    MainWorld -.pode acessar.-> DOM
    IsolatedWorld1 -.pode acessar.-> DOM
    IsolatedWorld2 -.pode acessar.-> DOM
    
    MainWorld -.não pode acessar.-> IsolatedWorld1
    MainWorld -.não pode acessar.-> IsolatedWorld2
```

### O que é um Mundo Isolado?

Um **mundo isolado** é um contexto de execução JavaScript separado que:

- **Compartilha o mesmo DOM**: Pode ler/modificar elementos DOM
- **Tem um objeto global separado**: Variáveis/funções não vazam entre mundos
- **Previne interferência**: Scripts da página não podem detectar ou interferir com scripts do mundo isolado

**Origem**: Mundos isolados foram criados para extensões de navegador. Scripts de conteúdo (content scripts) rodam em mundos isolados para que possam interagir com o DOM da página sem:

- Scripts da página sobrescrevendo suas variáveis
- Serem detectados por código anti-tamper (anti-adulteração)
- Conflitarem com o JavaScript da página

### Por que o Pydoll Usa Mundos Isolados para Iframes

Quando o Pydoll interage com o conteúdo de um iframe, ele cria um mundo isolado no contexto desse iframe. Isso fornece:

1. **Ambiente JavaScript limpo**: Sem conflitos com os scripts do próprio iframe
2. **Comportamento consistente**: Scripts de automação funcionam independentemente de qual JavaScript o iframe roda
3. **Anti-detecção**: O JavaScript do iframe não pode detectar facilmente a presença do Pydoll
4. **Avaliação segura**: Código de automação não pode acidentalmente disparar lógica da página

**Implementação:**

```python
# De pydoll/elements/web_element.py
@staticmethod
async def _create_isolated_world_for_frame(
    frame_id: str,
    handler: ConnectionHandler,
    session_id: Optional[str],
) -> int:
    """Cria um mundo isolado (Page.createIsolatedWorld) para o frame dado."""
    create_command = PageCommands.create_isolated_world(
        frame_id=frame_id,
        world_name=f'pydoll::iframe::{frame_id}',
        grant_universal_access=True,
    )
    if session_id:
        create_command['sessionId'] = session_id
    
    create_response: CreateIsolatedWorldResponse = await handler.execute_command(
        create_command
    )
    execution_context_id = create_response.get('result', {}).get('executionContextId')
    if not execution_context_id:
        raise InvalidIFrame('Incapaz de criar mundo isolado para o iframe')
    return execution_context_id
```

O parâmetro `grant_universal_access=True` permite ao mundo isolado:

- Acessar frames de origem cruzada (normalmente bloqueado pela política de mesma origem)
- Realizar operações privilegiadas necessárias para automação

!!! tip "Mundos isolados na prática"
    Toda vez que você usa `await iframe.find(...)`, o Pydoll avalia a consulta do seletor em um mundo isolado criado especificamente para aquele iframe. Isso garante que sua lógica de automação nunca conflite com o JavaScript do próprio iframe, e o iframe não possa detectar ou bloquear sua automação.

---

## Referência de Identificadores CDP

Entender os identificadores do CDP é crucial para o manuseio de iframes. Aqui está uma referência abrangente:

| Identificador | Domínio | Escopo | Propósito | Exemplo de Uso no Pydoll |
|------------|--------|-------|---------|----------------------|
| **`nodeId`** | DOM | Local do Documento | Identifica um nó DOM dentro de um contexto de documento específico | Operações internas do CDP; não é estável entre navegações |
| **`backendNodeId`** | DOM | Estável entre documentos | Identificador estável para um nó DOM; pode mapear frames para elementos donos | Usado para parear elementos iframe com IDs de frame via `DOM.getFrameOwner` |
| **`frameId`** | Page | Frame | Identifica um frame na árvore de frames da página | Usado para especificar qual frame para `Page.createIsolatedWorld` e travessia da árvore de frames |
| **`targetId`** | Target | Global | Identifica um alvo (target) de depuração (página, iframe, worker, etc.) | Usado para `Target.attachToTarget` para conectar a OOPIFs |
| **`sessionId`** | Target | Específico do Alvo | Roteia comandos para um alvo específico no modo "flattened" | Injetado em comandos para roteá-los ao OOPIF correto |
| **`executionContextId`** | Runtime | Frame + Mundo | Identifica um contexto de execução JavaScript (incluindo mundos isolados) | Retornado por `Page.createIsolatedWorld`; usado em `Runtime.evaluate` |
| **`objectId`** | Runtime | Contexto de Execução | Referência de objeto remoto (ex: elemento DOM, função, objeto) | Referência ao `document.documentElement` do iframe para consultas relativas |

### Relacionamentos dos Identificadores

Veja como os identificadores se relacionam durante a resolução do iframe:

```
┌─────────────────────────────────────────────────────────────────────────┐
│                         Fluxo de Resolução                              │
└─────────────────────────────────────────────────────────────────────────┘

1. Início: Elemento <iframe>
   └─ backendNodeId: 789
   
2. Encontrar Frame ─────────[DOM.getFrameOwner]──────────────┐
   └─ frameId: abc-123                                       │
                                                             │
3. OOPIF? Checar Origem ────[Origem diferente detectada]─────┤
   └─ targetId: xyz-456                                      │
                                                             │
4. Anexar ao Alvo ──────────[Target.attachToTarget]──────────┤
   └─ sessionId: session-789                                 │
                                                             │
5. Criar Mundo Isolado ─────[Page.createIsolatedWorld]───────┤
   └─ executionContextId: 42                                 │
                                                             │
6. Obter Documento ─────────[Runtime.evaluate]───────────────┘
   └─ objectId: obj-999
```

**Pontos chave de transformação:**

| De | Método | Para | Propósito |
|------|--------|-----|---------|
| `backendNodeId` | `DOM.getFrameOwner` | `frameId` | Encontrar qual frame pertence ao elemento iframe (comparando o `backendNodeId` do dono de cada frame) |
| `targetId` | `Target.attachToTarget(flatten=true)` | `sessionId` | Conectar ao OOPIF para roteamento de comandos |
| `frameId` | `Page.createIsolatedWorld` | `executionContextId` | Criar ambiente JavaScript seguro |
| `executionContextId` | `Runtime.evaluate('document.documentElement')` | `objectId` | Obter referência ao documento do iframe |

### Representação no Código do Pydoll

```python
# De pydoll/elements/web_element.py
@dataclass
class _IFrameContext:
    """Encapsula todos os identificadores e informação de roteamento para um iframe."""
    frame_id: str                                   # frameId: identifica o frame
    document_url: Optional[str] = None              # URL carregada do frame
    execution_context_id: Optional[int] = None      # executionContextId: mundo isolado
    document_object_id: Optional[str] = None        # objectId: document.documentElement
    session_handler: Optional[ConnectionHandler] = None  # para alvos OOPIF
    session_id: Optional[str] = None                # sessionId: roteia comandos para OOPIF
```

Este dataclass é cacheado em cada `WebElement` representando um iframe, permitindo o roteamento automático de todas as operações subsequentes.

---

## Pipeline de Resolução do Pydoll

Quando você acessa um iframe no Pydoll (ex: `await iframe.find(...)`), um elaborado pipeline de resolução é executado nos bastidores. Esta seção detalha cada passo.

### Fluxo de Alto Nível

```mermaid
sequenceDiagram
    participant User as Usuário
    participant WebElement
    participant Pipeline as Pipeline de Resolução
    participant CDP
    
    User->>WebElement: iframe.find(id='button')
    WebElement->>WebElement: Verifica se contexto do iframe está em cache
    alt Contexto não cacheado
        WebElement->>Pipeline: _ensure_iframe_context()
        Pipeline->>CDP: DOM.describeNode(iframe)
        CDP-->>Pipeline: Info do Nó (frameId?, backendNodeId, etc.)
        
        alt frameId não está na info do nó
            Pipeline->>Pipeline: _resolve_frame_by_owner()
            Pipeline->>CDP: Page.getFrameTree()
            CDP-->>Pipeline: Árvore de frames
            Pipeline->>CDP: DOM.getFrameOwner(cada frame)
            CDP-->>Pipeline: backendNodeId
            Pipeline->>Pipeline: Compara backendNodeId para achar frameId
        end
        
        alt frameId ainda faltando (OOPIF)
            Pipeline->>Pipeline: _resolve_oopif_by_parent()
            Pipeline->>CDP: Target.getTargets()
            CDP-->>Pipeline: Lista de alvos
            Pipeline->>CDP: Target.attachToTarget(targetId, flatten=true)
            CDP-->>Pipeline: sessionId
            Pipeline->>CDP: Page.getFrameTree(sessionId)
            CDP-->>Pipeline: Árvore de frames do OOPIF
        end
        
        Pipeline->>CDP: Page.createIsolatedWorld(frameId)
        CDP-->>Pipeline: executionContextId
        
        Pipeline->>CDP: Runtime.evaluate('document.documentElement', contextId)
        CDP-->>Pipeline: objectId (referência do documento)
        
        Pipeline->>WebElement: Cacheia _IFrameContext
    end
    
    WebElement->>WebElement: Usa contexto cacheado para find()
    WebElement-->>User: Elemento Button (com contexto)
```

### Análise Aprofundada Passo a Passo

#### **Passo 1: Descrever o Elemento Iframe**

**Objetivo**: Extrair metadados do elemento DOM `<iframe>`.

**Método**: `DOM.describeNode(objectId=iframe_object_id)`

**O que obtemos**:

- `backendNodeId`: Identificador estável para o elemento iframe
- `frameId` (de `contentDocument`): Se o conteúdo do iframe já está carregado e no mesmo processo
- `documentURL`: A URL carregada no iframe
- `parentFrameId` (do campo `frameId` no nó): O frame contendo este elemento iframe

**Código**:

```python
# De pydoll/interactions/iframe.py
async def resolve(self) -> IFrameContext:
    """Resolve e retorna o contexto do iframe."""
    base_handler, base_session_id = self._get_base_session()
    node_info = await self._describe_element_node(base_handler, base_session_id)
    frame_id, document_url, content_frame_id, backend_node_id = self._extract_frame_metadata(
        node_info
    )
    # ... continua resolução
```

**Auxiliar**:

```python
@staticmethod
def _extract_frame_metadata(
    node_info: Node,
) -> tuple[Optional[str], Optional[str], Optional[str], Optional[int]]:
    """Extrai metadados relacionados a iframe de um Nó DOM.describeNode."""
    content_document = node_info.get('contentDocument') or {}
    content_frame_id = node_info.get('frameId')
    backend_node_id = node_info.get('backendNodeId')
    frame_id = content_document.get('frameId')
    document_url = (
        content_document.get('documentURL')
        or content_document.get('baseURL')
        or node_info.get('documentURL')
        or node_info.get('baseURL')
    )
    return frame_id, document_url, content_frame_id, backend_node_id
```

**Resultado**:

- **Se `frame_id` está presente**: Ótimo! O iframe está no mesmo processo; prossiga para o Passo 4.
- **Se `frame_id` está faltando**: O iframe pode ser um OOPIF ou não totalmente carregado; prossiga para o Passo 2.

---

#### **Passo 2: Resolver Frame pelo Dono (comparação de backendNodeId)**

**Objetivo**: Encontrar o `frameId` comparando o `backendNodeId` do elemento iframe com os donos de frames na árvore de frames.

**Estratégia**:

1. Buscar a árvore de frames da página (`Page.getFrameTree`)
2. Para cada frame na árvore, chamar `DOM.getFrameOwner(frameId)` para obter o `backendNodeId` do elemento iframe dono
3. Comparar com o `backendNodeId` do nosso iframe
4. Quando eles baterem, encontramos o `frameId` correto

**Código**:

```python
# De pydoll/elements/web_element.py
async def _resolve_frame_by_owner(
    self,
    base_handler: ConnectionHandler,
    base_session_id: Optional[str],
    backend_node_id: int,
    current_document_url: Optional[str],
) -> tuple[Optional[str], Optional[str]]:
    """Resolve um ID de frame e URL comparando o backend_node_id do dono."""
    owner_frame_id, owner_url = await self._find_frame_by_owner(
        base_handler, base_session_id, backend_node_id
    )
    if not owner_frame_id:
        return None, current_document_url
    return owner_frame_id, owner_url or current_document_url

async def _find_frame_by_owner(
    self, handler: ConnectionHandler, session_id: Optional[str], backend_node_id: int
) -> tuple[Optional[str], Optional[str]]:
    """Encontra um frame comparando o backend_node_id do dono do elemento <iframe>."""
    frame_tree = await self._get_frame_tree_for(handler, session_id)
    for frame_node in WebElement._walk_frames(frame_tree):
        candidate_frame_id = frame_node.get('id', '')
        if not candidate_frame_id:
            continue
        owner_backend_id = await self._owner_backend_for(
            handler, session_id, candidate_frame_id
        )
        if owner_backend_id == backend_node_id:
            return candidate_frame_id, frame_node.get('url')
    return None, None
```

**Por que isso é necessário**:

- `DOM.describeNode` às vezes não inclui o `contentDocument.frameId` para iframes de origem cruzada ou carregados tardiamente
- A árvore de frames sempre contém todos os frames (mesmo OOPIFs), então podemos achá-lo indiretamente

**Resultado**:

- **Se `frameId` encontrado**: Prossiga para o Passo 4.
- **Se ainda não encontrado**: O iframe é provavelmente um OOPIF em um alvo separado; prossiga para o Passo 3.

---

#### **Passo 3: Resolver OOPIF pelo Frame Pai**

**Objetivo**: Para Iframes Fora de Processo, encontrar o alvo correto, anexar a ele e obter o `frameId` da árvore de frames do alvo (e o `sessionId` de roteamento quando necessário).

**Quando esse passo roda**:

- Iframes de **mesma origem** / in-process que já têm um `frameId` e **não** têm `backendNodeId` pulam esse passo (são tratados diretamente).
- Iframes **cross-origin / OOPIF** (com `backendNodeId`) ou iframes cujo `frameId` não pôde ser resolvido no Passo 2 usam esse passo.

**Estratégia**:

**3a. Busca por alvo filho direto (caminho rápido)**:

1. Chamar `Target.getTargets()` para listar todos os alvos de depuração.
2. Filtrar alvos onde `type` é `"iframe"` ou `"page"` e `parentFrameId` bate com nosso frame pai.
3. Se houver **apenas um** filho direto **e não houver `backendNodeId`**, anexar diretamente a esse alvo com `Target.attachToTarget(targetId, flatten=true)`.
4. Buscar `Page.getFrameTree(sessionId)` para aquele alvo; o frame raiz dessa árvore é o frame do nosso iframe.

Quando existem **múltiplos** filhos diretos ou temos um `backendNodeId` (caso típico de OOPIF), o Pydoll itera sobre cada alvo filho:

1. Anexa com `Target.attachToTarget(flatten=true)`.
2. Busca `Page.getFrameTree(sessionId)` e lê o `frame.id` raiz.
3. Chama `DOM.getFrameOwner(frameId=root_id)` na conexão principal.
4. Compara o `backendNodeId` retornado com o `backendNodeId` do elemento `<iframe>` original.
5. O filho cujo dono raiz coincide é selecionado como o alvo OOPIF correto.

**3b. Fallback: Escanear todos os alvos (dono raiz + busca por filho)**:

Se nenhum filho direto adequado for encontrado (ou se `parentFrameId` estiver incompleto), o Pydoll recorre a escanear **todos** os alvos iframe/page:

1. Iterar todos os alvos iframe/page.
2. Anexar a cada um e buscar sua árvore de frames.
3. Primeiro, tentar casar o **dono do frame raiz** via `DOM.getFrameOwner(root_frame_id)` com o `backendNodeId` do iframe.
4. Se isso não bater, procurar um **frame filho** cujo `parentId` seja o `content_frame_id` (isso cobre casos em que o OOPIF está aninhado sob um frame intermediário).

**Código**:

```python
# De pydoll/interactions/iframe.py
async def _resolve_oopif_by_parent(
    self,
    content_frame_id: str,
    backend_node_id: Optional[int],
    base_handler: Optional[ConnectionHandler] = None,
    base_session_id: Optional[str] = None,
) -> tuple[Optional[ConnectionHandler], Optional[str], Optional[str], Optional[str]]:
    """Resolve um OOPIF usando o content frame id."""
    browser_handler = ConnectionHandler(
        connection_port=self._element._connection_handler._connection_port
    )
    targets_response: GetTargetsResponse = await browser_handler.execute_command(
        TargetCommands.get_targets()
    )
    target_infos = targets_response.get('result', {}).get('targetInfos', [])

    # O handler que pode resolver DOM.getFrameOwner para o contexto do elemento.
    # Quando o <iframe> está dentro de um OOPIF aninhado, o handler do Tab
    # não tem visibilidade; devemos rotear pela sessão que originalmente
    # encontrou o elemento.
    owner_handler = base_handler or self._element._connection_handler
    owner_session_id = base_session_id

    # Estratégia 3a: Filhos diretos (caminho rápido)
    direct_children = [
        target_info
        for target_info in target_infos
        if target_info.get('type') in {'iframe', 'page'}
        and target_info.get('parentFrameId') == content_frame_id
    ]

    is_single_child = len(direct_children) == 1
    for child_target in direct_children:
        attach_response: AttachToTargetResponse = await browser_handler.execute_command(
            TargetCommands.attach_to_target(
                target_id=child_target['targetId'], flatten=True
            )
        )
        attached_session_id = attach_response.get('result', {}).get('sessionId')
        if not attached_session_id:
            continue

        frame_tree = await self._get_frame_tree_for(browser_handler, attached_session_id)
        root_frame = (frame_tree or {}).get('frame', {})
        root_frame_id = root_frame.get('id', '')

        # Caso simples / mesma origem: filho único e sem backend_node_id
        if is_single_child and root_frame_id and backend_node_id is None:
            return (
                browser_handler,
                attached_session_id,
                root_frame_id,
                root_frame.get('url'),
            )

        # Caso OOPIF: confirmar propriedade via DOM.getFrameOwner
        if root_frame_id and backend_node_id is not None:
            owner_backend_id = await self._owner_backend_for(
                owner_handler, owner_session_id, root_frame_id
            )
            if owner_backend_id == backend_node_id:
                return (
                    browser_handler,
                    attached_session_id,
                    root_frame_id,
                    root_frame.get('url'),
                )

    # Estratégia 3b: Escanear todos os alvos (dono raiz + busca por filho)
    for target_info in target_infos:
        if target_info.get('type') not in {'iframe', 'page'}:
            continue
        attach_response = await browser_handler.execute_command(
            TargetCommands.attach_to_target(
                target_id=target_info.get('targetId', ''), flatten=True
            )
        )
        attached_session_id = attach_response.get('result', {}).get('sessionId')
        if not attached_session_id:
            continue

        frame_tree = await self._get_frame_tree_for(browser_handler, attached_session_id)
        root_frame = (frame_tree or {}).get('frame', {})
        root_frame_id = root_frame.get('id', '')

        # Match direto: content_frame_id igual ao root frame ID do alvo
        if root_frame_id and root_frame_id == content_frame_id:
            return (
                browser_handler,
                attached_session_id,
                root_frame_id,
                root_frame.get('url'),
            )

        # Primeiro tenta casar o dono do frame raiz via backend_node_id
        if root_frame_id and backend_node_id is not None:
            owner_backend_id = await self._owner_backend_for(
                owner_handler, owner_session_id, root_frame_id
            )
            if owner_backend_id == backend_node_id:
                return (
                    browser_handler,
                    attached_session_id,
                    root_frame_id,
                    root_frame.get('url'),
                )

        # Fallback: procurar frame filho cujo parentId seja content_frame_id
        child_frame_id = IFrameContextResolver._find_child_by_parent(
            frame_tree, content_frame_id
        )
        if child_frame_id:
            return browser_handler, attached_session_id, child_frame_id, None

    return None, None, None, None
```

**Resultado**:

- **Se OOPIF resolvido**: Agora temos `sessionId`, `session_handler` e `frameId`; prossiga para o Passo 4.
- **Se resolução falhar**: Lança exceção `InvalidIFrame` (tratada em `_ensure_iframe_context`).

---

#### **Passo 4: Criar Mundo Isolado**

**Objetivo**: Criar um contexto de execução JavaScript separado no frame resolvido.

**Método**: `Page.createIsolatedWorld(frameId, worldName='pydoll::iframe::<frameId>', grantUniversalAccess=true)`

**Parâmetros**:
- `frameId`: O frame onde o mundo isolado é criado
- `worldName`: Identificador para o mundo (útil para depuração)
- `grantUniversalAccess`: Permite acesso de origem cruzada (necessário para automação)

**Resposta**: `{ executionContextId: 42 }`

**Código**:

```python
# De pydoll/elements/web_element.py
@staticmethod
async def _create_isolated_world_for_frame(
    frame_id: str,
    handler: ConnectionHandler,
    session_id: Optional[str],
) -> int:
    """Cria um mundo isolado para o frame dado."""
    create_command = PageCommands.create_isolated_world(
        frame_id=frame_id,
        world_name=f'pydoll::iframe::{frame_id}',
        grant_universal_access=True,
    )
    if session_id:
        create_command['sessionId'] = session_id
    create_response: CreateIsolatedWorldResponse = await handler.execute_command(create_command)
    execution_context_id = create_response.get('result', {}).get('executionContextId')
    if not execution_context_id:
        raise InvalidIFrame('Incapaz de criar mundo isolado para o iframe')
    return execution_context_id
```

**Por que mundo isolado**:

- **Isolamento**: Nosso JavaScript de automação não interfere com o JavaScript do iframe
- **Anti-detecção**: O iframe não pode detectar nossa presença facilmente
- **Consistência**: Comportamento é previsível independentemente do ambiente de script do iframe

**Resultado**: Temos um `executionContextId` para rodar JavaScript no iframe.

---

#### **Passo 5: Fixar o Documento do Iframe como um Objeto Runtime**

**Objetivo**: Obter uma referência `objectId` ao `document.documentElement` do iframe (o elemento `<html>` do iframe).

**Método**: `Runtime.evaluate(expression='document.documentElement', contextId=executionContextId)`

**Por que precisamos disso**:

- Para executar **consultas relativas** (como `element.querySelector()`) dentro do iframe
- O `objectId` permite usar `Runtime.callFunctionOn(objectId, ...)` com `this` vinculado ao documento do iframe

**Código**:

```python
# De pydoll/elements/web_element.py
async def _set_iframe_document_object_id(self, execution_context_id: int) -> None:
    """Avalia document.documentElement no contexto do iframe e cacheia seu object id."""
    evaluate_command = RuntimeCommands.evaluate(
        expression='document.documentElement',
        context_id=execution_context_id,
    )
    if self._iframe_context and self._iframe_context.session_id:
        evaluate_command['sessionId'] = self._iframe_context.session_id
    evaluate_response: EvaluateResponse = await (
        (self._iframe_context.session_handler if self._iframe_context else None)
        or self._connection_handler
    ).execute_command(evaluate_command)
    result_object = evaluate_response.get('result', {}).get('result', {})
    document_object_id = result_object.get('objectId')
    if not document_object_id:
        raise InvalidIFrame('Incapaz de obter referência do documento para o iframe')
    if self._iframe_context:
        self._iframe_context.document_object_id = document_object_id
```

**Resultado**: O `_IFrameContext` está agora totalmente populado e cacheado no `WebElement`.

---

#### **Passo 6: Cachear e Propagar Contexto**

**Objetivo**: Armazenar o contexto resolvido no elemento iframe e propagá-lo para todos os elementos filhos encontrados dentro do iframe.

**Cacheando**:

```python
# De pydoll/elements/web_element.py
def _init_iframe_context(
    self,
    frame_id: str,
    document_url: Optional[str],
    session_handler: Optional[ConnectionHandler],
    session_id: Optional[str],
) -> None:
    """Inicializa e cacheia contexto de iframe neste elemento."""
    self._iframe_context = _IFrameContext(frame_id=frame_id, document_url=document_url)
    # Limpa atributos de roteamento (estes eram para iframes aninhados)
    if hasattr(self, '_routing_session_handler'):
        delattr(self, '_routing_session_handler')
    if hasattr(self, '_routing_session_id'):
        delattr(self, '_routing_session_id')
    # Armazena roteamento OOPIF se necessário
    if session_handler and session_id:
        self._iframe_context.session_handler = session_handler
        self._iframe_context.session_id = session_id
```

**Propagação** (ao encontrar elementos dentro do iframe):

```python
# De pydoll/elements/mixins/find_elements_mixin.py
def _apply_iframe_context_to_element(
    self, element: WebElement, iframe_context: _IFrameContext | None
) -> None:
    """Propaga contexto de iframe para o elemento recém-criado."""
    if not iframe_context:
        return
    
    # Se o elemento filho também é um iframe, configura roteamento
    if getattr(element, 'is_iframe', False):
        element._routing_session_handler = (
            iframe_context.session_handler or self._connection_handler
        )
        element._routing_session_id = iframe_context.session_id
        element._routing_parent_frame_id = iframe_context.frame_id
        return
    
    # Caso contrário, injeta o contexto do iframe pai
    element._iframe_context = iframe_context
```

**Por que propagação importa**:

- Elementos encontrados dentro de um iframe herdam o contexto do iframe
- Isso garante que operações subsequentes (clicar, digitar, encontrar elementos aninhados) automaticamente usem o roteamento correto
- Iframes aninhados recebem informação de roteamento para que possam resolver seu próprio contexto relativo ao iframe pai

---

## Roteamento de Sessão e Modo "Flattened"

### O Modelo de Sessão "Flattened"

Como discutido em [Análise Aprofundada → Fundamentos → CDP](./cdp.md), o CDP tradicional usa conexões WebSocket separadas para cada alvo. O **Modo "Flattened"** (unificado) é uma otimização onde todos os alvos compartilham uma única conexão WebSocket, com comandos roteados usando um `sessionId`.

```mermaid
graph TB
    subgraph "Modo Tradicional"
        WS1[WebSocket 1] --> MainPage[Alvo Página Principal]
        WS2[WebSocket 2] --> Iframe1[Alvo OOPIF 1]
        WS3[WebSocket 3] --> Iframe2[Alvo OOPIF 2]
    end
    
    subgraph "Modo Flattened"
        WS[WebSocket Único] --> Router{Roteador CDP}
        Router -->|sessionId: null| MainPage2[Alvo Página Principal]
        Router -->|sessionId: session-1| Iframe3[Alvo OOPIF 1]
        Router -->|sessionId: session-2| Iframe4[Alvo OOPIF 2]
    end
```

### Como Funciona o Roteamento de Sessão

**Ao anexar a um OOPIF**:

```python
response = await handler.execute_command(
    TargetCommands.attach_to_target(target_id="iframe-target-id", flatten=True)
)
session_id = response['result']['sessionId']  # ex: "8E6C...-1234"
```

**Ao enviar um comando para aquele OOPIF**:

```python
command = PageCommands.get_frame_tree()
command['sessionId'] = 'session-1'  # Roteia para o OOPIF
response = await handler.execute_command(command)
```

A implementação CDP do navegador roteia o comando para o alvo correto baseado no `sessionId`.

### Roteamento de Comandos do Pydoll

Todo comando enviado por elementos Pydoll é automaticamente roteado para o alvo correto:

```python
# De pydoll/elements/mixins/find_elements_mixin.py
def _resolve_routing(self) -> tuple[ConnectionHandler, Optional[str]]:
    """Resolve handler e sessionId para o contexto atual."""
    # Verifica se elemento tem um contexto iframe com roteamento OOPIF
    iframe_context = getattr(self, '_iframe_context', None)
    if iframe_context and getattr(iframe_context, 'session_handler', None):
        return iframe_context.session_handler, getattr(iframe_context, 'session_id', None)
    
    # Verifica se elemento herdou roteamento de um iframe pai
    routing_handler = getattr(self, '_routing_session_handler', None)
    if routing_handler is not None:
        return routing_handler, getattr(self, '_routing_session_id', None)
    
    # Padrão: usa a conexão principal da aba
    return self._connection_handler, None

async def _execute_command(
    self, command: Command[T_CommandParams, T_CommandResponse]
) -> T_CommandResponse:
    """Executa comando CDP via handler resolvido (timeout 60s)."""
    handler, session_id = self._resolve_routing()
    if session_id:
        command['sessionId'] = session_id
    return await handler.execute_command(command, timeout=60)
```

**Lógica de roteamento**:

1. **Elemento dentro de iframe OOPIF**: Usa `iframe_context.session_id` e `iframe_context.session_handler`
2. **Iframe aninhado (filho de OOPIF)**: Usa `_routing_session_id` e `_routing_session_handler` herdados
3. **Elemento regular ou iframe no mesmo processo**: Usa conexão principal (`_connection_handler`), sem `sessionId`

### Tipagem de Comando Estendida

Para tornar `sessionId` seguro em termos de tipo (type-safe), o Pydoll estendeu o `Command` TypedDict:

```python
# De pydoll/protocol/base.py
class Command(TypedDict, Generic[T_CommandParams, T_CommandResponse]):
    """Estrutura base para todos os comandos."""
    id: NotRequired[int]
    method: str
    params: NotRequired[T_CommandParams]
    sessionId: NotRequired[str]  # Adicionado para roteamento de sessão flattened
```

Isso permite que checadores de tipo (type-checkers) reconheçam `command['sessionId'] = '...'` como válido sem suprimir avisos de tipo.

---

## Considerações de Performance

### Estratégia de Cache

**O primeiro acesso é caro**:

- `DOM.describeNode`: 1 ida e volta (round-trip)
- Recuperação da árvore de frames: 1+ idas e voltas (principal + alvos OOPIF)
- `DOM.getFrameOwner` por frame: N idas e voltas (no pior caso)
- `Target.getTargets` + anexações: 1 + M idas e voltas (M = número de alvos OOPIF)
- `Page.createIsolatedWorld`: 1 ida e volta
- `Runtime.evaluate` (documento): 1 ida e volta

**Total**: Potencialmente 5-20+ idas e voltas dependendo da estrutura da página.

**Acessos subsequentes são O(1)**:

- `iframe_context` é cacheado na instância `WebElement`
- Acessar `await iframe.iframe_context` múltiplas vezes retorna o valor cacheado imediatamente
- Todos os elementos encontrados dentro do iframe herdam o contexto (sem re-resolução)

### Otimização: Busca de Alvo "Filho Direto"

Em `_resolve_oopif_by_parent`, o Pydoll primeiro checa por filhos diretos por `parentFrameId`:

```python
direct_children = [
    target_info
    for target_info in target_infos
    if target_info.get('type') in {'iframe', 'page'}
    and target_info.get('parentFrameId') == content_frame_id
]
if direct_children:
    # Anexa diretamente, pula o escaneamento de todos os alvos
```

**Por que isso ajuda**:

- A maioria dos OOPIFs tem `parentFrameId` definido corretamente
- Evita anexar a cada alvo especulativamente
- Reduz idas e voltas de O(alvos) para O(1) no caso comum

### Resolução Paralela Assíncrona (Melhoria Futura)

Atualmente, a correspondência de dono de frame é sequencial (checa cada frame um por um). Uma otimização futura poderia paralelizar:

```python
# Atual (sequencial)
for frame_node in frames:
    owner = await self._owner_backend_for(...)
    if owner == backend_node_id:
        return frame_node['id']

# Potencial (paralelo)
results = await asyncio.gather(*(
    self._owner_backend_for(..., frame['id'])
    for frame in frames
))
for i, owner in enumerate(results):
    if owner == backend_node_id:
        return frames[i]['id']
```

Isso reduziria a latência de `N * RTT` para `RTT` (onde RTT = tempo de ida e volta).

---

## Modos de Falha e Depuração

### Cenários Comuns de Falha

#### 1. **InvalidIFrame: Incapaz de resolver frameId**

**Causa**:

- O iframe é criado dinamicamente e não inicializou completamente
- O iframe está em sandbox com políticas restritivas
- Problemas de rede atrasaram o carregamento do iframe

**Soluções**:

- **Esperar pelo iframe**: Use `await tab.find(id='iframe', timeout=10)` com um timeout
- **Verificar atributo sandbox**: Sandbox restritivo (`<iframe sandbox>`) pode bloquear algumas operações CDP
- **Estratégia de retentativa**: Implementar lógica de retentativa com backoff exponencial

**Depuração**:

```python
try:
    iframe = await tab.find(id='problem-iframe')
    context = await iframe.iframe_context
except InvalidIFrame as e:
    # Inspeciona o que temos
    node_info = await iframe._describe_node(object_id=iframe._object_id)
    print(f"Info do nó: {node_info}")
    
    # Checa árvore de frames manualmente
    frame_tree = await WebElement._get_frame_tree_for(tab._connection_handler, None)
    print(f"Árvore de frames: {frame_tree}")
```

#### 2. **InvalidIFrame: Incapaz de criar mundo isolado**

**Causa**:

- O frame foi destruído ou navegou para outra página entre os passos de resolução
- Bug do Chrome (raro)

**Soluções**:

- **Re-resolver contexto**: Limpar contexto cacheado e re-acessar
- **Verificar navegação**: Garantir que o iframe não esteja navegando durante a resolução

**Depuração**:

```python
# Limpa cache e retenta
iframe._iframe_context = None
context = await iframe.iframe_context
```

#### 3. **InvalidIFrame: Incapaz de obter referência do documento**

**Causa**:

- O mundo isolado foi criado mas o documento não está pronto
- O frame está prestes a navegar

**Soluções**:

- Esperar pelo carregamento do frame: Usar eventos Page para detectar `Page.frameNavigated` ou `Page.loadEventFired`
- Retentar com um pequeno atraso

#### 4. **Falhas de roteamento de sessão (comando expira ou retorna erro)**

**Causa**:

- O alvo OOPIF foi desanexado (a página navegou ou o iframe foi removido)
- `sessionId` está obsoleto

**Soluções**:

- **Re-anexar ao alvo**: Criar um novo `ConnectionHandler` e re-resolver OOPIF
- **Validar alvo**: Chamar `Target.getTargets()` para checar se o alvo ainda existe

**Depuração**:

```python
# Checa se o alvo da sessão ainda existe
targets = await handler.execute_command(TargetCommands.get_targets())
active_target_ids = [t['targetId'] for t in targets['result']['targetInfos']]
print(f"Alvos ativos: {active_target_ids}")

if iframe._iframe_context and iframe._iframe_context.session_id:
    print(f"Nossa sessão: {iframe._iframe_context.session_id}")
```

### Ferramentas de Diagnóstico

#### Habilitar logs do CDP

```python
import logging
logging.basicConfig(level=logging.DEBUG)
logger = logging.getLogger('pydoll')
logger.setLevel(logging.DEBUG)
```

Isso registra todos os comandos e respostas CDP, útil para rastrear os passos de resolução do iframe.

#### Inspecionar contexto do iframe

```python
iframe = await tab.find(id='my-iframe')
ctx = await iframe.iframe_context

print(f"Frame ID: {ctx.frame_id}")
print(f"Document URL: {ctx.document_url}")
print(f"Execution Context ID: {ctx.execution_context_id}")
print(f"Document Object ID: {ctx.document_object_id}")
print(f"Session ID (OOPIF): {ctx.session_id}")
print(f"Session Handler: {ctx.session_handler}")
```

---

## Conclusão

O manuseio de iframes do Pydoll representa uma implementação sofisticada das capacidades de gerenciamento de frames do CDP. Ao entender:

- **O DOM**: Estrutura em árvore e identificação de nós
- **Iframes**: Contextos de documento independentes e barreiras de segurança
- **OOPIFs**: Isolamento de site e arquitetura baseada em alvos
- **Domínios CDP**: Coordenação de Page, DOM, Target, Runtime
- **Contextos de Execução**: Mundos isolados para automação limpa
- **Identificadores**: Relacionamentos entre backendNodeId, frameId, targetId, sessionId, executionContextId, objectId
- **Pipeline de resolução**: Estratégia de fallback em múltiplos estágios para encontrar frames
- **Roteamento de sessão**: Modo "flattened" e roteamento automático de comandos

você pode apreciar por que a troca manual de contexto é eliminada. A complexidade é real, mas o Pydoll a abstrai por trás de uma API simples e intuitiva:

```python
iframe = await tab.find(id='login-frame')
username = await iframe.find(name='username')
await username.type_text('user@example.com')
```

Três linhas. Sem troca de contexto. Sem anexar alvos. Sem gerenciamento de sessão. Apenas funciona.

---

## Leitura Adicional

- **Especificação do CDP**: [Chrome DevTools Protocol - Domínio Page](https://chromedevtools.github.io/devtools-protocol/tot/Page/)
- **Especificação do CDP**: [Chrome DevTools Protocol - Domínio DOM](https://chromedevtools.github.io/devtools-protocol/tot/DOM/)
- **Especificação do CDP**: [Chrome DevTools Protocol - Domínio Target](https://chromedevtools.github.io/devtools-protocol/tot/Target/)
- **Especificação do CDP**: [Chrome DevTools Protocol - Domínio Runtime](https://chromedevtools.github.io/devtools-protocol/tot/Runtime/)
- **Isolamento de Site do Chromium**: [Site Isolation - The Chromium Projects](https://www.chromium.org/Home/chromium-security/site-isolation/)
- **Scripts de Conteúdo e Mundos Isolados**: [Chrome Extensions - Content Scripts](https://developer.chrome.com/docs/extensions/mv3/content_scripts/)
- **Documentação do Pydoll**: [Análise Aprofundada → Fundamentos → Protocolo Chrome DevTools](./cdp.md)
- **Documentação do Pydoll**: [Funcionalidades → Automação → IFrames](../../features/automation/iframes.md)

---

!!! tip "Filosofia de Design"
    O objetivo do manuseio de iframes do Pydoll é a **automação ergonômica**: escreva código como se iframes não existissem, e deixe a biblioteca lidar com a complexidade. Esta análise aprofundada mostrou o que acontece nos bastidores—mas você nunca precisa pensar sobre isso em seus scripts de automação.

================================================
FILE: docs/pt/deep-dive/fundamentals/index.md
================================================
# Análise Profunda: Fundamentos Essenciais

**Domine a base, e todo o resto se torna mais fácil.**

Esta seção cobre as **tecnologias fundamentais** que impulsionam o Pydoll: o Chrome DevTools Protocol (CDP), a comunicação assíncrona baseada em WebSocket e a integração do sistema de tipos do Python. Estes não são apenas detalhes de implementação, são as **decisões de design fundamentais** que tornam o Pydoll rápido, poderoso e seguro em tipos (type-safe).

## Por que os Fundamentos Importam

A maioria dos frameworks de automação abstrai sua camada de comunicação, deixando você com uma "caixa preta" que funciona até deixar de funcionar. Quando algo quebra, a depuração e a otimização tornam-se difíceis sem entender os mecanismos subjacentes.

**O Pydoll adota uma abordagem diferente**: expomos e explicamos os fundamentos, permitindo que você trabalhe tanto como um **usuário do framework** quanto como um **engenheiro de protocolo**.

!!! quote "O Poder dos Primeiros Princípios"
    **"Se você conhece o caminho amplamente, você o verá em todas as coisas."** - Miyamoto Musashi
    
    Entender o CDP, a comunicação assíncrona e os sistemas de tipos não é apenas sobre o Pydoll, é sobre entender **como a automação de navegador moderna funciona em sua essência**. Esse conhecimento se transfere para qualquer ferramenta baseada em CDP e qualquer projeto Python assíncrono.

## Os Três Pilares

### 1. Chrome DevTools Protocol (CDP)
**[→ Leia a Análise Profunda do CDP](./cdp.md)**

**O protocolo que impulsiona a automação de navegador moderna.**

O CDP é o protocolo de depuração nativo do Chrome, o mesmo que o Chrome DevTools (F12) usa. Ao se comunicar diretamente com o CDP, o Pydoll:

- **Elimina o WebDriver** (sem sobrecarga do Selenium, sem intermediários geckodriver/chromedriver)
- **Ganha controle profundo** (modifica requisições, intercepta eventos, executa operações privilegiadas)
- **Alcança velocidade nativa** (comunicação direta via WebSocket, sem polling HTTP)
- **Torna-se indetectável** (sem `navigator.webdriver`, sem fingerprints de WebDriver)

**O que você aprenderá:**

- Como o CDP organiza a funcionalidade em domínios (Page, Network, DOM, Fetch, etc.)
- A arquitetura de comando/evento que impulsiona a automação reativa
- Por que ferramentas baseadas em CDP são **fundamentalmente mais poderosas** que o Selenium
- Como ler a documentação do CDP e estender o Pydoll

**Por que isso importa**: O CDP não é apenas um detalhe de implementação do Pydoll, é a fundação da automação de navegador moderna. Puppeteer, Playwright e ferramentas similares, todas usam CDP. Entendê-lo uma vez fornece conhecimento aplicável a múltiplas ferramentas.

---

### 2. A Camada de Conexão
**[→ Leia a Arquitetura da Camada de Conexão](./connection-layer.md)**

**Comunicação assíncrona feita da maneira certa.**

Enquanto o CDP define **o que** você pode fazer, a Camada de Conexão define **como** o Pydoll se comunica com o navegador. É aqui que as mensagens de protocolo se tornam objetos Python, onde os padrões async/await permitem concorrência, e onde os WebSockets fornecem comunicação bidirecional em tempo real.

**O que você aprenderá:**

- Arquitetura WebSocket: conexões persistentes, enquadramento de mensagens, keep-alive
- O padrão async/await: por que `async def` e `await` permitem automação concorrente
- Correlação comando/resposta: como o Pydoll associa respostas a requisições
- Despacho de eventos: como eventos do navegador disparam callbacks Python
- Tratamento de erros: gerenciamento de timeout, falhas de conexão, degradação graciosa

**Por que isso importa**: A camada de conexão é a espinha dorsal da comunicação do Pydoll. Entendê-la permite:

- **Depuração eficaz**: Inspecionar mensagens fluindo entre Python e Chrome
- **Otimização de desempenho**: Identificar fontes de latência e paralelizar operações
- **Capacidades de extensão**: Adicionar comandos CDP personalizados ou modificar comportamento existente

---

### 3. Integração com Sistema de Tipos do Python
**[→ Leia a Análise Profunda do Sistema de Tipos](./typing-system.md)**

**Tipos fornecem tanto segurança quanto produtividade.**

O sistema de tipos do Python (introduzido no 3.5, melhorado em cada versão desde então) melhora significativamente a experiência de desenvolvimento. O Pydoll utiliza `TypedDict`, `Literal`, `overload` e genéricos para fornecer:

- **Autocompletar da IDE** para campos de resposta do CDP
- **Verificação de tipos (Type checking)** para pegar bugs antes do tempo de execução (`mypy`, `pyright`)
- **Código autodocumentado** (assinaturas de função revelam a estrutura)
- **Segurança na refatoração** (renomeie um campo, a IDE atualiza todos os usos)

**O que você aprenderá:**

- Como `TypedDict` modela estruturas de eventos/respostas do CDP
- Por que `overload` fornece tipos de retorno precisos para `find()`/`query()`
- Como genéricos (`TypeVar`, `Generic[T]`) permitem construção flexível de comandos
- Padrões práticos: anotar callbacks, tipar funções assíncronas, usar `Literal`
- Integração de ferramentas: configurar mypy, aproveitar a inferência de tipos da IDE

**Por que isso importa**: Dicas de tipo (type hints) tornaram-se cada vez mais importantes no Python moderno. A cobertura abrangente de tipos do Pydoll significa:

- **Desenvolvimento mais rápido**: Autocompletar revela campos e métodos disponíveis
- **Menos bugs**: Verificador de tipos pega erros antes que cheguem à produção
- **Melhor refatoração**: Mude assinaturas com confiança com suporte da IDE

---

## Como Esses Fundamentos se Conectam

Entender como CDP, comunicação assíncrona e sistemas de tipos funcionam **juntos** é a chave:

```mermaid
graph TB
    Python[Código Python:<br/>await tab.go_to#40;url#41;]
    
    Python --> TypeSystem[Sistema de Tipos:<br/>Assinatura da função revela<br/>parâmetros e tipo de retorno]
    
    TypeSystem --> ConnectionLayer[Camada de Conexão:<br/>Serializa comando para JSON,<br/>envia via WebSocket]
    
    ConnectionLayer --> CDP[CDP:<br/>Navegador recebe<br/>comando Page.navigate]
    
    CDP --> Browser[Chrome:<br/>Executa navegação,<br/>emite eventos]
    
    Browser --> CDPEvents[Eventos CDP:<br/>Page.loadEventFired,<br/>Network.requestWillBeSent]
    
    CDPEvents --> ConnectionLayer2[Camada de Conexão:<br/>Desserializa eventos,<br/>despacha para callbacks]
    
    ConnectionLayer2 --> TypedDicts[TypedDict:<br/>Dados do evento como<br/>dicionário tipado]
    
    TypedDicts --> PythonCallback[Callback Python:<br/>IDE mostra campos disponíveis<br/>via inferência de tipo]
```

**O fluxo**:

1.  Você escreve código Python com **anotações de tipo** (Sistema de Tipos)
2.  O código serializa para JSON e envia via **WebSocket** (Camada de Conexão)
3.  O navegador recebe e executa **comandos CDP** (CDP)
4.  O navegador emite **eventos CDP** de volta (CDP)
5.  Eventos desserializam em **instâncias de TypedDict** (Sistema de Tipos)
6.  Seus callbacks recebem **objetos de evento com tipos seguros** (Sistema de Tipos)

Cada camada **amplifica** as outras:

- Tipos tornam as respostas do CDP descobríveis
- O modelo de eventos do CDP permite padrões assíncronos
- A comunicação assíncrona torna os tipos essenciais (quais campos existem nesta resposta?)

## Trilha de Aprendizagem

Recomendamos esta progressão:

### Passo 1: CDP
**[Comece Aqui: Chrome DevTools Protocol](./cdp.md)**

Entenda o protocolo que impulsiona tudo. Aprenda domínios, comandos, eventos e como ler a documentação do CDP.

**Resultado**: Você saberá como encontrar e usar qualquer recurso do CDP, não apenas o que o Pydoll expõe.

### Passo 2: Camada de Conexão
**[Continue: Arquitetura da Camada de Conexão](./connection-layer.md)**

Análise profunda da comunicação WebSocket, padrões assíncronos e despacho de eventos.

**Resultado**: Você entenderá exatamente como as mensagens fluem entre Python e Chrome, permitindo depuração e otimização.

### Passo 3: Sistema de Tipos
**[Termine: Sistema de Tipos do Python](./typing-system.md)**

Aprenda como o Pydoll usa a tipagem moderna do Python para segurança e produtividade.

**Resultado**: Você escreverá automação com segurança de tipos e suporte total da IDE, detectando bugs antes mesmo de o código ser executado.

## Pré-requisitos

Para tirar o máximo proveito desta seção:

- **Fundamentos de Python** - Funções, classes, decoradores
- **Básico de async/await** - Entender as palavras-chave `async def` e `await`
- **Familiaridade com JSON** - Saber como objetos/arrays serializam
- **Browser DevTools** - Ter usado o Inspetor do Chrome (F12)

**Se você é novo em Python assíncrono**, leia isto primeiro: [Real Python: Async IO in Python](https://realpython.com/async-io-python/)

## Além do Básico

Uma vez que você dominar esses fundamentos, estará pronto para:

- **[Arquitetura Interna](../architecture/browser-domain.md)** - Como os componentes do Pydoll se encaixam
- **[Rede e Segurança](../network/index.md)** - Entendimento em nível de protocolo para proxies
- **[Fingerprinting](../fingerprinting/index.md)** - Técnicas de detecção que exigem conhecimento de CDP

## Perguntas Comuns

### "Preciso entender isso para usar o Pydoll?"

**Não**, mas entender esses fundamentos o tornará mais eficaz. O uso básico funciona bem sem esse conhecimento. No entanto, quando você precisar:

- Depurar por que algo não está funcionando
- Otimizar automação lenta
- Estender o Pydoll com comandos CDP personalizados
- Entender mensagens de erro
- Contribuir para o projeto

Esses fundamentos se tornam muito úteis.

### "Isso não é muito baixo nível?"

Este nível de detalhe é intencional. A maioria dos frameworks esconde esses fundamentos, mas essa abstração tem seus custos (trade-offs):

- Entendimento permite melhor depuração
- Visibilidade permite otimização
- Conhecimento permite extensão

Ao ensinar os fundamentos, permitimos que você vá além do que o Pydoll oferece de fábrica.

### "Quanto disso eu preciso memorizar?"

**Nada.** O objetivo é construir modelos mentais, não memorização. Após ler estas seções, você desenvolverá intuição para:

- "Isso precisa de CDP, deixe-me checar a documentação do protocolo"
- "Isso está lento por causa de awaits sequenciais, deixe-me paralelizar"
- "Este erro de tipo significa que estou usando o nome de campo errado"

Os detalhes específicos desaparecem, mas o entendimento permanece.

## Filosofia

Esses fundamentos representam conhecimento duradouro:

- **CDP** é o protocolo nativo do Chrome e continua a evoluir
- **Async/await** é o padrão do Python para concorrência
- **Sistemas de tipos** são cada vez mais importantes no Python (PEP 484 em diante)

Aprender esses conceitos agrega valor ao longo de sua carreira de desenvolvimento.

---

## Pronto para Construir Sua Base?

Comece com **[Chrome DevTools Protocol](./cdp.md)** para entender o protocolo que impulsiona tudo. Em seguida, progrida pela Camada de Conexão e Sistema de Tipos para completar seu entendimento fundamental.

**É aqui que a automação se torna engenharia.**

---

!!! tip "Após Completar os Fundamentos"
    Uma vez que você dominar esses conceitos, você os verá em **toda parte** na arquitetura do Pydoll:
    
    - Browser/Tab/WebElement todos usam a **Camada de Conexão**
    - Eventos de rede todos seguem o **modelo de eventos do CDP**
    - Todas as respostas usam **TypedDict** para segurança de tipos
    
    Os fundamentos não estão separados do Pydoll, eles **são** a fundação do Pydoll.

================================================
FILE: docs/pt/deep-dive/fundamentals/typing-system.md
================================================
# O Sistema de Tipos do Python e o Pydoll

O Pydoll utiliza extensivamente o sistema de tipos do Python para fornecer excelente suporte de IDE, detectar erros precocemente e tornar a API autodocumentada. Este guia explica o básico das dicas de tipo (type hints) e como o Pydoll as utiliza para aprimorar sua experiência de desenvolvimento.

## O Básico de Dicas de Tipo (Type Hints)

Dicas de tipo são anotações opcionais que especificam o tipo de valor que uma variável, parâmetro ou valor de retorno deve ter. Elas não afetam o comportamento em tempo de execução, mas habilitam ferramentas poderosas.

### Dicas de Tipo Simples

```python
# Tipos básicos
name: str = "Pydoll"
port: int = 9222
is_headless: bool = False
quality: float = 0.85

# Anotações de função
def navigate(url: str, timeout: int = 30) -> bool:
    # ... implementação
    return True
```

### Tipos de Contêineres

```python
from typing import List, Dict, Optional

# Listas e dicionários
urls: List[str] = ['https://example.com', 'https://google.com']
headers: Dict[str, str] = {'User-Agent': 'MyBot/1.0'}

# Valores opcionais (podem ser None)
target_id: Optional[str] = None

# Sintaxe moderna (Python 3.9+)
urls: list[str] = ['https://example.com']
headers: dict[str, str] = {'User-Agent': 'MyBot/1.0'}
```

!!! tip "Sintaxe do Python 3.9+"
    O código-fonte do Pydoll usa a sintaxe mais antiga `List[]`, `Dict[]` para compatibilidade retroativa, mas você pode usar `list[]`, `dict[]` em minúsculas no seu código se estiver usando Python 3.9+.

## TypedDict: Dicionários Estruturados

O `TypedDict` permite definir estruturas de dicionário com chaves e tipos de valor específicos. Isso é **amplamente utilizado** nas definições de protocolo CDP do Pydoll.

### TypedDict Básico

```python
from typing import TypedDict

class UserInfo(TypedDict):
    name: str
    age: int
    email: str

# A IDE sabe exatamente quais chaves existem
user: UserInfo = {
    'name': 'Alice',
    'age': 30,
    'email': 'alice@example.com'
}

# O Autocomplete funciona!
print(user['name'])  # IDE sugere: name, age, email
```

### Como o Pydoll Usa o TypedDict

O Pydoll define **cada comando, resposta e evento do CDP** como um TypedDict. Isso significa que sua IDE sabe exatamente quais propriedades estão disponíveis:

```python
# De pydoll/protocol/page/methods.py
class CaptureScreenshotParams(TypedDict, total=False):
    """Parâmetros para captureScreenshot."""
    format: ScreenshotFormat
    quality: int
    clip: Viewport
    fromSurface: bool
    captureBeyondViewport: bool
    optimizeForSpeed: bool

class CaptureScreenshotResult(TypedDict):
    """Resultado para o comando captureScreenshot."""
    data: str
```

Quando você chama métodos que retornam respostas do CDP, sua IDE autocompleta as chaves da resposta:

```python
async def example():
    response = await tab._execute_command(PageCommands.capture_screenshot())
    
    # A IDE sabe que esta é uma CaptureScreenshotResponse
    # e sugere 'result' -> 'data'
    screenshot_data = response['result']['data']  # Autocomplete completo!
```

### Campos Opcionais vs Obrigatórios

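O TypedDict suporta campos opcionais usando `NotRequired[]` (disponível em `typing` a partir do Python 3.11; em versões anteriores, importe de `typing_extensions`):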

```python
from typing import TypedDict, NotRequired

# De pydoll/protocol/network/methods.py
class GetCookiesParams(TypedDict):
    """Parâmetros para recuperar cookies do navegador."""
    urls: NotRequired[list[str]]  # Este campo é opcional
```

A flag `total=False` torna **todos** os campos opcionais:

```python
class CaptureScreenshotParams(TypedDict, total=False):
    format: ScreenshotFormat  # Todos os campos são opcionais
    quality: int
    clip: Viewport
```

!!! info "Mágica do Autocomplete"
    Quando você digita `response['`, sua IDE mostra todas as chaves disponíveis com seus tipos. Este é o superpoder do TypedDict em ação!

## Enums: Constantes com Tipo Seguro (Type-Safe)

Enums (enumerações) fornecem constantes com tipo seguro que sua IDE pode autocompletar. O Pydoll os usa extensivamente para valores CDP.

### Enums Básicos

```python
from enum import Enum

class ScreenshotFormat(str, Enum):
    JPEG = 'jpeg'
    PNG = 'png'
    WEBP = 'webp'

# IDE autocompleta os formatos disponíveis
format = ScreenshotFormat.PNG  # O tipo é ScreenshotFormat
print(format.value)  # 'png'
```

### Uso de Enums no Pydoll

```python
from pydoll.constants import Key
from pydoll.protocol.page.types import ScreenshotFormat
from pydoll.protocol.input.types import KeyModifier

# Encontrando elementos - usa kwargs, não enums
element = await tab.find(id='submit-btn')
element = await tab.find(class_name='btn-primary')
element = await tab.find(tag_name='button')

# Entrada de teclado - IDE sugere todas as teclas
await element.press_keyboard_key(Key.ENTER)
await element.press_keyboard_key(Key.TAB)
await element.press_keyboard_key(Key.ESCAPE)

# Modificadores são enums inteiros (para teclas especiais)
await element.press_keyboard_key(Key.TAB, modifiers=KeyModifier.SHIFT)

# Enum de formato de captura de tela
await tab.take_screenshot('file.webp', format=ScreenshotFormat.WEBP)
```

!!! tip "Autocomplete de Enum"
    Digite `Key.` ou `ScreenshotFormat.` e sua IDE mostrará todas as opções disponíveis. Chega de memorizar strings!

## Sobrecarga de Funções (Function Overloads)

Sobrecargas permitem que uma função retorne tipos diferentes com base em seus parâmetros. O Pydoll usa isso para fornecer informações de tipo precisas.

### Exemplo Básico de Sobrecarga

```python
from typing import overload

# Assinaturas de sobrecarga (não executadas)
@overload
def process(data: str) -> str: ...

@overload
def process(data: int) -> int: ...

# Implementação real
def process(data):
    return data * 2

# A IDE conhece os tipos de retorno
result1 = process("hello")  # Tipo: str
result2 = process(42)       # Tipo: int
```

### Uso de Sobrecarga no Pydoll

Os métodos `find()` e `query()` retornam tipos diferentes dependendo do parâmetro `find_all`:

```python
# De pydoll/elements/mixins/find_elements_mixin.py
class FindElementsMixin:
    @overload
    async def find(
        self, find_all: Literal[False] = False, **kwargs
    ) -> WebElement: ...
    
    @overload
    async def find(
        self, find_all: Literal[True], **kwargs
    ) -> list[WebElement]: ...
    
    async def find(
        self, find_all: bool = False, **kwargs
    ) -> Union[WebElement, list[WebElement]]:
        # Implementação...
```

No seu código:

```python
# find_all=False (padrão) - A IDE sabe que o tipo de retorno é WebElement
button = await tab.find(id='submit-btn')
await button.click()  # Métodos de elemento único disponíveis!

# find_all=True - A IDE sabe que o tipo de retorno é list[WebElement]
buttons = await tab.find(class_name='btn', find_all=True)
for btn in buttons:  # A IDE sabe que isso é uma lista!
    await btn.click()

# O mesmo com query()
element = await tab.query('#submit-btn')  # Tipo: WebElement
elements = await tab.query('.btn', find_all=True)  # Tipo: list[WebElement]
```

!!! tip "Inferência de Tipo Inteligente"
    Sua IDE sabe automaticamente se você está obtendo um único elemento ou uma lista com base no parâmetro `find_all`. Não é necessário casting ou asserções de tipo!

## Tipos Genéricos (Generic Types)

Genéricos são como "contêineres de tipo" que funcionam com tipos diferentes enquanto preservam a informação de tipo. Pense neles como modelos que se adaptam ao que você coloca dentro.

### Entendendo Genéricos: Uma Analogia Simples

Imagine uma `Caixa` que pode conter qualquer coisa. Sem genéricos:

```python
# Sem genéricos - A IDE não sabe o que está dentro
class Box:
    def __init__(self, content):
        self.content = content
    
    def get(self):
        return self.content

my_box = Box("hello")
item = my_box.get()  # Tipo: Unknown - poderia ser qualquer coisa!
```

Com genéricos:

```python
from typing import Generic, TypeVar

T = TypeVar('T')  # T é um "marcador de posição de tipo"

class Box(Generic[T]):
    def __init__(self, content: T):
        self.content = content
    
    def get(self) -> T:
        return self.content

# Agora a IDE sabe exatamente o que está dentro de cada caixa
string_box: Box[str] = Box("hello")
item1 = string_box.get()  # Tipo: str

number_box: Box[int] = Box(42)
item2 = number_box.get()  # Tipo: int

# List é um genérico embutido
numbers: list[int] = [1, 2, 3]  # Lista que contém ints
names: list[str] = ["Alice", "Bob"]  # Lista que contém strs
```

!!! tip "Genéricos Simplificam Dicas de Tipo"
    Em vez de escrever `Union[List[str], List[int], List[float], ...]` para todo tipo de lista possível, genéricos permitem que você escreva um `list[T]` reutilizável que se adapta ao que você coloca dentro.

### Exemplo de Genérico do Mundo Real

```python
from typing import TypeVar, Generic

T = TypeVar('T')

class Response(Generic[T]):
    """Um wrapper de resposta de API genérico."""
    def __init__(self, data: T, status: int):
        self.data = data
        self.status = status
    
    def get_data(self) -> T:
        return self.data

# Cada resposta preserva seu tipo de dado
user_response: Response[dict] = Response({"name": "Alice"}, 200)
user_data = user_response.get_data()  # Tipo: dict

count_response: Response[int] = Response(42, 200)
count = count_response.get_data()  # Tipo: int
```

### Como o Pydoll Usa Genéricos

O sistema de comandos CDP do Pydoll usa genéricos para garantir que o tipo de resposta corresponda ao comando:

```python
# De pydoll/protocol/base.py
from typing import Generic, TypeVar

T_CommandParams = TypeVar('T_CommandParams')
T_CommandResponse = TypeVar('T_CommandResponse')

class Command(TypedDict, Generic[T_CommandParams, T_CommandResponse]):
    """Estrutura base para todos os comandos."""
    id: NotRequired[int]
    method: str
    params: NotRequired[T_CommandParams]

class Response(TypedDict, Generic[T_CommandResponse]):
    """Estrutura base para todas as respostas."""
    id: int
    result: T_CommandResponse
```

Isso significa que quando você executa um comando, o tipo de resposta é automaticamente inferido:

```python
# PageCommands.navigate retorna Command[NavigateParams, NavigateResult]
command = PageCommands.navigate('https://example.com')

# ConnectionHandler.execute_command preserva o tipo genérico
response = await connection_handler.execute_command(command)

# A IDE sabe que response['result'] é NavigateResult (não apenas "qualquer dict")
frame_id = response['result']['frameId']  # Autocomplete funciona!
loader_id = response['result']['loaderId']  # Todos os campos são conhecidos!
```

!!! info "Por que Genéricos Importam no Pydoll"
    Sem genéricos, cada resposta CDP seria apenas tipada como `dict[str, Any]`, e você perderia todo o autocomplete. Com genéricos, a IDE sabe a estrutura exata de cada resposta com base em qual comando você enviou.

## Tipos de União (Union Types)

Uniões representam valores que podem ser de um de vários tipos:

```python
from typing import Union

# Pode ser string ou int
identifier: Union[str, int] = "user-123"
identifier = 456  # Também válido

# Sintaxe moderna (Python 3.10+)
identifier: str | int = "user-123"
```

### Uso de União no Pydoll

```python
# Caminhos de arquivo podem ser strings ou objetos Path
from pathlib import Path

async def upload_file(files: Union[str, Path, list[Union[str, Path]]]):
    # Lida com múltiplos tipos de entrada
    pass

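# Todos estes funcionam (expect_file_chooser é um gerenciador de contexto assíncrono):
async with tab.expect_file_chooser('/path/to/file.txt'):
    await upload_button.click()
async with tab.expect_file_chooser(Path('/path/to/file.txt')):
    await upload_button.click()
async with tab.expect_file_chooser(['/file1.txt', Path('/file2.txt')]):
    await upload_button.click()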
```

## Benefícios Práticos no Pydoll

### 1. Autocomplete Inteligente

Sua IDE sugere chaves, métodos e valores disponíveis:

```python
from pydoll.protocol.page.events import PageEvent
from pydoll.protocol.network.types import ResourceType
from pydoll.protocol.input.types import KeyModifier
from pydoll.constants import Key

# Autocomplete para nomes de eventos
await tab.on(PageEvent.LOAD_EVENT_FIRED, callback)
await tab.on(PageEvent.JAVASCRIPT_DIALOG_OPENING, callback)

# Autocomplete para tipos de recursos
await tab.enable_fetch_events(resource_type=ResourceType.XHR)
await tab.enable_fetch_events(resource_type=ResourceType.DOCUMENT)

# Autocomplete para teclas
await element.press_keyboard_key(Key.ENTER)
await element.press_keyboard_key(Key.TAB, modifiers=KeyModifier.SHIFT)

# Autocomplete para kwargs em find()
element = await tab.find(id='submit-btn')  # IDE sugere: id, class_name, tag_name, etc.
```

### 2. Pegue Erros Cedo

Verificadores de tipo como mypy ou Pylance pegam erros antes do tempo de execução:

```python
# Verificador de tipo pega isso
await tab.take_screenshot('file.png', quality='high')  # Erro: quality deve ser int

# Verificador de tipo pega isso
event = await tab.find(id='button')
await tab.on(event, callback)  # Erro: event é WebElement, não str

# Correto
await tab.take_screenshot('file.png', quality=90)
await tab.on(PageEvent.LOAD_EVENT_FIRED, callback)
```

### 3. Código Autodocumentado

Os tipos servem como documentação embutida:

```python
# Você sabe imediatamente o que cada parâmetro espera
async def take_screenshot(
    self,
    path: Optional[str] = None,
    quality: int = 100,
    beyond_viewport: bool = False,
    as_base64: bool = False,
) -> Optional[str]:
    pass
```

### 4. Navegação em Respostas CDP

Navegue em respostas CDP complexas com confiança:

```python
# De pydoll/protocol/browser/methods.py
class GetVersionResult(TypedDict):
    protocolVersion: str
    product: str
    revision: str
    userAgent: str
    jsVersion: str

# No seu código
version_info = await browser.get_version()

# IDE sugere todas as chaves disponíveis
print(version_info['product'])         # Autocomplete!
print(version_info['userAgent'])       # Autocomplete!
print(version_info['protocolVersion']) # Autocomplete!
```

## Verificando Tipos no Seu Código

### Usando Pylance (VS Code)

O Pylance fornece verificação de tipos em tempo real no VS Code:

1.  Instale a extensão Pylance
2.  Defina o modo de verificação de tipos nas configurações:

```json
{
    "python.analysis.typeCheckingMode": "basic"  // ou "strict"
}
```

Agora você obtém feedback instantâneo:

```python
from pydoll.browser.chromium import Chrome

async def main():
    async with Chrome() as browser:
        tab = await browser.start()
        
        # Pylance mostra os tipos dos parâmetros enquanto você digita
        await tab.go_to('https://example.com', timeout=30)
        
        # Pylance avisa sobre tipos errados
        await tab.take_screenshot(quality='high')  # Aviso!
```

### Usando mypy

Execute o mypy para verificar seu projeto inteiro:

```bash
pip install mypy
mypy your_script.py
```

Exemplo de saída:

```
your_script.py:10: error: Argument "quality" to "take_screenshot" has incompatible type "str"; expected "int"
Found 1 error in 1 file (checked 1 source file)
```

## Sistema de Tipos de Protocolo do Pydoll

O diretório `protocol/` do Pydoll contém definições de tipo abrangentes para todo o Chrome DevTools Protocol:

```
pydoll/protocol/
├── base.py              # Tipos genéricos Command, Response, CDPEvent
├── browser/
│   ├── events.py        # Enum BrowserEvent, TypedDicts de parâmetros de evento
│   ├── methods.py       # Enums de métodos do Browser, TypedDicts de parâmetro/resultado
│   └── types.py         # Tipos do domínio Browser (Bounds, PermissionType, etc.)
├── dom/
│   ├── events.py        # Definições de eventos DOM
│   ├── methods.py       # Definições de comandos DOM
│   └── types.py         # Tipos DOM (Node, BackendNode, etc.)
├── page/
│   ├── events.py        # Eventos de Page (LOAD_EVENT_FIRED, etc.)
│   ├── methods.py       # Métodos de Page (navigate, captureScreenshot, etc.)
│   └── types.py         # Tipos de Page (Frame, ScreenshotFormat, etc.)
├── network/
│   └── ...              # Tipos do domínio Network
└── ...                  # Outros domínios CDP
```

### Exemplo: Fluxo de Tipo Completo

Vamos rastrear um fluxo de tipo completo, do comando à resposta:

```python
# 1. Enum de Método (protocol/page/methods.py)
class PageMethod(str, Enum):
    CAPTURE_SCREENSHOT = 'Page.captureScreenshot'

# 2. TypedDict de Parâmetro (protocol/page/methods.py)
class CaptureScreenshotParams(TypedDict, total=False):
    format: ScreenshotFormat
    quality: int
    clip: Viewport

# 3. TypedDict de Resultado (protocol/page/methods.py)
class CaptureScreenshotResult(TypedDict):
    data: str

# 4. Criação do Comando (commands/page_commands.py)
class PageCommands:
    @staticmethod
    def capture_screenshot(
        format: Optional[ScreenshotFormat] = None,
        quality: Optional[int] = None,
        ...
    ) -> Command[CaptureScreenshotParams, CaptureScreenshotResult]:
        return {
            'method': PageMethod.CAPTURE_SCREENSHOT,
            'params': {...}
        }

# 5. Uso na Tab (browser/tab.py)
class Tab:
    async def take_screenshot(...) -> Optional[str]:
        response: CaptureScreenshotResponse = await self._execute_command(
            PageCommands.capture_screenshot(...)
        )
        screenshot_data = response['result']['data']  # Totalmente tipado!
        return screenshot_data
```

Cada etapa mantém a informação de tipo, dando a você autocomplete e verificação de tipos por toda parte!

## Melhores Práticas

### 1. Deixe os Tipos do Pydoll Guiarem Você

Não lute contra os tipos, eles estão lá para ajudar:

```python
# Bom: Use kwargs (IDE autocompleta nomes de parâmetros)
element = await tab.find(id='submit-btn')
button = await tab.find(class_name='btn-primary')

# Bom: Use enums onde aplicável
from pydoll.constants import Key
await element.press_keyboard_key(Key.ENTER)

# Evite: Strings mágicas
await element.press_keyboard_key('Enter')  # Sem autocomplete, propenso a erros
```

### 2. Explore os Tipos na Sua IDE

Passe o mouse sobre as variáveis para ver seus tipos:

```python
# Passe o mouse sobre 'response' para ver: Response[CaptureScreenshotResult]
response = await tab._execute_command(PageCommands.capture_screenshot(...))

# Passe o mouse sobre 'data' para ver: str
data = response['result']['data']
```


### 3. Não Anote em Excesso

Os verificadores de tipos (mypy, Pyright etc.) inferem bem os tipos óbvios; não anote tudo:

```python
# Demais
name: str = "Alice"
count: int = 5
is_active: bool = True

# Deixe o Python inferir literais simples
name = "Alice"
count = 5
is_active = True

# Anote quando o tipo não for óbvio
from typing import Optional

result: Optional[WebElement] = await tab.find(id='missing', raise_exc=False)
```

## Aprenda Mais

Para um entendimento mais profundo do sistema de tipos do Python e do protocolo CDP:

- **[Documentação de typing do Python](https://docs.python.org/3/library/typing.html)**: Referência oficial de typing do Python
- **[PEP 484](https://peps.python.org/pep-0484/)**: A proposta original das dicas de tipo
- **[Chrome DevTools Protocol](https://chromedevtools.github.io/devtools-protocol/)**: Documentação do CDP
- **[Análise Profunda: CDP](./cdp.md)**: Como o Pydoll implementa o CDP
- **[Referência da API: Protocol](../api/protocol/base.md)**: Definições de tipo de protocolo do Pydoll

O sistema de tipos transforma o Pydoll de uma simples biblioteca de automação em um framework **seguro em tipos, autodocumentado e amigável à IDE**. Ele pega bugs antes que aconteçam e torna a exploração da API muito mais fácil!

================================================
FILE: docs/pt/deep-dive/guides/index.md
================================================
# Guias Práticos

**A teoria encontra a prática, padrões acionáveis para desafios reais de automação.**

Enquanto as outras seções de Análise Profunda exploram **fundamentos** e **arquitetura**, esta seção fornece **guias práticos e testados em batalha** para cenários comuns de automação. Estes não são exercícios acadêmicos, são padrões refinados através do uso em produção.

## O Propósito dos Guias

Você aprendeu:

- **[Fundamentos](../fundamentals/cdp.md)** - CDP, async, tipos
- **[Arquitetura](../architecture/browser-domain.md)** - Padrões de design interno
- **[Rede](../network/index.md)** - Protocolos e proxies
- **[Fingerprinting](../fingerprinting/index.md)** - Detecção e evasão

E agora? **Como você aplica esse conhecimento a problemas reais?**

É para isso que servem os guias: **fazer a ponte entre teoria e prática**.

!!! quote "Sabedoria Prática"
    **"Na teoria, teoria e prática são a mesma coisa. Na prática, não são."** - Yogi Berra
    
    Os guias destilam conhecimento técnico complexo em **padrões acionáveis** que você pode usar imediatamente. Eles mostram **o que funciona** em produção, não apenas o que é teoricamente possível.

## Guias Atuais

### Seletores CSS vs XPath
**[→ Leia o Guia de Seletores](./selectors-guide.md)**

**O eterno debate, resolvido com dados e melhores práticas.**

Escolher entre seletores CSS e XPath não é sobre preferência. É sobre entender **trocas (tradeoffs)**, **características de desempenho** e **manutenibilidade**.

**O que você aprenderá**:

- **Comparação de sintaxe** - Exemplos lado a lado para padrões comuns
- **Benchmarks de desempenho** - Medições reais, não mitos
- **Poder vs simplicidade** - Quando o CSS não é suficiente (correspondência de texto, eixos)
- **Suporte do navegador** - Compatibilidade e casos extremos
- **Melhores práticas** - Quando usar cada um, anti-padrões a evitar
- **Exemplos complexos** - Desafios de seletores do mundo real resolvidos

**Por que isso importa**: A localização de elementos é a **base** da automação. Escolha a ferramenta errada, e você lutará com seus seletores para sempre. Escolha sabiamente, e a automação se torna direta.

---

## Em Breve

### Asyncio e Automação Concorrente
**Chegando em futuras versões**

**Análise profunda do asyncio do Python: internos do loop de eventos, padrões práticos de concorrência e exemplos do mundo real.**

Entender o asyncio é fundamental para o Pydoll. Este guia fornece uma análise abrangente do loop de eventos do Python, primitivas de concorrência e como aplicá-las à automação de navegador sem armadilhas (footguns).

**Cobrirá**:

- **Internos do Loop de Eventos**: Como `asyncio.run()` funciona, agendamento de tarefas e fluxo de execução
- **Análise Profunda de Async/Await**: Corrotinas, futuros (futures) e a máquina de estados assíncrona
- **Primitivas de Concorrência**: `gather()`, `create_task()`, `TaskGroup`, e quando usar cada um
- **Limitação de Taxa (Rate Limiting)**: Semáforos, filas e estratégias de throttling
- **Exemplos do Mundo Real**: Raspagem multi-abas, preenchimento de formulário paralelo, instâncias de navegador coordenadas
- **Armadilhas Comuns**: Bloquear o loop de eventos, cancelamento de tarefas, propagação de exceções
- **Análise de Desempenho**: Profiling de código assíncrono, identificando gargalos, otimizando I/O

**Por que isso importa**: O Asyncio move a arquitetura do Pydoll. Domine-o, e você desbloqueará a verdadeira automação concorrente sem condições de corrida (race conditions) ou corrupção de estado.

---

### Padrões Arquiteturais e Seletores Robustos
**Chegando em futuras versões**

**Padrão PageObject, seletores sustentáveis e abordagens arquiteturais para automação escalável.**

Vá além de scripts ad-hoc para arquiteturas de automação estruturadas e sustentáveis. Aprenda padrões que escalam de scripts simples para sistemas de produção.

**Cobrirá**:

- **Padrão PageObject**: Encapsulando estrutura da página, reduzindo duplicação, melhorando manutenibilidade
- **Estratégias de Seletores Robustos**: Construindo seletores que sobrevivem a mudanças na página, evitando localizadores frágeis
- **Abstração de Componentes**: Componentes reutilizáveis para padrões comuns de UI (modais, dropdowns, tabelas)
- **Estratégias de Espera**: Padrões de espera inteligentes além de simples timeouts
- **Gerenciamento de Estado**: Gerenciando o estado da automação através de páginas e fluxos
- **Padrões de Teste**: Como estruturar código de automação para testabilidade
- **Arquitetura do Mundo Real**: Estrutura e organização de projeto prontas para produção

**Por que isso importa**: A diferença entre scripts descartáveis e sistemas de automação sustentáveis é a arquitetura. Aprenda padrões que tornam seu código resiliente a mudanças.

---

## Filosofia dos Guias

Os guias seguem princípios consistentes:

### 1. Código Pronto para Produção
Todos os exemplos são **completos e testados**, não pseudocódigo ou demonstrações simplificadas. Você pode copiar, colar e adaptar às suas necessidades.

### 2. Cenários do Mundo Real
Os guias abordam **problemas reais** encontrados na automação de produção, não exemplos artificiais.

### 3. Análise de Tradeoffs (Trocas)
Quando existem múltiplas abordagens, os guias as **comparam** objetivamente com prós/contras, não apenas "aqui está uma maneira".

### 4. Complexidade Progressiva
Comece simples, adicione complexidade incrementalmente. Padrão básico primeiro, depois casos extremos e variações avançadas.

### 5. Anti-Padrões Destacados
Os guias mostram explicitamente **o que NÃO fazer**: erros comuns identificados em revisões de código ou na depuração em produção.

## Como Usar os Guias

Guias são **material de referência**, não tutoriais sequenciais:

- **Examine** em busca de padrões relevantes para o seu problema atual
- **Marque (Bookmark)** guias que você precisará repetidamente
- **Adapte** exemplos ao seu contexto específico
- **Combine** padrões de múltiplos guias

- Não leia sequencialmente de capa a capa.
- Não copie cegamente sem entender os tradeoffs.
- Não use padrões desatualizados (verifique a data de publicação).

## Contribuindo com Guias

Tem um padrão que vale a pena compartilhar? Os guias são **impulsionados pela comunidade**:

**O que faz um bom guia**:

- Resolve um **problema real** encontrado em produção
- Fornece **código funcional**, não apenas conceitos
- Compara **múltiplas abordagens** com tradeoffs
- Destaca **erros comuns** explicitamente
- Explica **por quê**, não apenas **como**

Veja [Contribuindo](../../CONTRIBUTING.md) para diretrizes de submissão.

## Guias vs Documentação de Funcionalidades

**Confuso sobre a diferença?**

|| Documentação de Funcionalidades | Guias de Análise Profunda |
|---|---|---|
| **Propósito** | Ensinar o que o Pydoll pode fazer | Mostrar como resolver problemas |
| **Escopo** | Método/funcionalidade única | Múltiplas funcionalidades combinadas |
| **Profundidade** | Referência de API + exemplos | Padrões + tradeoffs + melhores práticas |
| **Ordem** | Estruturado por componente | Estruturado por problema |
| **Exemplos** | Simples, isolados | Complexos, prontos para produção |

- **Use Funcionalidades para**: Aprender a API do Pydoll
- **Use Guias para**: Resolver desafios reais de automação

## Além dos Guias

Após dominar os padrões práticos:

- **[Arquitetura](../architecture/browser-domain.md)** - Entenda por que os padrões funcionam
- **[Rede](../network/index.md)** - Otimização em nível de rede
- **[Fingerprinting](../fingerprinting/evasion-techniques.md)** - Técnicas anti-detecção

Guias fornecem **valor imediato**. Arquitetura fornece **entendimento profundo**. Ambos tornam você eficaz.

---

## Pronto para Padrões Práticos?

Comece com **[Seletores CSS vs XPath](./selectors-guide.md)** para dominar a localização de elementos, a fundação de toda automação.

**Mais guias em breve. Marque o repositório com estrela (Star) para se manter atualizado!**

---

!!! tip "Solicite um Guia"
    Tem um padrão de automação que você gostaria de ver documentado? Abra uma issue intitulada "Solicitação de Guia: [Tópico]" descrevendo:
    
    - O problema que você está tentando resolver
    - O que você tentou até agora
    - Por que a documentação existente não cobre isso
    
    Nós priorizamos guias com base na necessidade da comunidade.

## Referência Rápida

**Disponível Agora:**

- [Seletores CSS vs XPath](./selectors-guide.md)

**Em Breve:**

- Asyncio e Automação Concorrente
- Padrões Arquiteturais e Seletores Robustos

**Cronograma**: Novos guias adicionados com base no feedback da comunidade e aprendizados de produção.

================================================
FILE: docs/pt/deep-dive/guides/selectors-guide.md
================================================
# Seletores CSS vs XPath: Um Guia Completo

Ao usar o método `query()`, você tem duas poderosas linguagens de seletores à sua disposição: Seletores CSS e XPath. Entender quando e como usar cada um é crucial para a localização eficaz de elementos.

## Diferenças Fundamentais

| Aspecto | Seletor CSS | XPath |
|---|---|---|
| **Sintaxe** | Simples, semelhante a CSS | Linguagem de caminho XML |
| **Desempenho** | Mais rápido (suporte nativo do navegador) | Ligeiramente mais lento |
| **Direção** | Atravessa apenas para baixo e lateralmente | Pode atravessar em qualquer direção |
| **Correspondência de Texto** | Limitada (pseudo-seletores) | Funções de texto poderosas |
| **Complexidade** | Melhor para casos simples a moderados | Excelente em relacionamentos complexos |
| **Legibilidade** | Mais intuitivo para desenvolvedores web | Curva de aprendizado mais íngreme |

## Quando Usar Seletores CSS

Seletores CSS são ideais para:

- Seleção simples de elementos por ID, classe ou tag
- Relacionamentos diretos pai-filho
- Correspondência de atributos com padrões simples
- Cenários críticos de desempenho
- Ao atravessar para baixo no DOM

```python
# Exemplos de CSS limpos e performáticos
await tab.query("#login-form")
await tab.query(".submit-button")
await tab.query("div.container > p.intro")
await tab.query("input[type='email'][required]")
await tab.query("ul.menu li:first-child")
```

## Quando Usar XPath

XPath é ideal para:

- Correspondência de texto complexa e buscas parciais de texto
- Atravessar para cima até elementos pais
- Encontrar elementos relativos a irmãos
- Lógica condicional em seletores
- Relacionamentos DOM complexos

```python
# Exemplos poderosos de XPath
await tab.query("//button[contains(text(), 'Submit')]")
await tab.query("//input[@name='email']/parent::div")
await tab.query("//td[text()='John']/following-sibling::td[2]")
await tab.query("//div[contains(@class, 'product') and @data-price > 100]")
```

## Referência de Sintaxe de Seletor CSS

### Seletores Básicos

```python
# Seletor de elemento
await tab.query("div")              # Primeiro elemento <div>
await tab.query("div", find_all=True)  # Todos os elementos <div>
await tab.query("button")           # Primeiro elemento <button>

# Seletor de ID
await tab.query("#username")        # Elemento com id="username"

# Seletor de classe
await tab.query(".submit-btn")      # Primeiro elemento com class="submit-btn"
await tab.query(".submit-btn", find_all=True)  # Todos os elementos com a classe
await tab.query(".btn.primary")     # Primeiro elemento com ambas as classes

# Seletor universal
await tab.query("*", find_all=True) # Todos os elementos
```

### Combinadores

```python
# Combinador descendente (espaço)
await tab.query("div p")            # Primeiro <p> dentro de <div>
await tab.query("div p", find_all=True)  # Todos os <p> dentro de <div> (qualquer profundidade)

# Combinador filho (>)
await tab.query("div > p")          # Primeiro <p> que é filho direto de <div>
await tab.query("div > p", find_all=True)  # Todos os <p> que são filhos diretos

# Combinador irmão adjacente (+)
await tab.query("h1 + p")           # <p> imediatamente após <h1>

# Combinador irmão geral (~)
await tab.query("h1 ~ p")           # Primeiro <p> irmão após <h1>
await tab.query("h1 ~ p", find_all=True)  # Todos os <p> irmãos após <h1>
```

### Seletores de Atributo

```python
# Atributo existe
await tab.query("input[required]")                # Primeiro input com 'required'
await tab.query("input[required]", find_all=True) # Todos os inputs com 'required'

# Atributo igual
await tab.query("input[type='email']")            # Primeiro input de email
await tab.query("input[type='email']", find_all=True)  # Todos os inputs de email

# Atributo contém palavra
await tab.query("div[class~='active']")           # Primeiro div com classe 'active'

# Atributo começa com
await tab.query("a[href^='https://']")            # Primeiro link HTTPS
await tab.query("a[href^='https://']", find_all=True)  # Todos os links HTTPS

# Atributo termina com
await tab.query("img[src$='.png']")               # Primeira imagem PNG
await tab.query("img[src$='.png']", find_all=True)     # Todas as imagens PNG

# Atributo contém substring
await tab.query("a[href*='example']")             # Primeiro link com 'example'
await tab.query("a[href*='example']", find_all=True)   # Todos os links com 'example'

# Correspondência insensível a maiúsculas/minúsculas (case-insensitive)
await tab.query("input[type='text' i]")           # Correspondência case-insensitive
```

### Pseudo-classes

```python
# Pseudo-classes estruturais
await tab.query("li:first-child")                 # Primeiro <li> que é primeiro filho
await tab.query("li:last-child")                  # Primeiro <li> que é último filho
await tab.query("li:nth-child(2)")                # Primeiro <li> que é 2º filho
await tab.query("li:nth-child(odd)", find_all=True)  # Todos os <li> ímpares
await tab.query("li:nth-child(even)", find_all=True)  # Todos os <li> pares
await tab.query("li:nth-child(3n)", find_all=True)    # A cada 3º <li>

# Pseudo-classes baseadas em tipo
await tab.query("p:first-of-type")                # Primeiro <p> entre irmãos
await tab.query("p:last-of-type")                 # Último <p> entre irmãos
await tab.query("p:nth-of-type(2)")               # Segundo <p> entre irmãos

# Pseudo-classes de estado
await tab.query("input:enabled")                  # Primeiro input habilitado
await tab.query("input:enabled", find_all=True)   # Todos os inputs habilitados
await tab.query("input:disabled")                 # Primeiro input desabilitado
await tab.query("input:checked")                  # Primeiro checkbox/radio marcado
await tab.query("input:focus")                    # Input atualmente focado

# Outras pseudo-classes úteis
await tab.query("div:empty")                      # Primeiro elemento vazio
await tab.query("div:empty", find_all=True)       # Todos os elementos vazios
await tab.query("div:not(.exclude)")              # Primeiro div sem a classe
await tab.query("div:not(.exclude)", find_all=True)  # Todos os divs sem a classe
```

## Referência de Sintaxe XPath

### Expressões de Caminho Básicas

```python
# Caminho absoluto (da raiz)
await tab.query("/html/body/div")                 # Primeiro div no caminho exato

# Caminho relativo (de qualquer lugar)
await tab.query("//div")                          # Primeiro elemento <div>
await tab.query("//div", find_all=True)           # Todos os elementos <div>
await tab.query("//div/p")                        # Primeiro <p> dentro de qualquer <div>
await tab.query("//div/p", find_all=True)         # Todos os <p> dentro de qualquer <div>

# Nó atual
await tab.query("./div")                          # Primeiro <div> relativo ao atual

# Nó pai
await tab.query("..")                             # Pai do nó atual
```

### Seleção de Atributo

```python
# Correspondência básica de atributo
await tab.query("//input[@type='email']")         # Primeiro input de email
await tab.query("//input[@type='email']", find_all=True)  # Todos os inputs de email
await tab.query("//div[@id='content']")           # Div com id='content'

# Múltiplos atributos
await tab.query("//input[@type='text' and @required]")  # Primeira correspondência
await tab.query("//input[@type='text' and @required]", find_all=True)  # Todas as correspondências
await tab.query("//div[@class='card' or @class='panel']")  # Primeiro card ou panel

# Atributo existe
await tab.query("//button[@disabled]")            # Primeiro botão desabilitado
await tab.query("//button[@disabled]", find_all=True)  # Todos os botões desabilitados
```

## Eixos (Axes) XPath (Navegação Direcional)

O poder real do XPath vem de sua habilidade de navegar em qualquer direção através da árvore DOM.

### Tabela de Referência de Eixos

| Eixo | Direção | Descrição | Exemplo |
|---|---|---|---|
| `child::` | Para baixo | Apenas filhos diretos | `//div/child::p` |
| `descendant::` | Para baixo | Todos os descendentes (qualquer profundidade) | `//div/descendant::a` |
| `parent::` | Para cima | Pai imediato | `//input/parent::div` |
| `ancestor::` | Para cima | Todos os ancestrais (qualquer profundidade) | `//span/ancestor::div` |
| `following-sibling::` | Lateralmente | Irmãos após o atual | `//h1/following-sibling::p` |
| `preceding-sibling::` | Lateralmente | Irmãos antes do atual | `//p/preceding-sibling::h1` |
| `following::` | Para frente | Todos os nós após o atual | `//h1/following::*` |
| `preceding::` | Para trás | Todos os nós antes do atual | `//h1/preceding::*` |
| `ancestor-or-self::` | Para cima | Ancestrais + atual | `//div/ancestor-or-self::*` |
| `descendant-or-self::` | Para baixo | Descendentes + atual | `//div/descendant-or-self::*` |
| `self::` | Atual | Apenas o nó atual | `//div/self::div` |
| `attribute::` | Atributo | Atributos do atual | `//div/attribute::class` |

!!! info "Sintaxe Abreviada"
    - `//div` é abreviação de `/descendant-or-self::node()/child::div`
    - `//div/p` é abreviação de `//div/child::p`
    - `@id` é abreviação de `attribute::id`
    - `..` é abreviação de `parent::node()`

### Exemplos Práticos de Eixos

```python
# Navegar para o pai
await tab.query("//input[@name='email']/parent::div")
await tab.query("//span[@class='error']/..")       # Abreviação

# Encontrar ancestral
await tab.query("//input/ancestor::form")          # Primeiro <form> ancestral
await tab.query("//button/ancestor::div[@class='modal']")

# Navegação entre irmãos
await tab.query("//label[text()='Email:']/following-sibling::input")
await tab.query("//h2/following-sibling::p[1]")    # Primeiro <p> após <h2>
await tab.query("//h2/following-sibling::p", find_all=True)  # Todos os <p> após <h2>
await tab.query("//button/preceding-sibling::input[last()]")

# Relacionamentos complexos
await tab.query("//tr/td[1]/following-sibling::td[2]")  # 3ª célula na primeira linha
await tab.query("//tr/td[1]/following-sibling::td[2]", find_all=True)  # 3ª célula em todas as linhas
```

## Funções XPath

### Funções de Texto

```python
# Correspondência exata de texto
await tab.query("//button[text()='Submit']")

# Contém texto
await tab.query("//p[contains(text(), 'welcome')]")

# Começa com
await tab.query("//a[starts-with(@href, 'https://')]")

# Normalização de texto (remove espaços em branco extras)
await tab.query("//button[normalize-space(text())='Submit']")

# Comprimento da string
await tab.query("//input[string-length(@value) > 5]")

# Concatenação
await tab.query("//div[concat(@data-first, @data-last)='JohnDoe']")
```

### Funções Numéricas

```python
# Correspondência de posição
await tab.query("//li[position()=1]")              # Primeiro <li>
await tab.query("//li[position() > 3]", find_all=True)  # Todos os <li> após o 3º
await tab.query("//li[last()]")                    # Último <li>
await tab.query("//li[last()-1]")                  # Penúltimo

# Contagem
await tab.query("//ul[count(li) > 5]")             # Primeiro <ul> com mais de 5 itens
await tab.query("//ul[count(li) > 5]", find_all=True)  # Todos os <ul> com > 5 itens

# Operações numéricas
await tab.query("//div[@data-price > 100]")        # Primeiro div com preço > 100
await tab.query("//div[@data-price > 100]", find_all=True)  # Todos os divs
await tab.query("//div[number(@data-stock) = 0]")  # Primeiro com estoque = 0
```

### Funções Booleanas

```python
# Lógica booleana
await tab.query("//div[@visible='true' and @enabled='true']")  # Primeira correspondência
await tab.query("//input[@type='text' or @type='email']")  # Primeiro text ou email
await tab.query("//input[@type='text' or @type='email']", find_all=True)  # Todos
await tab.query("//button[not(@disabled)]")        # Primeiro botão habilitado
await tab.query("//button[not(@disabled)]", find_all=True)  # Todos os botões habilitados

# Verificações de existência
await tab.query("//div[child::p]")                 # Primeiro div com filhos <p>
await tab.query("//div[child::p]", find_all=True)  # Todos os divs com filhos <p>
await tab.query("//div[not(child::*)]")            # Primeiro div vazio
await tab.query("//div[not(child::*)]", find_all=True)  # Todos os divs vazios
```

## Predicados XPath

Predicados filtram conjuntos de nós usando condições entre colchetes `[]`.

```python
# Predicados de posição
await tab.query("(//div)[1]")                      # Primeiro <div> no documento
await tab.query("(//div)[last()]")                 # Último <div> no documento
await tab.query("//ul/li[3]")                      # Primeiro 3º <li> em um <ul>
await tab.query("//ul/li[3]", find_all=True)       # Todos os 3º <li> em cada <ul>

# Múltiplos predicados (lógica E)
await tab.query("//input[@type='text'][@required]")  # Primeira correspondência
await tab.query("//div[@class='product'][position() < 4]", find_all=True)  # Os 3 primeiros

# Predicados de atributo
await tab.query("//div[@data-id='123']")
await tab.query("//a[contains(@class, 'button')]")  # Primeiro link correspondente
await tab.query("//input[starts-with(@name, 'user')]")  # Primeiro input correspondente
```

## Exemplos do Mundo Real: Localização Complexa de Elementos

Vamos trabalhar com uma estrutura HTML realista para demonstrar seletores avançados.

### Estrutura HTML de Exemplo

```html
<div class="dashboard">
    <header>
        <h1>User Dashboard</h1>
        <nav class="menu">
            <a href="/home" class="active">Home</a>
            <a href="/profile">Profile</a>
            <a href="/settings">Settings</a>
        </nav>
    </header>
    
    <main>
        <section class="products">
            <h2>Available Products</h2>
            <table id="products-table">
                <thead>
                    <tr>
                        <th>Product Name</th>
                        <th>Price</th>
                        <th>Stock</th>
                        <th>Actions</th>
                    </tr>
                </thead>
                <tbody>
                    <tr data-product-id="101">
                        <td>Laptop</td>
                        <td class="price">$999</td>
                        <td class="stock">15</td>
                        <td>
                            <button class="btn-edit">Edit</button>
                            <button class="btn-delete">Delete</button>
                        </td>
                    </tr>
                    <tr data-product-id="102">
                        <td>Mouse</td>
                        <td class="price">$25</td>
                        <td class="stock">0</td>
                        <td>
                            <button class="btn-edit">Edit</button>
                            <button class="btn-delete" disabled>Delete</button>
                        </td>
                    </tr>
                    <tr data-product-id="103">
                        <td>Keyboard</td>
                        <td class="price">$75</td>
                        <td class="stock">8</td>
                        <td>
                            <button class="btn-edit">Edit</button>
                            <button class="btn-delete">Delete</button>
                        </td>
                    </tr>
                </tbody>
            </table>
        </section>
        
        <section class="user-form">
            <h2>User Information</h2>
            <form id="user-form">
                <div class="form-group">
                    <label for="username">Username:</label>
                    <input type="text" id="username" name="username" required>
                    <span class="error-message" style="display:none;">Invalid username</span>
                </div>
                <div class="form-group">
                    <label for="email">Email:</label>
                    <input type="email" id="email" name="email" required>
                    <span class="error-message" style="display:none;">Invalid email</span>
                </div>
                <div class="form-group">
                    <input type="checkbox" id="newsletter" name="newsletter">
                    <label for="newsletter">Subscribe to newsletter</label>
                </div>
                <button type="submit" class="btn-primary">Save Changes</button>
                <button type="button" class="btn-secondary">Cancel</button>
            </form>
        </section>
    </main>
</div>
```

### Desafio 1: Encontrar Link de Navegação Ativo

**Objetivo**: Encontrar o link de navegação atualmente ativo.

```python
# Seletor CSS
active_link = await tab.query("nav.menu a.active")

# XPath
active_link = await tab.query("//nav[@class='menu']//a[@class='active']")

# Obter seu texto
text = await active_link.text
print(text)  # "Home"
```

### Desafio 2: Encontrar Botão de Edição para Produto Específico

**Objetivo**: Encontrar o botão "Edit" para o produto "Mouse" (sem saber sua posição na linha).

```python
# XPath (recomendado para este caso)
edit_button = await tab.query(
    "//tr[td[text()='Mouse']]//button[contains(@class, 'btn-edit')]"
)

# Alternativa: Usando following-sibling
edit_button = await tab.query(
    "//td[text()='Mouse']/following-sibling::td//button[@class='btn-edit']"
)
```

!!! tip "Por que XPath Aqui?"
    Seletores CSS não podem atravessar para cima para encontrar a linha e depois para baixo até o botão. A habilidade do XPath de se mover livremente pelo DOM torna isso trivial.

### Desafio 3: Encontrar Todos os Produtos com Preço Acima de $50

**Objetivo**: Obter todas as linhas da tabela onde o preço é maior que $50.

```python
# XPath com comparação numérica
expensive_products = await tab.query(
    "//tr[number(translate(td[@class='price'], '$,', '')) > 50]",
    find_all=True
)

# Versão mais legível: usando contains para casos mais simples
# Isso encontra produtos com preço contendo valores específicos
products = await tab.query("//tr[contains(td[@class='price'], '$75')]", find_all=True)
```

!!! note "Conversão de Texto para Número"
    A função `translate()` remove os caracteres `$` e `,`, então `number()` converte para numérico para comparação.

### Desafio 4: Encontrar Todos os Produtos Fora de Estoque

**Objetivo**: Encontrar todos os produtos onde o estoque é 0.

```python
# XPath
out_of_stock = await tab.query(
    "//tr[td[@class='stock' and text()='0']]",
    find_all=True
)

# Alternativa: Encontrar todas as linhas e checar o estoque
rows = await tab.query("//tbody/tr[td[@class='stock']/text()='0']", find_all=True)
```

### Desafio 5: Encontrar Campo de Input pelo Seu Label

**Objetivo**: Encontrar o input de email localizando seu label primeiro.

```python
# XPath usando o eixo following-sibling a partir do label
email_input = await tab.query("//label[text()='Email:']/following-sibling::input")

# Alternativa: Usando o atributo for
email_input = await tab.query("//input[@id=(//label[text()='Email:']/@for)]")

# Mais genérico: Encontrar pelo texto do label
username_input = await tab.query(
    "//label[contains(text(), 'Username')]/following-sibling::input"
)
```

### Desafio 6: Encontrar Mensagem de Erro Próxima ao Campo de Email

**Objetivo**: Obter o span de mensagem de erro que aparece ao lado do input de email.

```python
# XPath - encontrar irmão de erro do input de email
error_span = await tab.query(
    "//input[@id='email']/following-sibling::span[@class='error-message']"
)

# Alternativa: Navegar a partir da div pai
error_span = await tab.query(
    "//input[@id='email']/parent::div//span[@class='error-message']"
)

# Checar visibilidade
is_visible = await error_span.is_visible()
```

### Desafio 7: Encontrar Botão de Envio (Não o de Cancelar)

**Objetivo**: Encontrar o botão de envio, excluindo o botão de cancelar.

```python
# Seletor CSS (simples)
submit_button = await tab.query("button[type='submit']")
submit_button = await tab.query("button.btn-primary")

# XPath com texto
submit_button = await tab.query("//button[text()='Save Changes']")

# XPath excluindo outros
submit_button = await tab.query(
    "//button[@type='submit' and not(@class='btn-secondary')]"
)
```

### Desafio 8: Encontrar Todos os Campos Obrigatórios do Formulário

**Objetivo**: Obter todos os campos de input obrigatórios no formulário.

```python
# Seletor CSS (limpo)
required_fields = await tab.query(
    "#user-form input[required]",
    find_all=True
)

# XPath
required_fields = await tab.query(
    "//form[@id='user-form']//input[@required]",
    find_all=True
)

# Verificar
for field in required_fields:
    field_name = await field.get_attribute("name")
    print(f"Obrigatório: {field_name}")
```

### Desafio 9: Encontrar Primeiro Botão de Deletar Não Desabilitado

**Objetivo**: Encontrar o primeiro botão de deletar que não está desabilitado.

```python
# Seletor CSS
first_enabled_delete = await tab.query("button.btn-delete:not([disabled])")

# XPath
first_enabled_delete = await tab.query(
    "//button[contains(@class, 'btn-delete') and not(@disabled)]"
)

# Obter todos os botões de deletar habilitados
all_enabled = await tab.query(
    "//button[@class='btn-delete' and not(@disabled)]",
    find_all=True
)
```

### Desafio 10: Encontrar Linha da Tabela por Múltiplas Condições

**Objetivo**: Encontrar produtos com estoque > 0 E preço < $100.

```python
# XPath com lógica complexa
available_affordable = await tab.query(
    """
    //tr[
        number(td[@class='stock']) > 0 
        and 
        number(translate(td[@class='price'], '$', '')) < 100
    ]
    """,
    find_all=True
)

# Para cada produto correspondente
for row in available_affordable:
    cells = await row.query("td", find_all=True)
    product_name = await cells[0].text
    print(f"Disponível: {product_name}")
```

### Desafio 11: Navegar em Relacionamentos Complexos

**Objetivo**: A partir de um botão de deletar, obter o nome do produto na mesma linha.

```python
# Começar com um botão de deletar
delete_button = await tab.query("//tr[@data-product-id='101']//button[@class='btn-delete']")

# Navegar para a linha pai, depois para a primeira célula
product_name_cell = await delete_button.query("./ancestor::tr/td[1]")
product_name = await product_name_cell.text
print(product_name)  # "Laptop"

# Alternativa: Obter a linha inteira primeiro
row = await delete_button.query("./ancestor::tr")
product_id = await row.get_attribute("data-product-id")
print(product_id)  # "101"
```

### Desafio 12: Encontrar Checkbox e Seu Label Juntos

**Objetivo**: Encontrar o checkbox da newsletter e verificar seu label.

```python
# Encontrar checkbox
checkbox = await tab.query("#newsletter")

# Obter label associado usando atributo 'for'
label = await tab.query("//label[@for='newsletter']")
label_text = await label.text
print(label_text)  # "Subscribe to newsletter"

# Alternativa: Navegar do checkbox para o label
label = await checkbox.query("./following::label[@for='newsletter']")

# Checar se está marcado
is_checked = await checkbox.is_checked()
```

## Padrão Avançado: Construção Dinâmica de Seletor

Ao lidar com conteúdo dinâmico, você pode precisar construir seletores programaticamente:

```python
def _xpath_literal(value: str) -> str:
    """Return ``value`` as a safely quoted XPath 1.0 string literal.

    XPath 1.0 has no escape character inside string literals, so a
    backslash does not neutralise a quote. The only safe options are to
    pick the quote style the value does not contain or, when it contains
    both, to stitch the pieces together with ``concat()``.
    """
    if "'" not in value:
        return f"'{value}'"
    if '"' not in value:
        return f'"{value}"'
    # Both quote kinds are present: split on single quotes and re-insert
    # each one as a double-quoted literal between the pieces.
    pieces = (f"'{piece}'" for piece in value.split("'"))
    return "concat(" + ", \"'\", ".join(pieces) + ")"


async def find_product_by_name(tab, product_name: str):
    """Find a product row dynamically by its exact name.

    Args:
        tab: Object exposing an awaitable ``query(xpath)`` method.
        product_name: Exact text of the cell to match; may contain quotes.

    Returns:
        Whatever ``tab.query`` returns for the built expression.
    """
    # Quote the name as an XPath literal to prevent XPath injection
    xpath = f"//tr[td[text()={_xpath_literal(product_name)}]]"
    return await tab.query(xpath)

async def find_table_cell(tab, row_text: str, column_index: int):
    """Find a specific cell by row content and column position.

    Args:
        tab: Object exposing an awaitable ``query(xpath)`` method.
        row_text: Text that one cell of the row must contain.
        column_index: 1-based position of the cell to return.

    Returns:
        Whatever ``tab.query`` returns for the built expression.
    """
    # int() guarantees only a number reaches the positional predicate
    xpath = (
        f"//tr[td[contains(text(), {_xpath_literal(row_text)})]]"
        f"/td[{int(column_index)}]"
    )
    return await tab.query(xpath)

# Uso
product_row = await find_product_by_name(tab, "Laptop")
price_cell = await find_table_cell(tab, "Laptop", 2)
price = await price_cell.text
print(price)  # "$999"
```

## Comparação de Desempenho

```python
import asyncio
import time

async def benchmark_selectors(tab):
    """Compare CSS and XPath selector performance.

    Runs each selector 100 times against ``tab`` and prints the elapsed
    time of both loops plus their ratio.

    Args:
        tab: Object exposing an awaitable ``query(selector, find_all=...)``.
    """

    # Warm-up
    await tab.query("#products-table")

    # perf_counter() is the clock intended for measuring intervals: it is
    # monotonic and high-resolution, whereas time.time() follows the wall
    # clock and can jump or tick too coarsely for short loops.

    # CSS benchmark
    start = time.perf_counter()
    for _ in range(100):
        await tab.query("#products-table tbody tr", find_all=True)
    css_time = time.perf_counter() - start

    # XPath benchmark
    start = time.perf_counter()
    for _ in range(100):
        await tab.query("//table[@id='products-table']//tbody//tr", find_all=True)
    xpath_time = time.perf_counter() - start

    print(f"CSS: {css_time:.3f}s")
    print(f"XPath: {xpath_time:.3f}s")
    print(f"CSS é {xpath_time/css_time:.2f}x mais rápido")

# Resultados típicos: CSS é 1.2-1.5x mais rápido para seletores simples
```

!!! warning "Desempenho vs Legibilidade"
    Embora seletores CSS sejam geralmente mais rápidos, a diferença é usualmente negligenciável (milissegundos) para consultas individuais. Escolha o seletor que torna seu código mais legível e sustentável, especialmente para relacionamentos complexos onde o XPath se destaca.

## Melhores Práticas de Seletores

### 1. Prefira Seletores Estáveis

```python
# Bom: Usando atributos semânticos
await tab.query("#user-email")
await tab.query("[data-testid='submit-button']")
await tab.query("input[name='username']")

# Evite: Seletores frágeis baseados na estrutura
await tab.query("div > div > div:nth-child(3) > input")
await tab.query("body > div:nth-child(2) > form > div:first-child")
```

### 2. Use o Seletor Mais Simples que Funciona

```python
# Bom: Simples e eficiente
await tab.query("#login-form")
await tab.query(".submit-button")

# Evite: Complicado demais quando desnecessário
await tab.query("//div[@id='content']/descendant::form[@id='login-form']")
```

### 3. Combine find() e query() Apropriadamente

```python
# Use find() para correspondência simples de atributos
username = await tab.find(id="username")
submit = await tab.find(tag_name="button", type="submit")

# Use query() para padrões complexos
active_link = await tab.query("nav.menu a.active")
error_msg = await tab.query("//input[@name='email']/following-sibling::span[@class='error']")
```

### 4. Adicione Comentários para Seletores Complexos

```python
# Encontrar o botão "Edit" na linha que contém o produto "Laptop"
# XPath: Navega para a linha com texto "Laptop", depois encontra o botão de edição
edit_button = await tab.query(
    "//tr[td[text()='Laptop']]//button[@class='btn-edit']"
)
```

## Conclusão

Ao entender tanto seletores CSS quanto XPath, juntamente com suas respectivas forças e casos de uso, você pode criar uma automação de navegador robusta e sustentável que lida com as complexidades das aplicações web modernas. Lembre-se:

- **Use seletores CSS** para seleções simples e críticas de desempenho
- **Use XPath** para relacionamentos complexos, correspondência de texto e navegação ascendente
- **Escolha estabilidade** em vez de brevidade ao escrever seletores
- **Comente consultas complexas** para manter a legibilidade do código

================================================
FILE: docs/pt/deep-dive/index.md
================================================
# Análise Profunda: Fundamentos Técnicos

**Bem-vindo ao coração técnico do Pydoll, onde exploramos os sistemas e protocolos que impulsionam a automação de navegadores.**

Esta seção fornece educação técnica abrangente sobre web scraping, automação de navegadores, protocolos de rede e técnicas anti-detecção. Em vez de focar apenas em padrões de uso, exploramos os mecanismos subjacentes, desde o primeiro pacote TCP até o pixel final renderizado.

## O que Torna Isto Diferente

A maioria das documentações de automação ensina **como usar uma ferramenta**. Esta seção ensina **como a internet realmente funciona**, e como manipulá-la em cada camada:

- **Protocolos de rede** (TCP/IP, TLS, HTTP/2) - A fundação invisível de cada requisição
- **Componentes internos do navegador** (CDP, motores de renderização, contextos JavaScript) - O que acontece dentro do Chrome
- **Sistemas de detecção** (fingerprinting, análise comportamental, detecção de proxy) - Como os sites identificam bots
- **Técnicas de evasão** (sobrescritas de CDP, aplicação de consistência, imitação humana) - Como se tornar indetectável

!!! quote "Filosofia"
    **"Qualquer tecnologia suficientemente avançada é indistinguível da mágica."**
    
    Esta seção visa desmistificar a automação de navegadores explicando os sistemas subjacentes. Entender esses fundamentos proporciona melhor controle e previsibilidade em seu trabalho de automação.

## A Arquitetura do Conhecimento

Esta seção está organizada em **cinco camadas progressivas**, cada uma construindo sobre a anterior:

### Fundamentos Essenciais
**[→ Explore os Fundamentos](./fundamentals/cdp.md)**

Comece pela base: entenda os protocolos e sistemas que impulsionam o Pydoll.

- **[Chrome DevTools Protocol](./fundamentals/cdp.md)** - Como o Pydoll conversa com os navegadores, contornando o WebDriver
- **[Camada de Conexão](./fundamentals/connection-layer.md)** - Arquitetura WebSocket, padrões assíncronos, CDP em tempo real
- **[Sistema de Tipos do Python](./fundamentals/typing-system.md)** - Segurança de tipos, TypedDict para CDP, integração com IDE

**Por que começar aqui**: Entender o CDP e a comunicação assíncrona fornece a base para compreender todos os outros aspectos da automação de navegadores.

---

### Arquitetura Interna
**[→ Explore a Arquitetura](./architecture/browser-domain.md)**

Suba para o próximo nível: entenda como os componentes internos do Pydoll trabalham juntos.

- **[Domínio do Navegador (Browser)](./architecture/browser-domain.md)** - Gerenciamento de processos, contextos, automação multi-perfil
- **[Domínio da Aba (Tab)](./architecture/tab-domain.md)** - Ciclo de vida da aba, operações concorrentes, manipulação de iframes
- **[Domínio do WebElement](./architecture/webelement-domain.md)** - Interações de elementos, shadow DOM, manipulação de atributos
- **[Mixin FindElements](./architecture/find-elements-mixin.md)** - Estratégias de seletores, travessia do DOM, otimização
- **[Arquitetura de Eventos](./architecture/event-architecture.md)** - Sistema de eventos reativo, callbacks, despacho assíncrono
- **[Arquitetura de Requisições do Navegador](./architecture/browser-requests-architecture.md)** - HTTP no contexto do navegador

**Por que isso importa**: Entender a arquitetura interna revela oportunidades de otimização e padrões de design que não são aparentes no uso superficial.

---

### Rede e Segurança
**[→ Explore Rede e Segurança](./network/index.md)**

Desça para a camada de protocolo: entenda como os dados fluem pela internet.

- **[Fundamentos de Rede](./network/network-fundamentals.md)** - Modelo OSI, TCP/UDP, vazamento de WebRTC
- **[Proxies HTTP/HTTPS](./network/http-proxies.md)** - Proxy de camada de aplicação, tunelamento CONNECT
- **[Proxies SOCKS](./network/socks-proxies.md)** - Proxy de camada de sessão, suporte UDP, segurança
- **[Detecção de Proxy](./network/proxy-detection.md)** - Níveis de anonimato, técnicas de detecção, evasão
- **[Construindo Servidores Proxy](./network/build-proxy.md)** - Implementações completas de HTTP e SOCKS5
- **[Questões Legais e Éticas](./network/proxy-legal.md)** - GDPR, CFAA, conformidade, uso responsável

**Visão crítica**: Características de rede são determinadas no nível do SO. Incompatibilidades entre a identidade do navegador declarada e os fingerprints de nível de rede podem ser detectadas por sistemas anti-bot sofisticados.

---

### Fingerprinting (Impressão Digital)
**[→ Explore Fingerprinting](./fingerprinting/index.md)**

Entendendo sistemas de detecção e técnicas de evasão para automação de navegadores.

- **[Network Fingerprinting](./fingerprinting/network-fingerprinting.md)** - TCP/IP, TLS/JA3, p0f, Nmap, Scapy
- **[Browser Fingerprinting](./fingerprinting/browser-fingerprinting.md)** - HTTP/2, Canvas, WebGL, APIs JavaScript
- **[Técnicas de Evasão](./fingerprinting/evasion-techniques.md)** - Sobrescritas de CDP, consistência, código prático

**Visão chave**: Cada conexão revela numerosas características (renderização de canvas, tamanho da janela TCP, ordem de cifras TLS). Furtividade eficaz requer consistência em todas as camadas de detecção.

---

### Guias Práticos
**[→ Explore os Guias](./guides/selectors-guide.md)**

Aplique seu conhecimento: guias práticos para desafios comuns de automação.

- **[Seletores CSS vs XPath](./guides/selectors-guide.md)** - Sintaxe de seletores, desempenho, melhores práticas

**Em breve**: Mais guias práticos sintetizando o conhecimento técnico em padrões acionáveis.

---

## Trilhas de Aprendizagem

Objetivos diferentes exigem conhecimentos diferentes. Escolha sua trilha:

### Trilha 1: Automação Furtiva (Stealth)
**Objetivo: Construir scrapers indetectáveis**

1.  **[Visão Geral de Fingerprinting](./fingerprinting/index.md)** - Entenda o cenário de detecção
2.  **[Network Fingerprinting](./fingerprinting/network-fingerprinting.md)** - Assinaturas TCP/IP, TLS
3.  **[Browser Fingerprinting](./fingerprinting/browser-fingerprinting.md)** - Canvas, WebGL, HTTP/2
4.  **[Técnicas de Evasão](./fingerprinting/evasion-techniques.md)** - Contramedidas baseadas em CDP
5.  **[Rede e Segurança](./network/index.md)** - Seleção e configuração de proxy
6.  **[Domínio do Navegador (Browser)](./architecture/browser-domain.md)** - Isolamento de contexto, gerenciamento de processos

**Investimento de tempo**: 12-16 horas de aprendizado técnico profundo
**Recompensa**: Capacidade de contornar sistemas anti-bot sofisticados

---

### Trilha 2: Maestria em Arquitetura
**Objetivo: Contribuir para o Pydoll ou construir ferramentas similares**

1.  **[Análise Profunda do CDP](./fundamentals/cdp.md)** - Fundamentos do protocolo
2.  **[Camada de Conexão](./fundamentals/connection-layer.md)** - Padrões assíncronos WebSocket
3.  **[Arquitetura de Eventos](./architecture/event-architecture.md)** - Design orientado a eventos
4.  **[Domínio do Navegador (Browser)](./architecture/browser-domain.md)** - Gerenciamento do navegador
5.  **[Domínio da Aba (Tab)](./architecture/tab-domain.md)** - Ciclo de vida da aba
6.  **[Domínio do WebElement](./architecture/webelement-domain.md)** - Interação de elementos
7.  **[Sistema de Tipos do Python](./fundamentals/typing-system.md)** - Integração de segurança de tipos

**Investimento de tempo**: 16-20 horas de estudo arquitetural
**Recompensa**: Entendimento profundo dos componentes internos da automação de navegadores

---

### Trilha 3: Engenharia de Rede
**Objetivo: Dominar proxies, fingerprinting e furtividade em nível de rede**

1.  **[Fundamentos de Rede](./network/network-fundamentals.md)** - Modelo OSI, TCP/UDP, WebRTC
2.  **[Network Fingerprinting](./fingerprinting/network-fingerprinting.md)** - Assinaturas TCP/IP, TLS/JA3
3.  **[Proxies HTTP/HTTPS](./network/http-proxies.md)** - Proxy de camada de aplicação
4.  **[Proxies SOCKS](./network/socks-proxies.md)** - Proxy de camada de sessão
5.  **[Detecção de Proxy](./network/proxy-detection.md)** - Anonimato e evasão
6.  **[Construindo Servidores Proxy](./network/build-proxy.md)** - Implementação do zero

**Investimento de tempo**: 14-18 horas de estudo de protocolos de rede
**Recompensa**: Entendimento completo de anonimato e detecção em nível de rede

---

## Pré-requisitos

Este é um material técnico **avançado**. Os pré-requisitos recomendados incluem:

- **Fundamentos de Python** - Classes, async/await, gerenciadores de contexto, decoradores
- **Redes básicas** - Endereços IP, portas, protocolo HTTP
- **Básico de Pydoll** - Veja [Funcionalidades](../features/core-concepts.md) e [Começando](../index.md)
- **Browser DevTools** - Inspetor do Chrome, aba Rede, Console

**Se você é novo nisso**, recomendamos:
1.  Completar a seção [Funcionalidades](../features/index.md) primeiro
2.  Praticar automação básica com o Pydoll
3.  Retornar aqui quando precisar de um entendimento mais profundo

## A Filosofia da Maestria

Automação web envolve múltiplas áreas de especialização:

- **Engenharia de protocolos** - Entender TCP/IP, TLS, HTTP/2
- **Programação de sistemas** - Gerenciar processos, I/O assíncrono, WebSockets
- **Pesquisa em segurança** - Fingerprinting, detecção, evasão
- **Componentes internos do navegador** - Renderização, contextos JavaScript, CDP
- **Segurança operacional** - Conformidade legal, diretrizes éticas

A maioria dos desenvolvedores aprende isso independentemente, ao longo do tempo. Esta seção consolida esse conhecimento ao:

1.  **Centralizar conhecimento** - Chega de posts de blog espalhados e artigos acadêmicos
2.  **Fornecer contexto** - Cada técnica explicada desde os primeiros princípios
3.  **Oferecer código funcional** - Todos os exemplos estão prontos para produção
4.  **Citar fontes** - Cada alegação é apoiada por RFCs, documentação ou pesquisa
5.  **Complexidade progressiva** - Cada seção constrói sobre o conhecimento anterior

## Padrões da Documentação

Esta documentação representa extensa pesquisa, testes e validação:

- Cada detalhe de protocolo verificado contra RFCs
- Cada técnica de fingerprinting testada em produção
- Cada exemplo de código roda sem modificação
- Cada alegação citada com fontes autoritativas
- Cada diagrama gerado a partir do comportamento real do sistema

Precisão técnica e aplicabilidade prática são priorizadas em todo o conteúdo.

## Uso Ético

Com este conhecimento vem a responsabilidade:

!!! danger "Use com Responsabilidade"
    As técnicas descritas aqui podem servir tanto para automação legítima quanto para fins maliciosos. O uso responsável inclui:
    
    - Respeitar os termos de serviço dos sites e o robots.txt
    - Implementar limitação de taxa (rate limiting) e rastreamento respeitoso
    - Considerar se a automação é realmente necessária
    - Consultar aconselhamento jurídico em caso de incerteza
    - Ser transparente sobre sua automação quando apropriado
    
    Evite usar este conhecimento para:
    - Fraude, abuso de contas ou atividades ilegais
    - Sobrecarregar servidores com scraping agressivo
    - Atividades prejudiciais sem entender as consequências

Para orientação detalhada, veja **[Considerações Legais e Éticas](./network/proxy-legal.md)**.

## Contribuindo

Encontrou um erro? Tem uma sugestão? Viu algo desatualizado?

Esta documentação é um **projeto vivo**. Técnicas de fingerprinting evoluem, protocolos atualizam e novos métodos de evasão emergem. Aceitamos contribuições que:

- Corrijam imprecisões técnicas
- Adicionem novas técnicas de fingerprinting
- Atualizem informações de protocolo
- Melhorem exemplos de código
- Expandam a cobertura de sistemas de detecção

Veja [Contribuindo](../CONTRIBUTING.md) para diretrizes de submissão.

---

## Começando

Escolha uma trilha com base em seus objetivos:

**Novo em conteúdo técnico profundo?**
→ Comece com **[Chrome DevTools Protocol](./fundamentals/cdp.md)** para entender a fundação do Pydoll

**Precisa de automação furtiva?**
→ Pule para **[Fingerprinting](./fingerprinting/index.md)** para técnicas de detecção e evasão

**Quer controle em nível de rede?**
→ Explore **[Rede e Segurança](./network/index.md)** para arquitetura de proxy e protocolos

**Construindo infraestrutura de automação?**
→ Estude **[Arquitetura Interna](./architecture/browser-domain.md)** para padrões de design

**Só quer dar uma olhada?**
→ Escolha qualquer tópico da barra lateral, cada artigo é autocontido

---

!!! success "Análise Profunda Técnica"
    Esta seção fornece conhecimento técnico abrangente para automação de navegadores, desde protocolos fundamentais até técnicas avançadas de evasão.
    
    Explore no seu próprio ritmo.

================================================
FILE: docs/pt/deep-dive/network/build-proxy.md
================================================
# Construindo Servidores Proxy

Este documento implementa servidores proxy HTTP e SOCKS5 do zero em Python usando asyncio. O objetivo não é prontidão para produção, mas compreensão de protocolo: ver como cada byte é analisado, onde estão os limites de segurança e por que certas decisões de design existem em software proxy real.

!!! info "Navegação do Módulo"
    - [Fundamentos de Rede](./network-fundamentals.md): TCP/IP, UDP, WebRTC
    - [Proxies HTTP/HTTPS](./http-proxies.md): Proxy na camada de aplicação
    - [Proxies SOCKS](./socks-proxies.md): Proxy na camada de sessão
    - [Detecção de Proxy](./proxy-detection.md): Técnicas de detecção e evasão

    Para uso prático de proxy no Pydoll, veja [Configuração de Proxy](../../features/configuration/proxy.md).

!!! warning "Código Educacional"
    Estas implementações priorizam clareza sobre robustez. Elas não possuem limites de conexão, listas de controle de acesso e muitos caminhos de recuperação de erro que um proxy de produção requer. Não as exponha a redes não confiáveis.

## Proxy HTTP

Um proxy HTTP opera em dois modos. Para HTTP em texto plano, ele recebe a requisição completa (com uma URL em formato absoluto como `GET http://example.com/path HTTP/1.1`), reescreve o request-target para formato de origem (`GET /path HTTP/1.1`), conecta ao servidor destino, encaminha a requisição e retorna a resposta. Para HTTPS, o cliente envia uma requisição `CONNECT host:port`, o proxy abre uma conexão TCP para o destino, responde com `200 Connection Established`, e então retransmite bytes cegamente em ambas as direções sem inspecionar o conteúdo criptografado.

A implementação abaixo lida com ambos os modos. Algumas coisas para notar enquanto lê. O método `_pipe` chama `write_eof()` quando um lado fecha, que envia um TCP FIN para o outro lado. Sem isso, o túnel fica pendurado indefinidamente porque o outro `read()` nunca retorna bytes vazios. O caminho de encaminhamento HTTP usa a mesma abordagem de piping em vez de uma única chamada `read()`, porque respostas HTTP podem ser arbitrariamente grandes e um read de tamanho fixo as truncaria silenciosamente. A reescrita do request-target preserva query strings, que `urlparse().path` sozinho descartaria.

```python
import asyncio
import base64
import contextlib
import logging
from urllib.parse import urlparse

logger = logging.getLogger(__name__)


class HTTPProxy:
    """Asynchronous HTTP/HTTPS proxy with optional Basic authentication.

    Plain HTTP requests are rewritten from absolute-form to origin-form and
    forwarded to the target; ``CONNECT`` requests become blind TCP tunnels.
    Authentication is enforced only when ``username`` is set.
    """

    # Headers from the client that are never copied to the forwarded request.
    # The hop-by-hop ones belong to the client<->proxy connection only;
    # ``host`` is skipped because exactly one Host header is rebuilt from the
    # target URL, and forwarding the client's copy would duplicate it.
    _NOT_FORWARDED = frozenset({
        'proxy-authorization', 'proxy-connection',
        'connection', 'keep-alive', 'te', 'trailer', 'upgrade',
        'host',
    })

    def __init__(self, host='0.0.0.0', port=8080, username=None, password=None):
        self.host = host
        self.port = port
        self.username = username
        self.password = password

    async def start(self):
        """Bind the listening socket and serve clients until cancelled."""
        server = await asyncio.start_server(
            self._handle_client, self.host, self.port
        )
        logger.info(f'HTTP proxy listening on {self.host}:{self.port}')
        async with server:
            await server.serve_forever()

    async def _handle_client(self, reader, writer):
        """Read one request from a client and dispatch it by method."""
        try:
            request_line = await asyncio.wait_for(
                reader.readline(), timeout=30
            )
            if not request_line:
                return

            parts = request_line.decode('latin-1').split()
            if len(parts) != 3:
                await self._bad_request(writer)
                return

            method, url, _ = parts
            headers = await self._read_headers(reader)

            if not self._check_auth(headers):
                writer.write(
                    b'HTTP/1.1 407 Proxy Authentication Required\r\n'
                    b'Proxy-Authenticate: Basic realm="Proxy"\r\n'
                    b'Content-Length: 0\r\n\r\n'
                )
                await writer.drain()
                return

            if method == 'CONNECT':
                await self._handle_connect(url, reader, writer)
            else:
                await self._handle_http(method, url, headers, reader, writer)
        except Exception as e:
            logger.error(f'Client handler error: {e}')
        finally:
            writer.close()
            # The peer may already have reset the connection; that must not
            # escape from the cleanup path.
            with contextlib.suppress(OSError):
                await writer.wait_closed()

    async def _bad_request(self, writer):
        """Send a bare ``400 Bad Request`` response to ``writer``."""
        writer.write(b'HTTP/1.1 400 Bad Request\r\n\r\n')
        await writer.drain()

    async def _read_headers(self, reader):
        """Read header lines up to the blank line.

        Returns a dict keyed by lower-cased header name. A repeated header
        overwrites the earlier value.
        """
        headers = {}
        while True:
            line = await reader.readline()
            if line in (b'\r\n', b'\n', b''):
                break
            if b':' in line:
                key, value = line.decode('latin-1').split(':', 1)
                headers[key.strip().lower()] = value.strip()
        return headers

    def _check_auth(self, headers):
        """Return True when the request may proceed.

        Always True when no username is configured; otherwise the
        ``proxy-authorization`` header must carry matching Basic credentials.
        """
        if not self.username:
            return True
        auth = headers.get('proxy-authorization', '')
        if not auth.startswith('Basic '):
            return False
        try:
            decoded = base64.b64decode(auth[6:]).decode('utf-8')
        except ValueError:
            # Covers invalid Base64 and undecodable bytes alike.
            return False
        if ':' not in decoded:
            return False
        user, pwd = decoded.split(':', 1)
        return user == self.username and pwd == self.password

    @staticmethod
    def _parse_authority(target):
        """Split a CONNECT target into ``(host, port)``.

        Accepts ``host:port`` and bracketed IPv6 literals such as
        ``[::1]:443``. Returns ``None`` when the target is malformed or the
        port is not a number in the range 1-65535.
        """
        if target.startswith('['):
            bracket_end = target.find(']')
            if bracket_end == -1 or target[bracket_end + 1:bracket_end + 2] != ':':
                return None
            host = target[1:bracket_end]
            port_str = target[bracket_end + 2:]
        else:
            host, sep, port_str = target.rpartition(':')
            if not sep:
                return None
        if not host or not (port_str.isascii() and port_str.isdigit()):
            return None
        port = int(port_str)
        if not 0 < port <= 65535:
            return None
        return host, port

    async def _handle_connect(self, target, client_reader, client_writer):
        """Establish a blind TCP tunnel for HTTPS."""
        authority = self._parse_authority(target)
        if authority is None:
            await self._bad_request(client_writer)
            return
        host, port = authority

        try:
            server_reader, server_writer = await asyncio.open_connection(
                host, port
            )
        except OSError as e:
            logger.error(f'CONNECT failed to {host}:{port}: {e}')
            client_writer.write(b'HTTP/1.1 502 Bad Gateway\r\n\r\n')
            await client_writer.drain()
            return

        try:
            client_writer.write(b'HTTP/1.1 200 Connection Established\r\n\r\n')
            await client_writer.drain()

            await asyncio.gather(
                self._pipe(client_reader, server_writer),
                self._pipe(server_reader, client_writer),
            )
        finally:
            # _pipe only half-closes; the upstream socket itself must be
            # released here or it leaks for every tunnel.
            server_writer.close()
            with contextlib.suppress(OSError):
                await server_writer.wait_closed()

    def _build_forward_request(self, method, path, host, port, headers):
        """Build the origin-form request head sent to the target server.

        Emits the request line, a single rebuilt ``Host`` header, every
        client header not listed in ``_NOT_FORWARDED``, and a final
        ``Connection: close``. Returns the head as Latin-1 encoded bytes.
        """
        # IPv6 literals must be bracketed inside the Host header.
        authority = f'[{host}]' if ':' in host else host
        # Host header must include the port when it is non-default.
        if port != 80:
            authority += f':{port}'

        lines = [f'{method} {path} HTTP/1.1', f'Host: {authority}']
        lines.extend(
            f'{key}: {value}'
            for key, value in headers.items()
            if key not in self._NOT_FORWARDED
        )
        # Force Connection: close so the server does not keep the connection
        # alive, which would prevent the response stream from ending.
        lines.append('Connection: close')
        return ('\r\n'.join(lines) + '\r\n\r\n').encode('latin-1')

    async def _handle_http(self, method, url, headers, client_reader, client_writer):
        """Forward a plain-text HTTP request and relay the response."""
        try:
            parsed = urlparse(url)
            host = parsed.hostname
            port = parsed.port or 80
            content_length = int(headers.get('content-length', 0))
        except ValueError:
            # Invalid port, malformed IPv6 literal or non-numeric length.
            await self._bad_request(client_writer)
            return
        # Without an absolute URL there is no host; connecting with
        # host=None would silently target the proxy's own loopback.
        if not host or content_length < 0:
            await self._bad_request(client_writer)
            return

        # Preserve path parameters and the query string in the request-target
        path = parsed.path or '/'
        if parsed.params:
            path += f';{parsed.params}'
        if parsed.query:
            path += f'?{parsed.query}'

        try:
            server_reader, server_writer = await asyncio.open_connection(
                host, port
            )
        except OSError as e:
            logger.error(f'HTTP forward failed to {host}:{port}: {e}')
            client_writer.write(b'HTTP/1.1 502 Bad Gateway\r\n\r\n')
            await client_writer.drain()
            return

        try:
            server_writer.write(
                self._build_forward_request(method, path, host, port, headers)
            )

            # Forward the request body if present
            if content_length > 0:
                body = await client_reader.readexactly(content_length)
                server_writer.write(body)

            await server_writer.drain()

            # Relay the whole response (not a single fixed-size read)
            while True:
                chunk = await server_reader.read(65536)
                if not chunk:
                    break
                client_writer.write(chunk)
                await client_writer.drain()
        finally:
            # Release the upstream socket even when the relay fails midway.
            server_writer.close()
            with contextlib.suppress(OSError):
                await server_writer.wait_closed()

    async def _pipe(self, reader, writer):
        """Copy data from ``reader`` to ``writer`` until EOF, then half-close.

        Connection errors end the copy silently; ``write_eof()`` is attempted
        in every case so the opposite direction sees the stream end.
        """
        try:
            while True:
                data = await reader.read(8192)
                if not data:
                    break
                writer.write(data)
                await writer.drain()
        except (ConnectionResetError, BrokenPipeError, OSError):
            pass
        finally:
            with contextlib.suppress(Exception):
                if writer.can_write_eof():
                    writer.write_eof()

Alguns detalhes de protocolo que vale entender. Cabeçalhos HTTP são codificados como ISO-8859-1 (Latin-1), não UTF-8. Latin-1 mapeia cada valor de byte 0-255 para um caractere, então `decode('latin-1')` nunca levanta um `UnicodeDecodeError`, enquanto `decode('utf-8')` quebraria em certos valores de cabeçalho. O cabeçalho `Proxy-Authorization` usa codificação Base64, mas Base64 não é criptografia: as credenciais trafegam em texto claro (ou melhor, codificação trivialmente reversível) a menos que a conexão entre cliente e proxy esteja protegida por TLS. Os cabeçalhos hop-by-hop (`Connection`, `Keep-Alive`, `TE`, `Trailer`, `Upgrade`, `Proxy-Connection`) são destinados à conexão imediata entre dois nós, não para encaminhamento de ponta a ponta. A RFC 9110 Seção 7.6.1 requer que proxies os removam antes de encaminhar.

!!! warning "Risco de SSRF"
    Esta implementação não valida endereços de destino. Um cliente poderia solicitar `CONNECT 127.0.0.1:6379` para alcançar uma instância Redis local, ou `CONNECT 169.254.169.254:80` para acessar metadados de instância cloud (AWS, GCP, Azure). Qualquer proxy exposto a clientes não confiáveis deve validar destinos contra uma lista de negação de faixas privadas e link-local (`127.0.0.0/8`, `10.0.0.0/8`, `172.16.0.0/12`, `192.168.0.0/16`, `169.254.0.0/16`, `::1`, `fc00::/7`).

## Proxy SOCKS5

Um proxy SOCKS5 opera em um nível mais baixo que o HTTP. Ele usa um protocolo binário definido na RFC 1928, consistindo de três fases: negociação de método, autenticação opcional e a requisição de conexão. O proxy não analisa HTTP de forma alguma. Uma vez que o túnel é estabelecido, ele retransmite bytes brutos sem entender qual protocolo flui por ele.

A natureza binária do SOCKS5 significa que cada leitura deve receber exatamente o número esperado de bytes. TCP é um protocolo de stream e não garante que `read(4)` retorne 4 bytes: pode retornar 1, 2 ou 3 bytes dependendo das condições de rede. A implementação abaixo usa `readexactly()` do asyncio, que bufferiza internamente até que o número solicitado de bytes chegue ou a conexão feche (levantando `IncompleteReadError`).

```python
import asyncio
import contextlib
import struct
import logging

logger = logging.getLogger(__name__)


class SOCKS5Proxy:
    """Asynchronous SOCKS5 proxy supporting CONNECT and optional auth (RFC 1928).

    When ``username`` is set the proxy requires the username/password method
    (0x02); otherwise it requires the no-authentication method (0x00).
    """

    VERSION = 0x05

    def __init__(self, host='0.0.0.0', port=1080, username=None, password=None):
        self.host = host
        self.port = port
        self.username = username
        self.password = password

    async def start(self):
        """Bind the listening socket and serve clients until cancelled."""
        server = await asyncio.start_server(
            self._handle_client, self.host, self.port
        )
        logger.info(f'SOCKS5 proxy listening on {self.host}:{self.port}')
        async with server:
            await server.serve_forever()

    async def _handle_client(self, reader, writer):
        """Run the three protocol phases for one client connection."""
        try:
            if not await self._negotiate_method(reader, writer):
                return
            if self.username and not await self._authenticate(reader, writer):
                return
            await self._handle_request(reader, writer)
        except (asyncio.IncompleteReadError, ConnectionResetError):
            pass
        except Exception as e:
            logger.error(f'SOCKS5 error: {e}')
        finally:
            writer.close()
            # The peer may already have reset the connection; that must not
            # escape from the cleanup path.
            with contextlib.suppress(OSError):
                await writer.wait_closed()

    async def _negotiate_method(self, reader, writer):
        """Phase 1: the client offers auth methods, the server picks one.

        Returns True when a method was agreed. Replies with 0xFF ("no
        acceptable methods") and returns False when the client did not offer
        the method this proxy requires.
        """
        version = (await reader.readexactly(1))[0]
        if version != self.VERSION:
            return False

        nmethods = (await reader.readexactly(1))[0]
        methods = await reader.readexactly(nmethods)

        # The server may only select a method the client actually offered,
        # in no-auth mode just as much as in username/password mode.
        required = 0x02 if self.username else 0x00
        if required not in methods:
            writer.write(bytes([self.VERSION, 0xFF]))
            await writer.drain()
            return False

        writer.write(bytes([self.VERSION, required]))
        await writer.drain()
        return True

    async def _authenticate(self, reader, writer):
        """Phase 2: username/password sub-negotiation (RFC 1929).

        Returns True when the supplied credentials match the configured ones.
        """
        auth_ver = (await reader.readexactly(1))[0]
        if auth_ver != 0x01:
            return False

        ulen = (await reader.readexactly(1))[0]
        # errors='replace' keeps undecodable bytes from raising, so a bad
        # credential still receives the failure reply below.
        username = (await reader.readexactly(ulen)).decode('utf-8', errors='replace')
        plen = (await reader.readexactly(1))[0]
        password = (await reader.readexactly(plen)).decode('utf-8', errors='replace')

        ok = username == self.username and password == self.password
        writer.write(bytes([0x01, 0x00 if ok else 0x01]))
        await writer.drain()
        return ok

    async def _handle_request(self, reader, writer):
        """Phase 3: parse the CONNECT request and establish the tunnel."""
        header = await reader.readexactly(4)
        version, command, _, atyp = header

        if version != self.VERSION:
            await self._reply(writer, 0x01)  # general failure
            return

        # Parse the destination address according to the address type
        if atyp == 0x01:  # IPv4
            raw = await reader.readexactly(4)
            address = '.'.join(str(b) for b in raw)
        elif atyp == 0x03:  # Domain name
            length = (await reader.readexactly(1))[0]
            address = (await reader.readexactly(length)).decode('ascii')
        elif atyp == 0x04:  # IPv6
            raw = await reader.readexactly(16)
            groups = [f'{raw[i]:02x}{raw[i+1]:02x}' for i in range(0, 16, 2)]
            address = ':'.join(groups)
        else:
            await self._reply(writer, 0x08)  # address type not supported
            return

        port = struct.unpack('!H', await reader.readexactly(2))[0]

        if command != 0x01:  # Only CONNECT is implemented
            await self._reply(writer, 0x07)
            return

        logger.info(f'SOCKS5 CONNECT {address}:{port}')

        try:
            server_reader, server_writer = await asyncio.open_connection(
                address, port
            )
        except ConnectionRefusedError:
            await self._reply(writer, 0x05)
            return
        except OSError:
            await self._reply(writer, 0x04)
            return

        try:
            # BND.ADDR and BND.PORT should reflect the local socket address.
            # Most clients ignore them for CONNECT, but filling them in
            # correctly satisfies RFC 1928.
            local = server_writer.get_extra_info('sockname') or ('0.0.0.0', 0)
            await self._reply(writer, 0x00, local[0], local[1])

            await asyncio.gather(
                self._pipe(reader, server_writer),
                self._pipe(server_reader, writer),
            )
        finally:
            # _pipe only half-closes; the upstream socket itself must be
            # released here or it leaks for every tunnel.
            server_writer.close()
            with contextlib.suppress(OSError):
                await server_writer.wait_closed()

    async def _reply(self, writer, status, bind_addr='0.0.0.0', bind_port=0):
        """Send a SOCKS5 reply with the given status and bound address.

        ``bind_addr`` is encoded as IPv4 (ATYP 0x01) or IPv6 (ATYP 0x04); if
        it parses as neither, ``0.0.0.0`` is sent instead.
        """
        import socket

        try:
            packed_ip = socket.inet_aton(bind_addr)
            atyp = 0x01
        except OSError:
            try:
                # Drop a zone id such as "%eth0"; it has no wire encoding.
                packed_ip = socket.inet_pton(
                    socket.AF_INET6, bind_addr.partition('%')[0]
                )
                atyp = 0x04
            except OSError:
                packed_ip = bytes(4)
                atyp = 0x01

        writer.write(
            bytes([self.VERSION, status, 0x00, atyp])
            + packed_ip
            + struct.pack('!H', bind_port)
        )
        await writer.drain()

    async def _pipe(self, reader, writer):
        """Copy data from ``reader`` to ``writer`` until EOF, then half-close.

        Connection errors end the copy silently; ``write_eof()`` is attempted
        in every case so the opposite direction sees the stream end.
        """
        try:
            while True:
                data = await reader.read(8192)
                if not data:
                    break
                writer.write(data)
                await writer.drain()
        except (ConnectionResetError, BrokenPipeError, OSError):
            pass
        finally:
            with contextlib.suppress(Exception):
                if writer.can_write_eof():
                    writer.write_eof()

Quando o tipo de endereço é `0x03` (nome de domínio), o proxy resolve DNS ele mesmo via `asyncio.open_connection()`. Esta é a propriedade de privacidade definidora do proxy SOCKS5: o cliente envia o nome de domínio em vez de resolvê-lo localmente, o que previne que consultas DNS vazem para a rede local do cliente. Este é o mesmo comportamento em que o Chrome se baseia quando configurado com `--proxy-server=socks5://...`, como discutido em [Proxies SOCKS](./socks-proxies.md).

O método `_reply` preenche `BND.ADDR` e `BND.PORT` com o endereço real do socket local após uma conexão bem-sucedida, como a RFC 1928 requer. Muitas implementações SOCKS5 retornam `0.0.0.0:0` aqui porque a maioria dos clientes ignora esses campos para comandos CONNECT, mas preenchê-los corretamente não custa nada e evita uma violação de protocolo.

## Executando Ambos os Proxies

```python
async def main():
    """Create one HTTP and one SOCKS5 proxy and await both ``start()`` calls."""
    http_proxy = HTTPProxy(port=8080, username='user', password='pass')
    socks5_proxy = SOCKS5Proxy(port=1080, username='user', password='pass')

    # gather() awaits both start() coroutines concurrently.
    startups = (http_proxy.start(), socks5_proxy.start())
    await asyncio.gather(*startups)

# asyncio.run(main())
```

Você pode testá-los com curl:

```bash
# Proxy HTTP
curl -x http://user:pass@localhost:8080 http://httpbin.org/ip

# HTTPS através de proxy HTTP (túnel CONNECT)
curl -x http://user:pass@localhost:8080 https://httpbin.org/ip

# Proxy SOCKS5
curl --socks5 localhost:1080 --proxy-user user:pass https://httpbin.org/ip
```

## O que o Código Não Lida

Estas implementações omitem várias coisas com as quais proxies de produção lidam. Entender o que está faltando é tão instrutivo quanto entender o que está presente.

Não há limites de conexão. `asyncio.start_server` aceita conexões sem limite, então um único cliente abrindo milhares de conexões esgotaria descritores de arquivo. Proxies de produção usam semáforos ou pools de conexão para limitar concorrência.

Não há validação de destino. Ambos os proxies conectam a qualquer endereço que o cliente solicite, incluindo `127.0.0.1`, `169.254.169.254` (metadados cloud) e faixas de rede interna. Este é um vetor de Server-Side Request Forgery (SSRF). Proxies de produção mantêm listas de negação de faixas de endereços privados e link-local.

Não há logging de tráfego ou métricas. Proxies de produção rastreiam contagem de requisições, bytes transferidos, taxas de erro e percentis de latência, tipicamente exportando para Prometheus ou sistemas similares.

O proxy HTTP não adiciona um cabeçalho `Via`. A RFC 9110 Seção 7.6.3 requer que intermediários adicionem um campo `Via` às mensagens encaminhadas. Isso foi omitido por simplicidade, mas um proxy em conformidade com os padrões deve incluí-lo.

Nenhum dos proxies implementa shutdown gracioso. Quando o servidor para, túneis ativos são terminados abruptamente em vez de serem drenados. Proxies de produção rastreiam conexões ativas e aguardam que completem (com um prazo) antes de encerrar.

## Encadeamento de Proxy

Encadear proxies significa rotear tráfego através de múltiplos proxies em sequência: cliente para proxy A, proxy A para proxy B, proxy B para o servidor destino. Cada proxy na cadeia só conhece seus vizinhos imediatos, não o caminho completo.

O principal caso de uso é distribuir confiança. Se você não confia totalmente em nenhum provedor de proxy individual, encadear dois provedores significa que nenhum deles vê tanto seu IP real quanto seu destino. O tradeoff é latência: cada salto adiciona seu próprio tempo de setup de conexão e atraso de encaminhamento. Um único proxy tipicamente adiciona 50 a 100ms de overhead. Dois proxies aproximadamente dobram isso, e três proxies podem empurrar o overhead total além de 300ms.

Além de dois saltos, o ganho marginal de privacidade diminui enquanto latência e probabilidade de falha aumentam. A maioria das configurações práticas usa um ou dois proxies. O Tor usa três relays (guard, middle, exit) porque seu modelo de ameaça assume que alguns relays estão comprometidos, mas o Tor aceita a penalidade de latência como um tradeoff de design explícito.

```
Client --> Proxy A (SOCKS5) --> Proxy B (SOCKS5) --> Target
           vê: IP do cliente       vê: IP do Proxy A
           vê: endereço do Proxy B  vê: endereço do destino
```

Encadear um proxy SOCKS5 através de outro proxy SOCKS5 funciona fazendo o proxy A tratar o proxy B como o destino. O cliente conecta ao proxy A e envia uma requisição CONNECT para o endereço do proxy B. Uma vez que esse túnel é estabelecido, o cliente envia um segundo handshake SOCKS5 através do túnel, desta vez solicitando o destino real. O proxy A vê tráfego fluindo para o proxy B mas não pode lê-lo se a conexão interna estiver criptografada.

## Referências

- RFC 1928: SOCKS Protocol Version 5 - https://datatracker.ietf.org/doc/html/rfc1928
- RFC 1929: Username/Password Authentication for SOCKS V5 - https://datatracker.ietf.org/doc/html/rfc1929
- RFC 9110: HTTP Semantics - https://www.rfc-editor.org/rfc/rfc9110.html
- RFC 9112: HTTP/1.1 - https://www.rfc-editor.org/rfc/rfc9112.html
- OWASP SSRF Prevention Cheat Sheet - https://cheatsheetseries.owasp.org/cheatsheets/Server_Side_Request_Forgery_Prevention_Cheat_Sheet.html
- mitmproxy (Python HTTPS intercepting proxy) - https://mitmproxy.org/


================================================
FILE: docs/pt/deep-dive/network/http-proxies.md
================================================
# Arquitetura de Proxy HTTP/HTTPS

Proxies HTTP são o protocolo de proxy mais comum na internet. Quase toda rede corporativa os utiliza, e a maioria dos serviços de proxy comerciais os oferece como opção padrão. Eles operam na Camada 7 (Aplicação) do modelo OSI, o que significa que entendem HTTP e podem analisar, modificar, cachear e filtrar tráfego. Essa mesma integração profunda com o protocolo também é sua maior limitação: só podem lidar com tráfego HTTP, revelam uso de proxy através de cabeçalhos identificáveis, e não podem fazer proxy de UDP, o que deixa WebRTC e DNS vulneráveis a vazamentos.

Este documento cobre como proxies HTTP funcionam no nível do protocolo, o método CONNECT para tunelamento HTTPS, mecanismos de autenticação e as implicações de protocolos modernos como HTTP/2 e HTTP/3.

!!! info "Navegação do Módulo"
    - [Fundamentos de Rede](./network-fundamentals.md): TCP/IP, UDP, modelo OSI
    - [Proxies SOCKS](./socks-proxies.md): Alternativa agnóstica a protocolo
    - [Detecção de Proxy](./proxy-detection.md): Como evitar detecção

    Para configuração prática, veja [Configuração de Proxy](../../features/configuration/proxy.md).

## Como Proxies HTTP Funcionam

Um proxy HTTP fica entre o cliente e o servidor destino, mantendo duas conexões TCP separadas: uma do cliente para o proxy, e outra do proxy para o servidor destino. Como o proxy entende HTTP, ele pode tomar decisões inteligentes sobre o tráfego que passa por ele.

### Fluxo de Requisição

Quando um cliente é configurado para usar um proxy HTTP, ele envia a requisição HTTP completa para o proxy em vez de diretamente para o servidor destino. A diferença chave de uma requisição direta é que a linha de requisição inclui a URI absoluta, não apenas o caminho. Por exemplo, em vez de `GET /page HTTP/1.1`, o cliente envia `GET http://example.com/page HTTP/1.1`. Isso diz ao proxy para onde encaminhar a requisição.

```mermaid
sequenceDiagram
    participant Client as Navegador Cliente
    participant Proxy as Proxy HTTP
    participant Server as Servidor Destino

    Client->>Proxy: GET http://example.com/page HTTP/1.1<br/>Host: example.com<br/>User-Agent: Mozilla/5.0
    Note over Client,Proxy: Conexão TCP #1

    Note over Proxy: Analisa requisição, verifica auth,<br/>verifica cache, aplica regras

    Proxy->>Server: GET /page HTTP/1.1<br/>Host: example.com<br/>Via: 1.1 proxy.example.com<br/>X-Forwarded-For: 192.168.1.100
    Note over Proxy,Server: Conexão TCP #2

    Server->>Proxy: HTTP/1.1 200 OK<br/>[corpo da resposta]

    Note over Proxy: Cacheia resposta se permitido,<br/>filtra conteúdo, registra transação

    Proxy->>Client: HTTP/1.1 200 OK<br/>Via: 1.1 proxy.example.com<br/>[corpo possivelmente modificado]
```

O proxy recebe a requisição HTTP completa, analisa o método, URL e cabeçalhos, e decide o que fazer. Ele pode verificar credenciais de autenticação, verificar a URL contra uma lista de controle de acesso, procurar uma cópia em cache do recurso e modificar cabeçalhos antes de encaminhar. Então abre uma conexão TCP separada para o servidor destino e envia a requisição, potencialmente com cabeçalhos alterados.

Quando a resposta chega, o proxy pode cacheá-la de acordo com a semântica HTTP (`Cache-Control`, `ETag`), filtrar o conteúdo para malware ou palavras-chave bloqueadas, comprimi-la se o cliente suportar, e registrar a transação antes de encaminhar a resposta de volta ao cliente.

### Cabeçalhos de Proxy e Privacidade

Proxies HTTP comumente adicionam cabeçalhos que revelam sua presença e o endereço IP real do cliente. O cabeçalho `Via` (RFC 9110) identifica o proxy na cadeia de requisição. O cabeçalho `X-Forwarded-For` contém o IP original do cliente, frequentemente formando uma cadeia se múltiplos proxies estão envolvidos. O cabeçalho `X-Forwarded-Proto` indica se a requisição original era HTTP ou HTTPS. Alguns proxies também adicionam `X-Real-IP` como alternativa mais simples ao `X-Forwarded-For`.

Também existe um cabeçalho padronizado `Forwarded` (RFC 7239) que combina toda essa informação em um único campo, por exemplo `Forwarded: for=192.168.1.100;proto=http;by=proxy.example.com`. Na prática, a maioria dos proxies ainda usa as variantes `X-Forwarded-*` já que têm suporte mais amplo.

Clientes legados e alguns navegadores mais antigos também podem enviar um cabeçalho `Proxy-Connection: keep-alive` em vez de `Connection: keep-alive` ao rotear através de um proxy. Este cabeçalho é um indicador bem conhecido de uso de proxy e um sinal clássico de detecção.

!!! danger "Detecção por Cabeçalho"
    Sistemas de detecção procuram a presença de cabeçalhos `Via`, `X-Forwarded-For` ou `Forwarded` para confirmar uso de proxy. Se `X-Real-IP` não corresponde ao IP de conexão, o proxy é confirmado. Proxies sofisticados podem remover esses cabeçalhos, mas muitos serviços de proxy comerciais os deixam por padrão. Sempre verifique o comportamento do seu proxy usando uma ferramenta como [browserleaks.com/ip](https://browserleaks.com/ip).

### Capacidades e Limitações

Como proxies HTTP analisam e entendem o protocolo HTTP, eles podem ler e modificar cada parte de uma requisição e resposta HTTP não criptografada: URLs, cabeçalhos, cookies e corpos. Isso permite que cacheiem respostas inteligentemente, filtrem conteúdo por URL ou palavra-chave, injetem ou removam cabeçalhos, autentiquem usuários e registrem todo o tráfego em detalhes.

O tradeoff é que esse acoplamento profundo com HTTP significa que o proxy é limitado a tráfego HTTP. Ele não pode nativamente fazer proxy de FTP, SSH, SMTP ou protocolos personalizados (embora o método CONNECT, descrito abaixo, forneça uma solução de tunelamento para qualquer protocolo baseado em TCP). Não tem suporte para UDP, o que significa que tráfego WebRTC, consultas DNS e QUIC/HTTP/3 o ignoram completamente. E inspecionar conteúdo HTTPS requer terminação TLS, que quebra a criptografia de ponta a ponta.

## O Método CONNECT: Tunelamento HTTPS

O método CONNECT (RFC 9110, Seção 9.3.6) resolve um problema fundamental: como um proxy HTTP pode encaminhar tráfego criptografado que não pode ler? A resposta é tornar-se um túnel TCP cego.

Quando um cliente quer acessar um site HTTPS através de um proxy, ele envia uma requisição `CONNECT` pedindo ao proxy para estabelecer uma conexão TCP bruta para o destino. Uma vez que o proxy confirma que o túnel está estabelecido, ele para de ser um proxy HTTP completamente e se torna um relay TCP transparente na Camada 4, encaminhando bytes em ambas as direções sem interpretá-los.

```mermaid
sequenceDiagram
    participant Client
    participant Proxy
    participant Server

    Client->>Proxy: CONNECT example.com:443 HTTP/1.1<br/>Host: example.com:443<br/>Proxy-Authorization: Basic dXNlcjpwYXNz
    Note over Client,Proxy: Requisição HTTP não criptografada

    Proxy->>Server: TCP three-way handshake
    Note over Proxy,Server: Conexão TCP estabelecida

    Proxy->>Client: HTTP/1.1 200 Connection Established

    Note right of Proxy: Proxy agora é um relay<br/>TCP transparente (Camada 4)

    Client->>Server: TLS ClientHello
    Note over Client,Server: Handshake TLS (proxy vê<br/>isso em texto plano)
    Server->>Client: TLS ServerHello, Certificate

    Client->>Server: Requisição HTTP/2 criptografada
    Server->>Client: Resposta HTTP/2 criptografada

    Note over Proxy: Proxy encaminha cegamente<br/>todos os dados criptografados
```

### A Requisição CONNECT

A requisição CONNECT é mínima. O método é `CONNECT`, a URI de requisição é o `host:port` de destino (não um caminho), e inclui autenticação se o proxy a requer. Não há corpo de requisição. O proxy valida as credenciais, verifica suas regras de controle de acesso e abre uma conexão TCP para o host e porta especificados. Se tudo for bem-sucedido, ele envia de volta `HTTP/1.1 200 Connection Established` seguido por uma linha em branco. Após essa linha em branco, a conversação HTTP termina e o proxy se torna um relay transparente.

### Visibilidade Após CONNECT

Uma vez que o túnel é estabelecido, a visibilidade do proxy é limitada. Ele sabe o hostname e porta de destino da requisição CONNECT. Ele pode observar o timing da conexão (quando foi estabelecida e por quanto tempo), o volume de dados transferidos em cada direção, e quando qualquer lado termina a conexão. Ele também pode observar o handshake TLS que se segue, o que é particularmente relevante.

A mensagem TLS ClientHello, enviada imediatamente após o túnel ser estabelecido, é transmitida em texto plano. O proxy (e qualquer observador de rede) pode ler diretamente a versão TLS, a lista completa de cipher suites suportadas, as extensões e seus parâmetros, as curvas elípticas oferecidas, e a extensão SNI (Server Name Indication) que contém o hostname destino. Esta é exatamente a informação usada para TLS fingerprinting (JA3/JA4). Veja [Network Fingerprinting](../fingerprinting/network-fingerprinting.md) para detalhes.

O que o proxy não pode ver são os dados de aplicação criptografados: métodos HTTP, URLs, cabeçalhos de requisição e resposta, cookies, tokens de sessão e conteúdo de resposta ficam todos criptografados dentro do túnel TLS.

!!! note "SNI e Encrypted Client Hello (ECH)"
    A extensão SNI no ClientHello revela o hostname destino em texto plano, o que é redundante com a requisição CONNECT no cenário de proxy, mas relevante para outros observadores de rede. Encrypted Client Hello (ECH), atualmente sendo implantado, visa criptografar o SNI para resolver esse vazamento. No entanto, a adoção do ECH ainda é limitada e requer suporte tanto do cliente quanto do servidor.

### CONNECT para Protocolos Não-HTTPS

Embora CONNECT seja usado principalmente para HTTPS, ele pode tunelar qualquer protocolo baseado em TCP. Uma conexão IMAPS na porta 993, uma conexão SSH na porta 22 ou FTP-over-TLS na porta 990 todos funcionam através de um túnel CONNECT. O proxy não precisa entender esses protocolos porque após o túnel ser estabelecido, ele está simplesmente retransmitindo bytes.

Na prática, muitos proxies corporativos restringem CONNECT à porta 443 (HTTPS) para prevenir abuso. Tentar `CONNECT example.com:22` para SSH frequentemente retornará `403 Forbidden`.

### O Dilema do HTTPS

Proxies HTTP enfrentam uma escolha fundamental com tráfego criptografado. Com a abordagem de túnel CONNECT, a criptografia de ponta a ponta é preservada, o cliente verifica o certificado do servidor diretamente, e certificate pinning funciona normalmente. Mas o proxy não pode inspecionar, cachear ou filtrar o conteúdo criptografado.

A alternativa é terminação TLS (MITM), onde o proxy descriptografa o tráfego HTTPS, inspeciona o conteúdo e re-criptografa antes de encaminhar. Isso requer instalar o certificado CA do proxy no cliente, quebra a criptografia de ponta a ponta e é detectável através de certificate pinning e logs de Certificate Transparency. A maioria dos proxies corporativos usa essa abordagem para filtragem de conteúdo e scanning de segurança, enquanto proxies focados em privacidade usam túneis CONNECT cegos.

Para web scraping e automação, essa distinção importa para TLS fingerprinting. Se o proxy realiza terminação TLS, o fingerprint TLS que o servidor destino vê pertence ao proxy, não ao seu navegador. Se você está usando um túnel CONNECT, o fingerprint é preservado de ponta a ponta. Dependendo da sua estratégia de evasão, uma abordagem pode ser preferível à outra.

| Aspecto | HTTP (sem CONNECT) | HTTPS (túnel CONNECT) |
|---------|--------------------|-----------------------|
| Visibilidade do proxy | Requisição/resposta HTTP completa | Apenas host:porta destino + TLS ClientHello |
| Criptografia | Nenhuma (a menos que terminação TLS) | TLS de ponta a ponta |
| Caching | Sim, baseado em semântica HTTP | Não (conteúdo criptografado) |
| Filtragem de conteúdo | Sim | Não (apenas bloqueio baseado em hostname) |
| Modificação de cabeçalhos | Sim | Não (cabeçalhos criptografados) |
| Visibilidade de URL | URL completa | Apenas hostname (via CONNECT e SNI) |
| Suporte a protocolo | Apenas HTTP | Qualquer protocolo sobre TCP |

## Proxies HTTPS (TLS para o Proxy)

Uma distinção que vale esclarecer é a diferença entre fazer proxy de tráfego HTTPS e conectar ao próprio proxy via HTTPS. Quando você configura `--proxy-server=https://proxy:port` em vez de `http://proxy:port`, a conexão entre seu navegador e o proxy é criptografada com TLS. Isso protege suas credenciais de autenticação do proxy de serem interceptadas na rede local e esconde até o hostname CONNECT de observadores locais, já que está encapsulado dentro da conexão TLS para o proxy.

O Chrome suporta isso via o esquema `https://` em `--proxy-server`. É particularmente importante ao usar um proxy em redes não confiáveis (Wi-Fi público, hospedagem compartilhada), onde a conexão entre você e o proxy é o elo mais fraco.

## Autenticação

A autenticação de proxy HTTP usa códigos de status e cabeçalhos HTTP padrão, seguindo a RFC 9110. Quando um proxy requer autenticação, ele responde com `407 Proxy Authentication Required` e um cabeçalho `Proxy-Authenticate` indicando quais esquemas de autenticação suporta. O cliente então retransmite a requisição com um cabeçalho `Proxy-Authorization` contendo as credenciais.

### Esquemas de Autenticação

Existem vários esquemas de autenticação, cada um com características de segurança diferentes.

**Basic** (RFC 7617) é o mais simples. O cliente envia `Proxy-Authorization: Basic <base64(username:password)>`. Base64 é uma codificação, não criptografia, então as credenciais são trivialmente reversíveis. Qualquer um que intercepte o cabeçalho pode decodificá-lo instantaneamente e reusá-lo indefinidamente já que não há proteção contra replay. Auth Basic deve ser usado apenas sobre conexões criptografadas com TLS.

**Digest** (RFC 7616) usa um mecanismo de challenge-response. O proxy envia um nonce aleatório, e o cliente computa um hash do username, password, nonce e URI da requisição. A senha nunca é transmitida, e o nonce fornece proteção contra replay. A versão original usa MD5, que é rápido o suficiente para brute-force eficiente, embora a RFC 7616 tenha adicionado suporte a SHA-256. Auth Digest é raramente implementado por serviços de proxy modernos.

**NTLM** é o protocolo proprietário de challenge-response da Microsoft, comum em ambientes corporativos Windows. Usa uma negociação de três etapas (Tipo 1 negociação, Tipo 2 challenge, Tipo 3 autenticação) e integra com Active Directory para single sign-on. NTLMv1 usa DES (quebrado), e NTLMv2 usa HMAC-MD5 (considerado fraco pelos padrões modernos). A Microsoft recomenda Kerberos sobre NTLM para novas implantações. NTLM é vinculado à conexão, o que significa que quebra com multiplexação HTTP/2.

**Negotiate** (RFC 4559) usa SPNEGO para selecionar entre Kerberos e NTLM, preferindo Kerberos. Kerberos oferece a segurança mais forte (criptografia AES, autenticação mútua, tickets com tempo limitado) mas requer infraestrutura Active Directory, máquinas no domínio e sincronização precisa de relógio. Em automação de navegador, Kerberos é difícil de configurar programaticamente.

| Esquema | Segurança | Mecanismo | Notas Práticas |
|---------|-----------|-----------|----------------|
| Basic | Baixa | Credenciais codificadas em Base64 | Suporte universal. Usar apenas sobre TLS. |
| Digest | Média | Challenge-response com MD5/SHA-256 | Proteção contra replay via nonce. Raramente implementado. |
| NTLM | Média | Challenge-response (NT hash) | SSO Windows. Proprietário, vulnerabilidades conhecidas. |
| Negotiate | Alta | Kerberos/SPNEGO | Mais forte. Requer Active Directory. |

### Autenticação no Pydoll

O Chrome não suporta credenciais de proxy inline na flag `--proxy-server`. Escrever `--proxy-server=http://user:pass@proxy:port` não funciona: o Chrome silenciosamente ignora a porção `user:pass` e conecta sem autenticação.

O Pydoll resolve isso transparentemente através do seu `ProxyManager`. Quando você fornece uma URL de proxy com credenciais embutidas, o Pydoll extrai o username e password, remove-os da URL antes de passá-la ao Chrome, e usa o domínio CDP Fetch para interceptar respostas `407 Proxy Authentication Required` e automaticamente fornecer as credenciais via `Fetch.continueWithAuth`. Essa abordagem funciona para todos os esquemas de autenticação que o Chrome suporta (Basic, Digest, NTLM, Negotiate) sem o Pydoll precisar implementar a lógica específica do protocolo.

```python
from pydoll.browser import Chrome
from pydoll.browser.options import ChromiumOptions

options = ChromiumOptions()
# Pydoll extrai credenciais, limpa a URL e lida com 407 via CDP
options.add_argument('--proxy-server=http://user:pass@proxy.example.com:8080')

async with Chrome(options=options) as browser:
    tab = await browser.start()
    await tab.go_to('https://example.com')
```

!!! tip "Melhores Práticas de Autenticação"
    Sempre use conexões de proxy criptografadas com TLS (proxy HTTPS ou túnel SSH) para proteger credenciais em trânsito. Prefira Bearer tokens para proxies de API já que são revogáveis e com tempo limitado. Nunca use auth Basic sobre uma conexão HTTP não criptografada para o proxy. Não codifique credenciais no código-fonte; use variáveis de ambiente.

## Protocolos Modernos e Proxy

### HTTP/2

HTTP/2 introduziu multiplexação, enquadramento binário e compressão de cabeçalhos HPACK, que mudam fundamentalmente como proxies lidam com conexões. No HTTP/1.1, cada requisição ocupa uma conexão sequencialmente (pipelining existe mas é desabilitado na prática, então navegadores contornam isso abrindo seis conexões paralelas por host). No HTTP/2, uma única conexão TCP carrega múltiplos streams concorrentes, cada um com sua própria requisição e resposta.

Para proxies, isso significa gerenciar IDs de stream, prioridades e janelas de controle de fluxo em ambos os lados da conexão. O proxy deve traduzir entre IDs de stream no lado do cliente e do servidor, manter árvores de prioridade e lidar com controle de fluxo por stream. Isso é significativamente mais complexo que o simples encaminhamento de requisição-resposta do HTTP/1.1.

Da perspectiva de fingerprinting, metadados de stream HTTP/2 (tamanhos de janela, configurações de prioridade, ordenação de cabeçalhos dentro do HPACK) podem fazer fingerprint de clientes individuais mesmo quando múltiplos usuários compartilham o mesmo proxy.

| Recurso | HTTP/1.1 | HTTP/2 |
|---------|----------|--------|
| Conexões | Sequencial por conexão (navegadores abrem 6 em paralelo) | Múltiplos streams concorrentes sobre uma conexão |
| Multiplexação | Não (head-of-line blocking) | Sim (streams concorrentes; head-of-line blocking persiste apenas no nível TCP) |
| Compressão de Cabeçalhos | Nenhuma | HPACK |
| Complexidade do Proxy | Encaminhamento simples de requisição/resposta | Mapeamento de ID de stream, gerenciamento de prioridade |

No HTTP/2, o método CONNECT foi estendido pela RFC 8441 para suportar um pseudo-cabeçalho `:protocol`, habilitando tunelamento WebSocket e outras atualizações de protocolo diretamente dentro de streams HTTP/2 sem requerer conexões separadas.

### HTTP/3 e QUIC

HTTP/3 roda sobre QUIC (RFC 9000), que é um protocolo de transporte baseado em UDP. Isso introduz desafios fundamentais para proxies HTTP. Proxies HTTP tradicionais operam sobre TCP e não podem lidar com o tráfego UDP do QUIC. Conexões QUIC podem sobreviver a mudanças de IP (migração de conexão), complicando o gerenciamento de sessão do proxy. E QUIC criptografa quase tudo, incluindo metadados de nível de transporte que eram anteriormente visíveis.

Fazer proxy de QUIC requer CONNECT-UDP (RFC 9298), um novo método para estabelecer túneis UDP através de proxies HTTP. A maioria dos proxies tradicionais, incluindo muitos serviços comerciais, ainda não suporta isso. Navegadores fazem fallback para HTTP/2 sobre TCP quando o proxy não suporta QUIC, o que significa que mais metadados podem vazar do que esperado se você estava contando com o transporte criptografado do HTTP/3.

Em cenários de automação, considere desabilitar QUIC com a flag do Chrome `--disable-quic` para forçar HTTP/2 sobre TCP. Isso garante que todo tráfego passe pelo seu proxy e elimina o risco de vazamentos baseados em UDP do QUIC.

| Aspecto | TCP + TLS (HTTP/1.1, HTTP/2) | QUIC/UDP (HTTP/3) |
|---------|------------------------------|-------------------|
| Transporte | TCP (orientado a conexão) | UDP (sem conexão) |
| Handshake | TCP + TLS separados (2 RTT) | Combinado (0-1 RTT) |
| Head-of-line blocking | Sim (nível TCP) | Não (apenas nível de stream) |
| Migração de conexão | Não suportado | Suportado (sobrevive a mudanças de IP) |
| Compatibilidade com proxy | Excelente | Limitada (requer suporte a relay UDP) |

!!! warning "Downgrade de Protocolo"
    Quando um proxy não suporta HTTP/3, o navegador silenciosamente faz fallback para HTTP/2 ou HTTP/1.1. Este downgrade pode expor metadados (cabeçalhos, padrões de timing) que HTTP/3 teria criptografado. Monitore seu tráfego para entender sua versão de protocolo real, e esteja ciente de que a adoção do HTTP/3 varia por região e CDN.

## Resumo

Proxies HTTP fornecem funcionalidade rica ao custo de escopo limitado e preocupações de privacidade. Eles podem inspecionar, cachear e filtrar tráfego HTTP, mas não podem lidar com protocolos não-HTTP, tráfego UDP ou conteúdo HTTPS sem quebrar a criptografia. Sua presença é revelada através de cabeçalhos identificáveis a menos que explicitamente removidos.

Para automação, o túnel CONNECT é o recurso mais relevante: ele preserva a criptografia TLS de ponta a ponta enquanto dá ao proxy apenas visibilidade em nível de hostname. O Pydoll lida com autenticação de proxy transparentemente através do domínio CDP Fetch, suportando todos os esquemas que o Chrome implementa.

### Proxy HTTP vs SOCKS5

| Necessidade | Proxy HTTP | SOCKS5 |
|-------------|------------|--------|
| Filtragem de conteúdo | Sim | Não |
| Bloqueio baseado em URL | Sim | Não (apenas IP:porta) |
| Caching | Sim | Não |
| Suporte UDP | Não | Sim |
| Flexibilidade de protocolo | Apenas HTTP (CONNECT para tunelamento TCP) | Qualquer TCP/UDP |
| Privacidade | Baixa (analisa HTTP, adiciona cabeçalhos reveladores) | Média (não analisa ou modifica tráfego, mas conteúdo não criptografado ainda é visível ao operador) |
| Resolução DNS | Proxy resolve (remoto) | Depende (SOCKS5: tipicamente cliente resolve, SOCKS5h: proxy resolve. Chrome sempre resolve remotamente para SOCKS5.) |

Para ambientes corporativos que precisam de controle de conteúdo e caching, proxies HTTP são a escolha certa. Para automação focada em privacidade, SOCKS5 oferece melhor stealth e flexibilidade de protocolo. Para segurança máxima, use SOCKS5 sobre um túnel SSH ou VPN.

**Próximos passos:**

- [Proxies SOCKS](./socks-proxies.md): Proxy agnóstico a protocolo na camada de sessão
- [Fundamentos de Rede](./network-fundamentals.md): TCP/IP, UDP, WebRTC
- [Detecção de Proxy](./proxy-detection.md): Como proxies são detectados e como evitar
- [Configuração de Proxy](../../features/configuration/proxy.md): Configuração prática de proxy no Pydoll
- [Network Fingerprinting](../fingerprinting/network-fingerprinting.md): Fingerprinting TCP/IP e TLS

## Referências

- RFC 9110: HTTP Semantics (2022; em conjunto com as RFCs 9111 e 9112, substitui as RFCs 7230-7235) - https://www.rfc-editor.org/rfc/rfc9110.html
- RFC 9112: HTTP/1.1 (2022) - https://www.rfc-editor.org/rfc/rfc9112.html
- RFC 9113: HTTP/2 (2022, substitui RFC 7540) - https://www.rfc-editor.org/rfc/rfc9113.html
- RFC 9114: HTTP/3 (2022) - https://www.rfc-editor.org/rfc/rfc9114.html
- RFC 9000: QUIC Transport Protocol (2021) - https://www.rfc-editor.org/rfc/rfc9000.html
- RFC 9298: Proxying UDP in HTTP (CONNECT-UDP, 2022) - https://www.rfc-editor.org/rfc/rfc9298.html
- RFC 8441: Bootstrapping WebSockets with HTTP/2 (2018) - https://www.rfc-editor.org/rfc/rfc8441.html
- RFC 7617: Basic Authentication (2015) - https://www.rfc-editor.org/rfc/rfc7617.html
- RFC 7616: Digest Authentication (2015) - https://www.rfc-editor.org/rfc/rfc7616.html
- RFC 7239: Forwarded HTTP Extension (2014) - https://www.rfc-editor.org/rfc/rfc7239.html
- RFC 4559: Negotiate Authentication (2006) - https://www.rfc-editor.org/rfc/rfc4559.html
- MDN Web Docs: Proxy servers and tunneling - https://developer.mozilla.org/en-US/docs/Web/HTTP/Proxy_servers_and_tunneling
- Chrome DevTools Protocol: Fetch domain - https://chromedevtools.github.io/devtools-protocol/tot/Fetch/


================================================
FILE: docs/pt/deep-dive/network/index.md
================================================
# Análise Profunda de Rede e Segurança

**Bem-vindo ao fundamento da comunicação moderna da internet, o campo de batalha do anonimato, detecção e evasão.**

Protocolos de rede são a infraestrutura invisível que alimenta cada requisição web, conexão de navegador e script de automação. Entendê-los profundamente transforma você de um **usuário de ferramenta** em um **engenheiro de protocolo** capaz de navegar pelos mais sofisticados sistemas anti-bot.

## Por que a Arquitetura de Rede Importa

Quando você executa `tab.go_to('https://example.com')`, uma complexa sinfonia de protocolos entra em ação:

1.  **Resolução DNS** traduz o domínio para um endereço IP (potencialmente vazando sua intenção)
2.  **Handshake TCP** estabelece a conexão (revelando seu SO através de características de pacote)
3.  **Negociação TLS** protege o canal (aplicando fingerprinting no seu navegador via suítes de cifras)
4.  **Requisição HTTP/2** busca a página (expondo a versão do navegador através de frames SETTINGS)
5.  **Descoberta WebRTC** pode sondar seu IP real (contornando completamente sua VPN)

**Cada passo é uma oportunidade para detecção ou evasão.**

!!! danger "A Camada de Rede Não Pode Mentir"
    Diferente das características em nível de navegador (que o JavaScript pode modificar), os fingerprints de nível de rede estão **gravados no kernel do SO e na pilha TCP/IP**. Um desencontro aqui, como um navegador Chrome enviando opções TCP de Linux enquanto alega ser Windows, é instantaneamente fatal para a automação furtiva.

## A Arquitetura da Privacidade na Internet

Este módulo explora os **fundamentos técnicos** que tornam a privacidade possível (e quebrável) na internet moderna:

### A Realidade do Modelo OSI

```mermaid
graph TB
    subgraph "Camada de Aplicação 7"
        HTTP[Cabeçalhos HTTP/HTTPS]
        DNS[Consultas DNS]
    end
    
    subgraph "Camada de Apresentação 6"
        TLS[Fingerprinting TLS/SSL]
        Ciphers[Suítes de Cifras, Extensões]
    end
    
    subgraph "Camadas de Sessão/Transporte 5-4"
        SOCKS[Protocolo Proxy SOCKS]
        TCP[Janela TCP, Opções, ISN]
    end
    
    subgraph "Camada de Rede 3"
        IP[IP TTL, Fragmentação]
        Routing[Roteamento de Pacotes, Saltos]
    end
    
    HTTP --> TLS
    DNS --> TLS
    TLS --> SOCKS
    Ciphers --> TCP
    SOCKS --> IP
    TCP --> Routing
```

**Cada camada é tanto um escudo quanto uma vulnerabilidade:**

- **Camada 7 (Aplicação)**: Proxies podem ler e modificar seu tráfego HTTP
- **Camada 6 (Apresentação)**: Criptografia TLS protege o conteúdo, mas vaza metadados
- **Camada 4 (Transporte)**: Características TCP traem seu sistema operacional
- **Camada 3 (Rede)**: Endereços IP revelam sua localização física

## O que Você Vai Dominar

Este módulo está estruturado como uma **progressão técnica** de fundamentos até a exploração avançada:

### 1. Fundamentos de Rede
**[Fundamentos de Rede](./network-fundamentals.md)**

Construa a base: entenda os protocolos que movem a internet e como eles revelam, ou escondem, sua identidade.

- **Camadas do Modelo OSI** e suas implicações para fingerprinting
- **TCP vs UDP**: Por que seu proxy pode vazar tráfego UDP
- **Vazamento de IP via WebRTC**: A ameaça oculta nos navegadores modernos
- **Características da pilha de rede**: TTL, tamanho da janela, ordem das opções

**Por que começar aqui**: Sem esta base, a configuração de proxy é **"programação de culto à carga"** (cargo cult programming), copiando comandos sem entender por que funcionam (ou não).

### 2. Proxies HTTP/HTTPS
**[Proxies HTTP/HTTPS](./http-proxies.md)**

Domine o protocolo de proxy mais comum e entenda suas limitações fundamentais.

- **Operação de proxy HTTP**: Encaminhamento de requisições, cache, injeção de cabeçalho
- **Tunelamento CONNECT**: Como o HTTPS "passa por um túnel" através de proxies HTTP
- **Complexidades do HTTP/2**: Multiplexação, prioridades de stream, fingerprinting de SETTINGS
- **HTTP/3 e QUIC**: Desafios de proxying baseado em UDP
- **Esquemas de autenticação**: Basic, Digest, NTLM, tokens Bearer

**Visão crítica**: Proxies HTTP operam na Camada 7 e, por isso, podem **ler, modificar e registrar** seu tráfego não criptografado. Para privacidade verdadeira, você precisa de criptografia **antes** que o proxy veja seus dados.

### 3. Proxies SOCKS
**[Proxies SOCKS](./socks-proxies.md)**

Entenda por que o SOCKS5 é o **padrão ouro** para automação consciente da privacidade.

- **SOCKS4 vs SOCKS5**: Evolução do protocolo e capacidades
- **Handshake SOCKS5**: Análise profunda do protocolo binário com estruturas de pacotes
- **Suporte UDP**: Jogos, VoIP e WebRTC sobre SOCKS5
- **Resolução DNS**: Por que o DNS no lado do proxy previne vazamentos
- **Por que SOCKS5 > proxies HTTP**: Comparação em nível de protocolo

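**Vantagem chave**: SOCKS opera na Camada 5 (Sessão), **abaixo** da camada de aplicação. Ele não interpreta nem modifica seu tráfego HTTP, apenas encaminha bytes para o IP e a porta de destino, o que reduz bastante a superfície de confiança (conteúdo não criptografado, porém, continua visível ao operador do proxy).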

### 4. Detecção de Proxy
**[Detecção de Proxy e Anonimato](./proxy-detection.md)**

Aprenda como sites **detectam o uso de proxy** e como evadir a detecção.

- **Níveis de anonimato**: Proxies transparentes, anônimos, elite
- **Bancos de dados de reputação de IP**: Como seu IP de datacenter te trai
- **Análise de cabeçalhos**: Cabeçalhos X-Forwarded-For, Via, Forwarded
- **Checagens de consistência**: DNS reverso, desencontros de geolocalização
- **Integração de fingerprinting de rede**: Combinando detecção de proxy com análise TCP/TLS

**Dura realidade**: A maioria dos proxies "anônimos" é trivialmente detectável. Furtividade verdadeira requer **proxies residenciais de elite** + **fingerprinting de navegador consistente** + **comportamento semelhante ao humano**.

### 5. Construindo Servidores Proxy
**[Construindo Seu Próprio Proxy](./build-proxy.md)**

Implemente proxies HTTP e SOCKS5 do zero em Python, a experiência de aprendizado definitiva.

- **Servidor proxy HTTP**: Implementação assíncrona completa com autenticação
- **Servidor proxy SOCKS5**: Manipulação de protocolo binário, tunelamento TCP
- **Encadeamento de proxy (Proxy chaining)**: Anonimato em camadas (e trocas de latência)
- **Pools de proxy rotativos**: Verificação de saúde, failover, balanceamento de carga
- **Tópicos avançados**: Proxies transparentes, interceptação SSL MITM

**Por que construir o seu**: Entender detalhes de implementação revela **vetores de ataque** e **oportunidades de otimização** invisíveis do exterior.

### 6. Considerações Legais e Éticas
**[Diretrizes Legais e Éticas](./proxy-legal.md)**

Navegue pelo campo minado legal do uso de proxy e automação web.

- **Conformidade regulatória**: GDPR, CFAA, leis internacionais
- **Termos de Serviço**: O que constitui violação
- **Diretrizes éticas**: robots.txt, limitação de taxa, transparência
- **Estudos de caso**: Precedentes legais (hiQ vs LinkedIn, QVC vs Resultly)
- **Quando evitar proxies**: Cenários de alto risco

**Aviso**: Esta é **informação educacional**, não aconselhamento jurídico. A lei varia muito por jurisdição e caso de uso. Consulte um advogado qualificado.

## O Paradoxo do Proxy

Aqui está a verdade desconfortável sobre proxies:

!!! warning "Proxies Não Te Tornam Anônimo. Eles Te Tornam **Diferente**"
    Um proxy muda seu endereço IP, mas ele também:
    
    - Adiciona **latência** (detectável via análise de tempo)
    - Reseta valores de **TTL** (revelando saltos do proxy)
    - Introduz desencontros de **fingerprint TCP** (SO do proxy ≠ seu SO)
    - Pode injetar **cabeçalhos** (X-Forwarded-For, Via)
    - Cria **inconsistências de geolocalização** (fuso horário do navegador ≠ localização do IP)
    
    Proxies são uma **ferramenta**, não uma solução. Furtividade verdadeira requer **consistência holística**.

## Pré-requisitos

Este é um **material avançado**. Você deve estar confortável com:

- Conceitos básicos de redes (endereços IP, portas, protocolos)
- Fundamentos de TCP/IP (three-way handshake, pacotes, roteamento)
- Programação Python assíncrona (asyncio, async/await)
- Básico do Pydoll (veja [Conceitos Principais](../../features/core-concepts.md))

**Se você é novo em redes**, recomendamos fortemente:

1.  Ler um guia de fundamentos de TCP/IP primeiro
2.  Experimentar com o Wireshark para visualizar o tráfego de rede
3.  Tentar os exemplos de código com capturas de pacotes rodando
4.  Construir os servidores proxy e testá-los localmente

## Integração com Outros Módulos

Arquitetura de rede não existe isoladamente. Ela se integra profundamente com:

- **[Fingerprinting](../fingerprinting/network-fingerprinting.md)**: Como características TCP/IP e TLS te identificam
- **[Configuração do Navegador](../../features/configuration/browser-preferences.md)**: Alinhando comportamento do navegador com características do proxy
- **[Camada de Conexão](../fundamentals/connection-layer.md)**: Como o Pydoll gerencia conexões WebSocket sobre proxies

## A Trilha de Aprendizagem

Recomendamos esta progressão:

**Fase 1: Fundação**

1.  Leia [Fundamentos de Rede](./network-fundamentals.md)
2.  Entenda o modelo OSI e as camadas de protocolo
3.  Aprenda sobre vazamentos WebRTC e tunelamento UDP

**Fase 2: Análise Profunda de Protocolo**

4.  Estude [Proxies HTTP/HTTPS](./http-proxies.md)
5.  Domine [Proxies SOCKS](./socks-proxies.md)
6.  Compare protocolos e entenda as trocas

**Fase 3: Pensamento Adversário**

7.  Explore [Detecção de Proxy](./proxy-detection.md)
8.  Aprenda técnicas de detecção da perspectiva do defensor
9.  Aplique estratégias de evasão

**Fase 4: Implementação Prática**

10. Construa servidores proxy de [Construindo Proxies](./build-proxy.md)
11. Capture e analise tráfego com Wireshark
12. Teste cadeias de proxy e estratégias de rotação

**Fase 5: Segurança Operacional**

13. Revise as diretrizes [Legais e Éticas](./proxy-legal.md)
14. Entenda os requisitos de conformidade
15. Desenvolva políticas de automação responsáveis


## A Filosofia

Conhecimento de rede e segurança é **poder fundamental**. Diferente de habilidades específicas de frameworks (que se tornam obsoletas), o conhecimento de protocolos é **atemporal**:

- TCP não mudou fundamentalmente desde a RFC 793 (1981)
- TLS constrói sobre conceitos do SSL (1995)
- HTTP/2 (2015) e HTTP/3 (2022) são evoluções, não revoluções

Domine esses fundamentos uma vez, e você entenderá **todo sistema baseado em rede** que encontrar pelo resto de sua carreira.

## Compromisso Ético

Antes de prosseguir, reconheça:

- Eu entendo que proxies podem ser usados tanto para fins legítimos quanto maliciosos
- Eu respeitarei os termos de serviço dos sites e o robots.txt
- Eu implementarei limitação de taxa e rastreamento respeitoso
- Eu não usarei este conhecimento para fraude, abuso ou atividades ilegais
- Eu consultarei aconselhamento jurídico quando incerto sobre conformidade

**Com grandes poderes vêm grandes responsabilidades.** Use este conhecimento com sabedoria.

---

## Pronto para Começar?

Comece sua jornada com **[Fundamentos de Rede](./network-fundamentals.md)** para construir a base, então progrida através dos módulos em ordem. Cada documento constrói sobre o anterior, criando um entendimento abrangente de arquitetura de rede para automação.

**É aqui que "script kiddies" se tornam engenheiros. Vamos começar.**

---

!!! info "Status da Documentação"
    Este módulo sintetiza conhecimento de RFCs, especificações de protocolo, pesquisa em segurança e testes do mundo real. Todo exemplo de código está pronto para produção. Se encontrar imprecisões ou tiver melhorias, contribuições são bem-vindas.

## Navegação Rápida

**Protocolos Principais:**

- [Fundamentos de Rede](./network-fundamentals.md) - TCP/IP, UDP, WebRTC
- [Proxies HTTP/HTTPS](./http-proxies.md) - Proxying de camada de aplicação
- [Proxies SOCKS](./socks-proxies.md) - Proxying de camada de sessão

**Tópicos Avançados:**

- [Detecção de Proxy](./proxy-detection.md) - Anonimato e evasão
- [Construindo Proxies](./build-proxy.md) - Implementação do zero
- [Legal e Ético](./proxy-legal.md) - Conformidade e responsabilidade

**Módulos Relacionados:**

- [Fingerprinting](../fingerprinting/index.md) - Técnicas de detecção
- [Configuração do Navegador](../../features/configuration/browser-options.md) - Configuração prática

================================================
FILE: docs/pt/deep-dive/network/network-fundamentals.md
================================================
# Fundamentos de Rede

Este documento cobre os protocolos de rede fundamentais que alimentam a internet e como eles podem expor ou proteger sua identidade em cenários de automação. Uma compreensão funcional de TCP, UDP, do modelo OSI e do WebRTC tornará a configuração de proxy muito menos misteriosa e muito mais eficaz.

!!! info "Navegação do Módulo"
    - [Visão Geral de Rede e Segurança](./index.md): Introdução ao módulo e trilha de aprendizado
    - [Proxies HTTP/HTTPS](./http-proxies.md): Proxy de camada de aplicação
    - [Proxies SOCKS](./socks-proxies.md): Proxy de camada de sessão

    Para uso prático do Pydoll, veja [Configuração de Proxy](../../features/configuration/proxy.md) e [Opções do Navegador](../../features/configuration/browser-options.md).

## A Pilha de Rede

Cada requisição HTTP que seu navegador faz viaja através de uma pilha de rede em camadas. Cada camada tem responsabilidades, protocolos e implicações de segurança específicas. Proxies operam em camadas diferentes, e a camada determina o que o proxy pode ver, modificar e ocultar. Características de rede em camadas inferiores podem aplicar fingerprinting no seu sistema real mesmo através de proxies, então entender a pilha ajuda você a ver onde ocorrem vazamentos de identidade e como preveni-los.

### O Modelo OSI

O modelo OSI (Open Systems Interconnection), desenvolvido pela ISO em 1984, fornece um framework conceitual para entender como os protocolos de rede interagem. As redes do mundo real usam o modelo TCP/IP (que antecede o OSI e tem apenas 4 camadas), mas a terminologia OSI permanece como a forma padrão de descrever onde os proxies operam e o que eles podem acessar.

```mermaid
graph TD
    L7[Layer 7: Application - HTTP, FTP, SMTP, DNS]
    L6[Layer 6: Presentation - Encryption, Compression]
    L5[Layer 5: Session - SOCKS]
    L4[Layer 4: Transport - TCP, UDP]
    L3[Layer 3: Network - IP, ICMP]
    L2[Layer 2: Data Link - Ethernet, WiFi]
    L1[Layer 1: Physical - Cables, Radio Waves]

    L7 --> L6 --> L5 --> L4 --> L3 --> L2 --> L1
```

A Camada 7 (Aplicação) é onde vivem os protocolos voltados ao usuário: HTTP, HTTPS, FTP, SMTP e DNS operam aqui. Esta camada contém os dados reais com os quais sua aplicação se importa, como documentos HTML, respostas JSON e transferências de arquivos. Proxies HTTP operam nesta camada, o que lhes dá visibilidade total sobre o conteúdo de requisição e resposta.

A Camada 6 (Apresentação) lida com tradução de formato de dados, criptografia e compressão. SSL/TLS é comumente associado a esta camada pelo seu papel de criptografia, embora na prática o TLS abranja as Camadas 4 a 6 e não se mapeie de forma limpa a nenhuma camada OSI específica. O que importa para automação é que a criptografia HTTPS acontece aqui, criptografando os dados da Camada 7 antes de descerem pela pilha.

A Camada 5 (Sessão) gerencia conexões entre aplicações. Proxies SOCKS operam aqui, abaixo da camada de aplicação mas acima da de transporte. Esta posição torna o SOCKS agnóstico a protocolo: ele pode proxyar qualquer protocolo da Camada 7 (HTTP, FTP, SMTP, SSH) sem precisar entender suas especificidades.

A Camada 4 (Transporte) fornece entrega de dados de ponta a ponta. TCP (orientado à conexão, confiável) e UDP (sem conexão, rápido) são os protocolos dominantes aqui. Esta camada lida com números de porta, controle de fluxo e correção de erros. Todos os proxies dependem, em última análise, da Camada 4 para a transmissão real de dados.

A Camada 3 (Rede) lida com roteamento e endereçamento entre redes. O IP (Internet Protocol) opera aqui, gerenciando endereços IP e decisões de roteamento. É aqui que seu endereço IP real reside, e onde os proxies tentam substituí-lo.

A Camada 2 (Enlace de Dados) gerencia a comunicação no mesmo segmento de rede físico. Ethernet, Wi-Fi e PPP operam aqui, lidando com endereços MAC e transmissão de frames. Endereços MAC são visíveis apenas no segmento de rede local e não são diretamente acessíveis por servidores remotos, embora possam ser expostos através de protocolos como IPv6 SLAAC (que incorpora o MAC no endereço).

A Camada 1 (Física) é o hardware real: cabos, ondas de rádio e níveis de voltagem. Raramente relevante para automação de software.

!!! tip "OSI vs TCP/IP"
    O modelo TCP/IP (4 camadas: Enlace, Internet, Transporte, Aplicação) é o que as redes realmente usam. O OSI (7 camadas) é uma ferramenta de ensino e modelo de referência. Quando as pessoas dizem "proxy de Camada 7", elas estão usando a terminologia OSI, mas a implementação real roda sobre TCP/IP.

### Como o Posicionamento da Camada Afeta os Proxies

A camada onde um proxy opera determina o que ele pode e o que não pode fazer.

Proxies HTTP/HTTPS operam na Camada 7 (Aplicação). Como eles entendem HTTP, podem ler e modificar URLs, cabeçalhos, cookies e corpos de requisição. Podem fazer cache de respostas de forma inteligente com base na semântica HTTP, filtrar conteúdo por URL ou palavra-chave e injetar cabeçalhos de autenticação. A contrapartida é que eles só entendem HTTP. Não podem proxyar FTP, SMTP, SSH ou outros protocolos, e inspecionar conteúdo HTTPS requer terminação TLS, o que significa descriptografar e recriptografar o tráfego.

Proxies SOCKS operam na Camada 5 (Sessão). Como ficam abaixo da camada de aplicação, são agnósticos a protocolo e podem proxyar qualquer protocolo da Camada 7 sem modificação. O tráfego HTTPS passa criptografado de ponta a ponta, já que o proxy SOCKS nunca precisa descriptografá-lo. O SOCKS5 também suporta UDP, permitindo proxyar consultas DNS, VoIP e outros protocolos baseados em UDP. A contrapartida é que proxies SOCKS não têm visibilidade dos dados da camada de aplicação: não podem fazer cache, filtrar por URL ou inspecionar conteúdo. Podem apenas filtrar por IP e porta.

!!! note "A Contrapartida Fundamental"
    Camadas mais altas (Camada 7) oferecem mais controle mas menos flexibilidade. Camadas mais baixas (Camada 5) oferecem menos controle mas mais flexibilidade. Escolha proxies HTTP quando precisar de controle de conteúdo, e proxies SOCKS quando precisar de flexibilidade de protocolo ou criptografia de ponta a ponta.

### O Problema de Vazamento de Camada

Mesmo com um proxy de Camada 7 perfeito, características de camadas inferiores podem expor sua identidade real. A pilha TCP do seu sistema operacional na Camada 4 tem um fingerprint único definido pelo tamanho da janela, ordem das opções e valores de TTL. Campos do cabeçalho IP na Camada 3, como TTL e comportamento de fragmentação, revelam seu SO e topologia de rede.

Por exemplo, se você configurar um proxy para apresentar um User-Agent de "Windows 10", mas o fingerprint TCP real do seu sistema Linux contradisser isso na Camada 4, sistemas de detecção sofisticados podem marcar essa inconsistência como um forte indicador de bot. É por isso que o fingerprinting em nível de rede (abordado em [Network Fingerprinting](../fingerprinting/network-fingerprinting.md)) é tão perigoso: ele opera abaixo da camada do proxy, expondo seu sistema real mesmo quando o proxy da camada de aplicação é impecável.

## TCP vs UDP

Na Camada 4 (Transporte), dois protocolos fundamentalmente diferentes dominam a comunicação na internet. Eles representam filosofias de design opostas: confiabilidade versus velocidade.

O TCP é orientado à conexão. Pense nele como uma ligação telefônica: você estabelece uma conexão, verifica se a outra parte está ouvindo, troca dados de forma confiável e, em seguida, desliga. Cada byte é confirmado, ordenado e tem entrega garantida. O UDP é sem conexão. Você envia seus dados e espera que cheguem. Sem handshake, sem confirmações, sem garantias. Apenas velocidade bruta com sobrecarga mínima.

| Característica | TCP | UDP |
|---------|-----|-----|
| Conexão | Orientado à conexão (handshake necessário) | Sem conexão (sem handshake) |
| Confiabilidade | Entrega garantida, pacotes ordenados | Entrega de melhor esforço, pacotes podem ser perdidos |
| Velocidade | Mais lento (sobrecarga dos mecanismos de confiabilidade) | Mais rápido (sobrecarga mínima) |
| Casos de Uso | Navegação web, transferência de arquivos, email | Streaming de vídeo, consultas DNS, jogos |
| Tamanho do Cabeçalho | 20 bytes mínimo (até 60 com opções) | 8 bytes fixo |
| Controle de Fluxo | Sim (janela deslizante, orientado pelo receptor) | Não (transmissor envia à vontade) |
| Controle de Congestionamento | Sim (desacelera quando a rede está congestionada) | Não (responsabilidade da aplicação) |
| Verificação de Erros | Extensiva (checksum + acknowledgments) | Básica (apenas checksum; opcional no IPv4, obrigatório no IPv6) |
| Ordenação | Pacotes reordenados se recebidos fora de sequência | Sem ordenação, pacotes entregues como recebidos |
| Retransmissão | Automática (pacotes perdidos são retransmitidos) | Nenhuma (aplicação deve tratar) |

### TCP e Proxies

Todos os protocolos de proxy (HTTP, HTTPS, SOCKS4, SOCKS5) usam TCP para seu canal de controle. Isso ocorre porque a autenticação de proxy e a troca de comandos exigem entrega garantida, protocolos de proxy têm sequências de comando estritas (handshake, depois auth, depois dados), e proxies precisam de conexões persistentes para rastrear o estado do cliente.

No entanto, o SOCKS5 também pode proxyar tráfego UDP, diferente do SOCKS4 ou de proxies HTTP. Isso torna o SOCKS5 essencial para proxyar consultas DNS, áudio/vídeo WebRTC, VoIP e protocolos de jogos.

!!! danger "UDP e Vazamento de IP"
    A maioria das conexões de navegador usa TCP (HTTP, WebSocket, etc.), mas o WebRTC usa UDP diretamente, contornando a configuração de proxy do navegador. Esta é a causa mais comum de vazamento de IP em automação de navegador com proxy: seu tráfego TCP passa pelo proxy enquanto seu tráfego UDP vaza seu IP real.

### O Handshake de Três Vias do TCP

Antes que quaisquer dados possam ser transmitidos, o TCP requer um handshake de três vias para estabelecer uma conexão. Esta negociação sincroniza números de sequência, acorda tamanhos de janela e estabelece o estado da conexão em ambas as pontas.

```mermaid
sequenceDiagram
    participant Client
    participant Server

    Client->>Server: SYN (Synchronize, seq=x)
    Note over Client,Server: Client requests connection

    Server->>Client: SYN-ACK (seq=y, ack=x+1)
    Note over Client,Server: Server acknowledges and sends its own SYN

    Client->>Server: ACK (ack=y+1)
    Note over Client,Server: Connection established, data transfer begins
```

O processo começa quando o cliente envia um pacote SYN (Synchronize) contendo um Número de Sequência Inicial (ISN) aleatório, por exemplo `seq=1000`. Junto com o ISN, opções TCP são negociadas: tamanho da janela, Tamanho Máximo de Segmento (MSS), timestamps e suporte a SACK.

O servidor responde com um SYN-ACK: ele escolhe seu próprio ISN aleatório (ex: `seq=5000`) e confirma o ISN do cliente definindo `ack=1001` (ISN do cliente + 1). Este único pacote tanto estabelece a direção servidor-para-cliente (SYN) quanto confirma a direção cliente-para-servidor (ACK). O servidor também retorna suas próprias opções TCP.

O cliente então envia um ACK final, confirmando o ISN do servidor (`ack=5001`). Neste ponto, a conexão está totalmente estabelecida em ambas as direções e a transmissão de dados pode começar.

O ISN é aleatorizado em vez de começar do zero para prevenir ataques de sequestro de TCP. Se ISNs fossem previsíveis, um atacante poderia injetar pacotes em uma conexão existente adivinhando os números de sequência. Sistemas modernos usam aleatoriedade criptográfica para seleção de ISN (RFC 6528).

### Fingerprinting TCP

O handshake TCP revela características que aplicam fingerprinting no seu sistema operacional. Diferentes SOs usam valores padrão diferentes para o tamanho inicial da janela, ordem das opções TCP, TTL (Time To Live), fator de escala da janela e comportamento de timestamp. Esses valores são definidos pelo kernel, não pelo navegador, então um proxy não pode alterá-los.

Aqui estão exemplos ilustrativos para sistemas operacionais modernos. Note que os valores reais variam entre versões de SO, configurações de kernel e ajustes de rede:

```
Windows 10/11 (modern builds):
    Window Size: 65535
    MSS: 1460
    Options: MSS, NOP, WS, NOP, NOP, SACK_PERM
    TTL: 128

Linux (kernel 5.x+, Ubuntu 20.04+):
    Window Size: 29200
    MSS: 1460
    Options: MSS, SACK_PERM, TS, NOP, WS
    TTL: 64

macOS (Monterey+):
    Window Size: 65535
    TTL: 64
```

Essas diferenças estão gravadas no kernel. Um proxy não pode alterá-las porque são definidas pelo seu sistema operacional, não pelo seu navegador. É assim que sistemas de detecção sofisticados podem identificá-lo mesmo através de proxies.

!!! warning "Limitação do Proxy"
    Proxies HTTP e SOCKS operam acima da camada TCP. Eles não podem modificar características do handshake TCP. O fingerprint TCP do seu SO está sempre exposto ao servidor proxy e a quaisquer observadores de rede entre você e o proxy. Apenas soluções em nível de VPN ou configuração da pilha TCP em nível de SO podem resolver isso.

!!! note "Além do Fingerprinting TCP"
    O handshake TCP é apenas a primeira oportunidade de fingerprinting. Imediatamente após, o handshake TLS revela outro fingerprint único conhecido como JA3/JA4. Veja [Network Fingerprinting](../fingerprinting/network-fingerprinting.md) para detalhes sobre fingerprinting de TLS e HTTP/2.

### UDP

Diferente da abordagem confiável e orientada à conexão do TCP, o UDP é um protocolo de "dispare-e-esqueça". Ele troca confiabilidade por latência e sobrecarga mínimas, tornando-o ideal para aplicações em tempo real onde a velocidade importa mais que a entrega perfeita.

Um datagrama UDP tem apenas um cabeçalho de 8 bytes (comparado com 20-60 bytes do TCP), contendo porta de origem, porta de destino, comprimento e um checksum. Não há estabelecimento de conexão, nenhuma garantia de confiabilidade, nenhum controle de fluxo e nenhum controle de congestionamento. Se um pacote for perdido, a aplicação deve decidir se e como tratar isso.

O UDP é a escolha certa para comunicação em tempo real (chamadas de voz/vídeo via WebRTC e VoIP), jogos (atualizações de estado de baixa latência), streaming (onde perda ocasional de frames é aceitável) e consultas DNS (pares pequenos de requisição/resposta onde a aplicação cuida das retentativas). É uma escolha ruim para transferências de arquivos, navegação web, email ou bancos de dados, todos os quais precisam de entrega confiável e ordenada.

O DNS é um exemplo particularmente importante no contexto de automação. O DNS usa UDP porque as consultas são tipicamente pequenas e se beneficiam da ausência de sobrecarga de handshake do UDP. Embora o EDNS0 (RFC 6891) tenha aumentado o payload máximo de DNS sobre UDP além do limite original de 512 bytes, a maioria das consultas permanece compacta. O cliente DNS cuida das retentativas em nível de aplicação se uma resposta não chegar dentro do timeout.

Para automação de navegador, a preocupação principal com o UDP é que o WebRTC o utiliza para áudio e vídeo em tempo real, consultas DNS o utilizam para resolução de domínio, e a maioria dos proxies (HTTP, HTTPS, SOCKS4) só lida com TCP. A menos que você configure explicitamente o proxy de UDP, esse tráfego contorna seu proxy e vaza seu IP real.

| Tipo de Proxy | Suporte UDP | Notas |
|------------|-------------|-------|
| Proxy HTTP | Não | Faz proxy apenas de HTTP/HTTPS baseado em TCP |
| Proxy HTTPS (CONNECT) | Não | O método CONNECT só estabelece túneis TCP |
| SOCKS4 | Não | Protocolo apenas TCP |
| SOCKS5 | Sim | Suporta relay UDP via comando `UDP ASSOCIATE` |
| VPN | Sim | Tunela todo o tráfego IP (TCP e UDP) |

Para anonimato verdadeiro em automação de navegador, você precisa de pelo menos uma das seguintes opções: um proxy SOCKS5 com suporte UDP e WebRTC configurado para usá-lo; WebRTC desabilitado inteiramente (o que quebra videoconferência); uma VPN que tunele todo o tráfego; ou a flag do navegador `--force-webrtc-ip-handling-policy=disable_non_proxied_udp`.

### QUIC e HTTP/3

Navegadores modernos utilizam cada vez mais o QUIC (RFC 9000), um protocolo de transporte baseado em UDP que alimenta o HTTP/3. Como o QUIC roda sobre UDP, ele compartilha os mesmos problemas de bypass de proxy que o WebRTC e o DNS: a maioria dos proxies HTTP não consegue lidar com tráfego QUIC, e ele pode vazar para fora da sua configuração de proxy.

Em cenários de automação, considere desabilitar o QUIC com a flag `--disable-quic` do Chrome para forçar HTTP/2 sobre TCP, garantindo que todo o tráfego web passe pelo seu proxy. O QUIC também tem suas próprias características de fingerprinting, similares ao JA3 para TLS, o que adiciona mais um vetor de detecção.

## WebRTC e Vazamento de IP

WebRTC (Web Real-Time Communication) é uma API de navegador padronizada pelo W3C que permite comunicação ponto-a-ponto de áudio, vídeo e dados diretamente entre navegadores, sem plugins ou servidores intermediários. Embora poderoso para aplicações em tempo real, o WebRTC é a maior fonte isolada de vazamento de IP em automação de navegador com proxy.

### Como o WebRTC Vaza Seu IP

O WebRTC foi projetado para conexões ponto-a-ponto diretas, otimizando para baixa latência em detrimento da privacidade. Para estabelecer conexões P2P, o WebRTC deve descobrir seu endereço IP público real e compartilhá-lo com o par remoto, mesmo se seu navegador estiver configurado para usar um proxy.

O problema se desenrola assim: seu navegador usa um proxy para tráfego HTTP/HTTPS (que é TCP), mas o WebRTC usa servidores STUN para descobrir seu IP público real sobre UDP. Consultas STUN contornam o proxy porque a maioria dos proxies só lida com TCP. Seu IP real é descoberto e compartilhado com pares remotos como parte da negociação de conexão. JavaScript na página pode ler esses "candidatos ICE" e enviar seu IP real para o servidor do site.

!!! danger "Gravidade dos Vazamentos WebRTC"
    Mesmo com um proxy HTTP configurado corretamente, proxy HTTPS funcionando, consultas DNS proxyadas, User-Agent falsificado e fingerprinting de canvas mitigado, o WebRTC ainda pode vazar seu IP real em milissegundos. Isso porque o WebRTC opera abaixo da camada de proxy do navegador, interagindo diretamente com a pilha de rede do SO.

### O Processo ICE

O WebRTC usa ICE (Interactive Connectivity Establishment, RFC 8445) para descobrir caminhos de conexão possíveis e selecionar o melhor. Este processo inerentemente revela sua topologia de rede ao coletar três tipos de candidatos.

```mermaid
sequenceDiagram
    participant Browser
    participant STUN as STUN Server
    participant TURN as TURN Relay
    participant Peer as Remote Peer

    Note over Browser: WebRTC connection initiated

    Browser->>Browser: Gather local IP addresses<br/>(LAN interfaces)
    Note over Browser: Local candidate:<br/>192.168.1.100:54321

    Browser->>STUN: STUN Binding Request (over UDP)
    Note over STUN: STUN server discovers public IP<br/>(bypasses proxy!)
    STUN->>Browser: STUN Response with real public IP
    Note over Browser: Server reflexive candidate:<br/>203.0.113.45:54321

    Browser->>TURN: Allocate relay (if needed)
    TURN->>Browser: Relay address assigned
    Note over Browser: Relay candidate:<br/>198.51.100.10:61234

    Browser->>Peer: Send all ICE candidates<br/>(local + public + relay)
    Note over Peer: Now knows your:<br/>- LAN IP<br/>- Real public IP<br/>- Relay address

    Peer->>Browser: Send ICE candidates

    Note over Browser,Peer: ICE negotiation: try direct P2P first

    alt Direct P2P succeeds
        Browser<<->>Peer: Direct connection (bypasses proxy entirely!)
    else Direct P2P fails (firewall/NAT)
        Browser->>TURN: Use TURN relay
        TURN<<->>Peer: Relayed connection
        Note over Browser,Peer: Higher latency, but works
    end
```

### Tipos de Candidatos ICE

O ICE descobre três tipos de candidatos (possíveis endpoints de conexão), cada um revelando diferentes informações sobre sua rede.

**Candidatos host** são seus endereços IP locais da LAN. O navegador enumera todas as interfaces de rede locais e cria candidatos para cada uma. Isso revela seus endereços IP locais em redes privadas, sua topologia de rede (presença de interfaces VPN, pontes de VM) e o número de interfaces de rede.

```javascript
// Example host candidates
candidate:1 1 UDP 2130706431 192.168.1.100 54321 typ host
candidate:2 1 UDP 2130706431 10.0.0.5 54322 typ host
```

Navegadores modernos (Chrome 75+, Firefox 78+, Safari) mitigam vazamentos de candidatos host substituindo endereços IP locais por nomes mDNS efêmeros (ex: `a1b2c3d4.local`) quando permissões de mídia (câmera/microfone) não foram concedidas. No entanto, candidatos reflexivos de servidor (seu IP público) permanecem expostos independentemente do mDNS.

**Candidatos reflexivos de servidor** são seu IP público como visto por um servidor STUN. O navegador envia uma requisição STUN para um servidor público, que responde com seu endereço IP público. Este é o vazamento do qual todos falam: seu proxy mostra um IP, mas o WebRTC revela o seu real, junto com seu tipo de NAT, mapeamento de porta externa e informações do ISP.

```javascript
// Server reflexive candidate (your real public IP)
candidate:4 1 UDP 1694498815 203.0.113.45 54321 typ srflx raddr 192.168.1.100 rport 54321
```

**Candidatos de retransmissão** são endereços de servidores TURN usados como fallback quando o P2P direto falha. O candidato de retransmissão ainda pode conter seu IP real no campo `raddr` (endereço relacionado, *related address*), dependendo da implementação do servidor TURN.

```javascript
// Relay candidate (TURN server address)
candidate:5 1 UDP 16777215 198.51.100.10 61234 typ relay raddr 203.0.113.45 rport 54321
```

### O Protocolo STUN

STUN (Session Traversal Utilities for NAT, RFC 8489) é um protocolo simples de requisição-resposta sobre UDP. Sua função é direta: o cliente pergunta "qual IP você vê de mim?" e o servidor responde com o IP público e a porta do cliente.

O cliente envia uma Binding Request contendo um magic cookie (`0x2112A442`, um valor fixo definido pela RFC) e um transaction ID aleatório de 12 bytes. O servidor responde com uma Binding Success Response que inclui um atributo `XOR-MAPPED-ADDRESS` contendo o IP público e a porta do cliente como vistos da perspectiva do servidor.

O endereço IP na resposta é XOR'ado com o magic cookie (e, no caso de endereços IPv6, também com o transaction ID). Isso não é por segurança, mas por compatibilidade com NAT: alguns dispositivos NAT modificam incorretamente endereços IP em payloads de pacotes, e o XOR ofusca o endereço para prevenir essa interferência.

Servidores STUN públicos comumente usados por navegadores incluem `stun.l.google.com:19302` (Google), `stun1.l.google.com:19302` (Google), `stun.services.mozilla.com` (Mozilla) e `stun.stunprotocol.org:3478`.

### Por que Proxies Não Conseguem Parar Vazamentos WebRTC

Vazamentos WebRTC acontecem por vários motivos que se reforçam. Primeiro, o WebRTC usa UDP, e a maioria dos proxies (HTTP, HTTPS CONNECT, SOCKS4) só lida com TCP. Apenas o SOCKS5 suporta UDP, e mesmo assim o navegador precisa ser explicitamente configurado para rotear o WebRTC através dele.

Segundo, o WebRTC é uma API de navegador que opera abaixo da camada HTTP. Ele acessa diretamente a pilha de rede do SO, contornando configurações de proxy definidas para HTTP/HTTPS. Consultas STUN vão diretamente para a interface de rede, e a tabela de roteamento do SO determina seu caminho, não a configuração de proxy do navegador. Apenas roteamento em nível de VPN pode interceptá-las.

Terceiro, o WebRTC enumera todas as interfaces de rede (ethernet física, Wi-Fi, adaptadores VPN, pontes de VM), incluindo interfaces não usadas para navegação regular. Isso vaza sua topologia de rede interna.

Finalmente, páginas web podem ler candidatos ICE via JavaScript usando o evento `RTCPeerConnection.onicecandidate`, extrair endereços IP das strings de candidatos com um regex simples e enviar seu IP real para o servidor de rastreamento deles.

### Prevenindo Vazamentos WebRTC no Pydoll

O Pydoll fornece múltiplas estratégias para prevenir vazamentos de IP via WebRTC.

**Método 1: Forçar o WebRTC a usar apenas rotas proxyadas (recomendado)**

```python
from pydoll.browser import Chrome
from pydoll.browser.options import ChromiumOptions

options = ChromiumOptions()
options.webrtc_leak_protection = True  # Adds --force-webrtc-ip-handling-policy=disable_non_proxied_udp
```

O Pydoll fornece uma propriedade conveniente `webrtc_leak_protection` que gerencia a flag do Chrome subjacente para você. Isso desabilita UDP se nenhum proxy o suportar, força o WebRTC a usar apenas retransmissores TURN (sem P2P direto) e previne consultas STUN para servidores públicos. A contrapartida é maior latência para chamadas de vídeo, já que conexões P2P diretas são desabilitadas.

**Método 2: Desabilitar o WebRTC inteiramente**

```python
options.add_argument('--disable-features=WebRTC')
```

Isso desabilita completamente a API WebRTC, eliminando qualquer possibilidade de vazamento de IP por este vetor. A contrapartida é que todos os sites dependentes de WebRTC (videoconferência, chamadas de voz) deixarão de funcionar. Note que esta flag deve ser testada com sua versão específica do Chrome, pois nomes de feature flags podem variar entre versões.

**Método 3: Restringir o WebRTC via preferências do navegador**

```python
options.browser_preferences = {
    'webrtc': {
        'ip_handling_policy': 'disable_non_proxied_udp',
        'multiple_routes_enabled': False,
        'nonproxied_udp_enabled': False,
        'allow_legacy_tls_protocols': False
    }
}
```

Isso alcança o mesmo efeito do Método 1, mas através de preferências em vez de flags de linha de comando. `multiple_routes_enabled` previne o uso de múltiplos caminhos de rede, e `nonproxied_udp_enabled` bloqueia UDP que não passa pelo proxy.

**Método 4: Usar um proxy SOCKS5 com suporte UDP**

```python
options.add_argument('--proxy-server=socks5://proxy.example.com:1080')
options.add_argument('--force-webrtc-ip-handling-policy=default_public_interface_only')
```

O SOCKS5 pode proxyar UDP via seu comando `UDP ASSOCIATE`, permitindo que as consultas STUN do WebRTC passem pelo proxy. Isso requer um proxy SOCKS5 que realmente suporte relay UDP, o que nem todos suportam.

!!! warning "Autenticação SOCKS5"
    O Chrome não suporta autenticação SOCKS5 inline (ex: `socks5://user:pass@host:port`) via a flag `--proxy-server`. O Pydoll fornece um `SOCKS5Forwarder` integrado que contorna essa limitação executando um proxy SOCKS5 local sem autenticação que encaminha o tráfego para o proxy remoto autenticado, cuidando do handshake de usuário/senha em nome do Chrome. Veja [Configuração de Proxy](../../features/configuration/proxy.md) para detalhes de uso.

### Testando Vazamentos WebRTC

Você pode testar manualmente visitando [browserleaks.com/webrtc](https://browserleaks.com/webrtc) e verificando se seu IP real aparece na seção "Public IP Address". Se você vir seu IP real em vez do IP do proxy, está havendo vazamento.

Para testes automatizados com o Pydoll:

```python
import asyncio
from pydoll.browser import Chrome
from pydoll.browser.options import ChromiumOptions

async def test_webrtc_leak():
    options = ChromiumOptions()
    options.add_argument('--proxy-server=http://proxy.example.com:8080')
    options.add_argument('--force-webrtc-ip-handling-policy=disable_non_proxied_udp')

    async with Chrome(options=options) as browser:
        tab = await browser.start()
        await tab.go_to('https://browserleaks.com/webrtc')

        await asyncio.sleep(3)

        ips = await tab.execute_script('''
            return Array.from(document.querySelectorAll('.ip-address'))
                .map(el => el.textContent.trim());
        ''')

        print("Detected IPs:", ips)
        # Should only show proxy IP, not your real IP

asyncio.run(test_webrtc_leak())
```

!!! danger "Sempre Teste Vazamentos WebRTC"
    Nunca assuma que sua configuração de proxy previne vazamentos WebRTC. Sempre verifique com [browserleaks.com/webrtc](https://browserleaks.com/webrtc) ou [ipleak.net](https://ipleak.net). Mesmo um único vazamento WebRTC compromete instantaneamente toda a sua configuração de proxy, já que o site agora conhece sua localização real, ISP e topologia de rede.

### Como Sites Exploram Vazamentos WebRTC

Sites podem intencionalmente acionar o WebRTC para extrair seu IP real usando poucas linhas de JavaScript:

```javascript
const pc = new RTCPeerConnection({
    iceServers: [{urls: 'stun:stun.l.google.com:19302'}]
});

pc.createDataChannel('');
pc.createOffer().then(offer => pc.setLocalDescription(offer));

pc.onicecandidate = (event) => {
    if (event.candidate) {
        const ipRegex = /([0-9]{1,3}(\.[0-9]{1,3}){3})/;
        const ipMatch = event.candidate.candidate.match(ipRegex);

        if (ipMatch) {
            const realIP = ipMatch[1];
            fetch(`/track?real_ip=${realIP}&proxy_ip=${window.clientIP}`);
        }
    }
};
```

Este código cria um RTCPeerConnection, aciona a coleta de candidatos ICE (que contata servidores STUN), extrai endereços IP dos candidatos com um regex e envia seu IP real para um servidor de rastreamento. Desabilitar o WebRTC ou forçar rotas apenas proxyadas como descrito acima previne isso.

## Resumo

Proxies operam em camadas específicas da pilha de rede: HTTP na Camada 7, SOCKS na Camada 5. A camada determina o que o proxy pode ver, modificar e ocultar. Fingerprints TCP (tamanho da janela, opções, TTL) vazam de camadas inferiores e revelam seu SO real mesmo através de um proxy. Tráfego UDP, incluindo WebRTC e DNS, frequentemente contorna proxies a menos que explicitamente configurado. O WebRTC é a fonte mais comum de vazamento de IP, e apenas SOCKS5 ou VPN podem proxyar tráfego UDP de forma eficaz. Navegadores modernos também usam QUIC (HTTP/3 sobre UDP), o que adiciona mais um vetor potencial de bypass.

**Próximos passos:**

- [Proxies HTTP/HTTPS](./http-proxies.md): Proxy de camada de aplicação
- [Proxies SOCKS](./socks-proxies.md): Proxy de camada de sessão, agnóstico a protocolo
- [Network Fingerprinting](../fingerprinting/network-fingerprinting.md): Técnicas de fingerprinting TCP/IP e TLS
- [Configuração de Proxy](../../features/configuration/proxy.md): Configuração prática de proxy no Pydoll

## Referências

- RFC 793: Transmission Control Protocol (TCP) - https://tools.ietf.org/html/rfc793
- RFC 768: User Datagram Protocol (UDP) - https://tools.ietf.org/html/rfc768
- RFC 8489: Session Traversal Utilities for NAT (STUN) - https://tools.ietf.org/html/rfc8489
- RFC 8445: Interactive Connectivity Establishment (ICE) - https://tools.ietf.org/html/rfc8445
- RFC 8656: Traversal Using Relays around NAT (TURN) - https://tools.ietf.org/html/rfc8656
- RFC 6528: Defending Against Sequence Number Attacks - https://tools.ietf.org/html/rfc6528
- RFC 9000: QUIC: A UDP-Based Multiplexed and Secure Transport - https://tools.ietf.org/html/rfc9000
- W3C WebRTC 1.0: Real-Time Communication Between Browsers - https://www.w3.org/TR/webrtc/
- BrowserLeaks: WebRTC Leak Test - https://browserleaks.com/webrtc
- IPLeak: Comprehensive Leak Testing - https://ipleak.net


================================================
FILE: docs/pt/deep-dive/network/proxy-detection.md
================================================
# Detecção de Proxy

A detecção de proxy é um processo probabilístico. Sites combinam dezenas de sinais para avaliar se uma conexão está sendo proxyada, desde simples consultas de reputação de IP até análise da pilha TCP/IP e perfil comportamental. Nenhum sinal isolado fornece prova definitiva, mas combinar sinais fracos suficientes produz decisões de alta confiança.

Este documento cobre as principais técnicas de detecção, como elas funcionam em nível técnico e o que significam para automação de navegador com o Pydoll.

!!! info "Navegação do Módulo"
    - [Proxies SOCKS](./socks-proxies.md): Proxying na camada de sessão
    - [Proxies HTTP/HTTPS](./http-proxies.md): Proxying na camada de aplicação
    - [Fundamentos de Rede](./network-fundamentals.md): TCP/IP, UDP, WebRTC

    Para detalhes sobre fingerprinting, veja [Network Fingerprinting](../fingerprinting/network-fingerprinting.md) e [Browser Fingerprinting](../fingerprinting/browser-fingerprinting.md).

## Reputação de IP

A análise de reputação de IP é a técnica de detecção de proxy mais amplamente implantada. Ela combina dados publicamente disponíveis (registros ASN, WHOIS, bancos de dados de geolocalização) com inteligência proprietária para classificar endereços IP em categorias de risco.

### Classificação por ASN

Todo endereço IP pertence a um Sistema Autônomo (AS), identificado por um ASN. O tipo de AS que possui um IP é o indicador individual mais forte para determinar se ele é um proxy.

IPs pertencentes a provedores de nuvem e hospedagem (AWS, DigitalOcean, OVH, Hetzner) são sinalizados como alto risco porque usuários reais não navegam na web a partir de servidores de datacenter. IPs de ISPs residenciais (Comcast, Deutsche Telekom, BT) são baixo risco porque parecem conexões domésticas normais. IPs de operadoras móveis (Verizon Wireless, AT&T Mobility) são o risco mais baixo porque são os mais difíceis de distinguir de usuários móveis reais.

Alguns ASNs estão associados a infraestrutura conhecida de proxy, embora isso seja mais nuançado do que possa parecer. Grandes provedores de proxy residencial como BrightData ou Smartproxy não operam seus próprios ASNs; eles roteiam tráfego através de IPs residenciais reais pertencentes a ASNs de ISPs. Isso é precisamente o que torna proxies residenciais mais difíceis de detectar do que proxies de datacenter.

Sistemas de detecção consultam bancos de dados de ASN (Team Cymru, RIPE NCC, ARIN) e APIs comerciais de inteligência de IP para classificar cada IP conectando. IPs de datacenter são detectados com aproximadamente 95%+ de precisão porque a classificação por ASN é inequívoca. A detecção de proxy residencial é muito mais difícil (aproximadamente 40-70% de precisão) porque os IPs genuinamente pertencem a ISPs. A detecção de proxy móvel é a mais difícil (aproximadamente 20-40%) porque o NAT de operadoras móveis faz muitos usuários reais compartilharem IPs.

Esse gradiente de precisão é o motivo pelo qual proxies residenciais e móveis custam de 10 a 100 vezes o preço dos proxies de datacenter.

### Bancos de Dados de Proxies Conhecidos

Além da classificação por ASN, bancos de dados especializados rastreiam IPs que foram observados participando de redes de proxy. Serviços como IPQualityScore, proxycheck.io e Spur.us mantêm bancos de dados em tempo real de IPs conhecidos de proxy, VPN e nós de saída Tor. A lista de nós de saída Tor está disponível publicamente em [check.torproject.org](https://check.torproject.org/torbulkexitlist).

Esses bancos de dados também rastreiam sinais comportamentais: IPs que rotacionam frequentemente (típico de pools de proxy), IPs com contagens anormalmente altas de sessões concorrentes (um IP residencial normalmente tem 1-5 conexões concorrentes, não 100+) e IPs previamente associados a atividade semelhante a bot.

### Consistência de Geolocalização

Proxies frequentemente se revelam através de inconsistências geográficas. O endereço IP aponta para uma localização, mas os sinais reportados pelo navegador apontam para outra.

Os desencontros mais comuns são entre a geolocalização do IP e o fuso horário do navegador (coletado via `Intl.DateTimeFormat().resolvedOptions().timeZone` do JavaScript), entre o país do IP e o cabeçalho `Accept-Language`, e entre a localização da sessão atual e a localização de uma sessão anterior. Um usuário aparecendo em Los Angeles com fuso horário do navegador `Europe/Berlin` é suspeito. Um usuário aparecer em Tóquio 10 minutos após sua última sessão ter sido em Nova York é fisicamente impossível.

Sistemas de detecção também verificam se a geolocalização do IP corresponde à configuração de localidade do navegador. Um IP de datacenter dos EUA com `Accept-Language: zh-CN` e fuso horário `Asia/Shanghai` sugere fortemente um usuário chinês roteando através de um proxy nos EUA.

!!! note "Falsos Positivos"
    Cenários legítimos disparam alarmes de geolocalização: viajantes usando VPNs, expatriados com configurações de navegador do país de origem, usuários corporativos conectando através de VPNs da empresa e usuários multilíngues com preferências de idioma não padrão. Sistemas sofisticados usam pontuação de risco em vez de bloqueio binário para lidar com esses casos.

## Análise de Cabeçalho HTTP

Cabeçalhos HTTP são o vetor de detecção mais simples. Proxies transparentes e anônimos adicionam cabeçalhos como `Via`, `X-Forwarded-For`, `X-Real-IP` e `Forwarded` (RFC 7239) que revelam diretamente o uso de proxy. Proxies elite removem esses cabeçalhos, mas sua ausência por si só não é prova de uma conexão direta.

A detecção vai além de procurar cabeçalhos específicos de proxy. Cabeçalhos ausentes que navegadores reais sempre enviam (como `Accept-Language`, `Accept-Encoding` ou um `User-Agent` realista) são suspeitos. A ordem dos cabeçalhos também importa: navegadores enviam cabeçalhos em uma ordem consistente e específica da versão, e proxies ou ferramentas de automação que constroem cabeçalhos manualmente frequentemente erram a ordem.

O cabeçalho legado `Proxy-Connection: keep-alive`, enviado por alguns clientes mais antigos ao rotear através de um proxy, é outro sinal clássico de detecção.

### Níveis de Anonimato de Proxy

Proxies são tradicionalmente classificados em três níveis de anonimato com base em seu comportamento de cabeçalhos:

| Nível | Comportamento | Detecção |
|-------|---------------|----------|
| Transparente | Encaminha seu IP real em `X-Forwarded-For`, adiciona cabeçalho `Via` | Trivial |
| Anônimo | Esconde seu IP mas adiciona `Via` ou outros cabeçalhos de proxy | Fácil |
| Elite | Remove todos os cabeçalhos identificadores de proxy | Requer análise mais profunda |

Essa classificação data de uma era em que a análise de cabeçalhos era o método primário de detecção. Sistemas modernos de detecção usam reputação de IP, fingerprinting e análise comportamental, tornando a distinção transparente/anônimo/elite menos significativa. Um proxy elite com IP de datacenter é detectado instantaneamente através de consulta ASN. Um proxy transparente em um IP residencial ainda pode passar despercebido em sites menos sofisticados.

## Network Fingerprinting

O fingerprinting na camada de rede opera abaixo da camada de proxy, o que significa que pode detectar proxies mesmo quando o proxy em si está configurado perfeitamente.

### Fingerprinting de TCP/IP

Cada sistema operacional tem uma implementação única da pilha TCP que se revela durante o handshake TCP. O tamanho inicial da janela, a ordem das opções TCP, o TTL (Time To Live) e o fator de escala de janela são todos definidos pelo kernel, não pelo navegador, e não podem ser alterados por um proxy.

Sistemas de detecção comparam essas características TCP com o cabeçalho `User-Agent`. Se o User-Agent alega Windows 10 mas o fingerprint TCP mostra características de Linux (TTL de 64, tamanho de janela de 29200), o desencontro é um forte indicador de proxy. O Windows usa um TTL padrão de 128 e versões modernas tipicamente mostram um tamanho de janela de 65535, enquanto o Linux usa TTL 64 e tamanhos de janela em torno de 29200.

A análise de TTL adiciona outra camada. O TTL diminui em 1 a cada salto de rede. Se uma conexão Windows chega com TTL de 128, o cliente provavelmente está na mesma rede. Se chega com TTL de 115, cruzou aproximadamente 13 saltos. Se o valor do TTL não se alinha com a contagem esperada de saltos para a localização geográfica do IP, roteamento por proxy é provável.

Para valores detalhados de fingerprint TCP e suas implicações, veja [Network Fingerprinting](../fingerprinting/network-fingerprinting.md).

### Fingerprinting de TLS (JA3/JA4)

A mensagem TLS ClientHello é transmitida em texto plano e contém parâmetros suficientes para identificar unicamente a aplicação cliente: versão TLS, conjuntos de cifras suportados, extensões, curvas elípticas e algoritmos de assinatura. O fingerprint JA3 é um hash MD5 desses parâmetros concatenados em uma ordem específica. JA4 é uma alternativa mais recente e mais granular.

Cada versão de navegador produz um fingerprint JA3/JA4 distinto. Sistemas de detecção mantêm bancos de dados de fingerprints conhecidos para Chrome, Firefox, Safari e outros navegadores. Se o fingerprint JA3 não corresponde a nenhum navegador conhecido, ou não corresponde ao navegador alegado no User-Agent, a conexão é sinalizada.

Uma nuance importante: proxies SOCKS5 e túneis HTTP CONNECT passam o TLS ClientHello sem modificação, então o servidor destino vê o fingerprint real do navegador. O proxy não altera os parâmetros TLS nessas configurações. Apenas proxies MITM (que terminam e reestabelecem TLS) mudam o fingerprint, e nesse caso o fingerprint pertence ao software do proxy, não a um navegador real, o que por si só é um sinal de detecção.

### Fingerprinting de HTTP/2

Conexões HTTP/2 expõem sinais de fingerprinting que são distintos do TLS. O frame SETTINGS enviado no início de uma conexão HTTP/2 contém parâmetros como `HEADER_TABLE_SIZE`, `MAX_CONCURRENT_STREAMS`, `INITIAL_WINDOW_SIZE` e `MAX_HEADER_LIST_SIZE`. Cada navegador usa valores padrão diferentes para essas configurações.

A ordem e prioridade dos pseudo-cabeçalhos (`:method`, `:authority`, `:scheme`, `:path`), o comportamento de compressão HPACK e os pesos de prioridade de stream também variam entre navegadores. Ferramentas como [browserleaks.com/http2](https://browserleaks.com/http2) mostram como é o seu fingerprint HTTP/2.

Frameworks de automação e software de proxy que implementam suas próprias pilhas HTTP/2 frequentemente produzem fingerprints que não correspondem a nenhum navegador real, tornando isso um vetor eficaz de detecção.

### Detecção Baseada em Latência

A latência de rede entre um cliente e um servidor revela informações sobre o caminho físico da rede. Se o IP geolocaliza em Nova York mas o tempo de ida e volta sugere um caminho pela Ásia, a conexão provavelmente está sendo proxyada.

Sistemas de detecção medem o RTT (round-trip time) durante o handshake TCP e comparam com latências esperadas para a localização geográfica do IP. Eles também podem emitir desafios de temporização baseados em JavaScript que medem a latência da perspectiva do navegador, e então comparar com a latência observada pelo servidor. Uma discrepância significativa entre as duas sugere um intermediário (proxy) no caminho.

A análise de desvio de relógio adiciona outra dimensão: ao medir o deslocamento do relógio do cliente via JavaScript (`Date.now()`) ou cabeçalhos HTTP `Date`, sistemas de detecção podem inferir o fuso horário real do cliente e compará-lo com o fuso horário esperado do IP.

## Detecção Comportamental

Os sistemas de detecção mais avançados vão além da análise de rede e protocolo para examinar o comportamento do usuário. Isso inclui temporização de requisições (as requisições estão espaçadas uniformemente, sugerindo automação?), padrões de movimento do mouse (analisados via listeners de eventos JavaScript), comportamento de rolagem, cadência de entrada do teclado e padrões gerais de navegação.

Modelos de machine learning treinados em milhões de sessões de usuários reais podem distinguir comportamento humano de automação com alta precisão. Esses modelos tipicamente combinam 50+ características incluindo padrões de navegação, distribuição de duração de sessão, posições de clique, temporização de interação com formulários e características de execução de JavaScript.

As interações humanizadas do Pydoll (movimento do mouse com curva de Bézier, temporização pela Lei de Fitts, digitação realista) são projetadas especificamente para passar na análise comportamental. Veja [Técnicas de Evasão](../fingerprinting/evasion-techniques.md) para a estratégia completa de evasão multicamada.

## Pontuação de Risco Multi-Sinal

Sistemas modernos de detecção não dependem de nenhuma técnica isolada. Eles combinam todos os sinais disponíveis em uma pontuação de risco, tipicamente de 0 a 100, e aplicam limiares que variam por indústria e contexto.

O peso de cada categoria de sinal varia, mas uma aproximação grosseira é que a reputação de IP representa a maior parcela (é o sinal mais barato e confiável), seguida por network fingerprinting (TCP/IP, TLS, HTTP/2), análise de cabeçalhos e protocolo, pontuação comportamental e verificações de consistência (geolocalização, fuso horário, idioma).

Os limiares dependem do contexto de negócio. Sites bancários bloqueiam agressivamente (pontuação de risco acima de 50), sites de e-commerce apresentam CAPTCHAs em pontuações moderadas (acima de 70), e sites de conteúdo tendem a ser mais permissivos (bloqueando apenas acima de 80) pois dependem de impressões de anúncios.

A implicação para automação é que passar em uma camada de detecção não é suficiente. Um IP residencial (boa reputação de IP) com um fingerprint TCP incompatível e comportamento robótico ainda será sinalizado. Evasão eficaz requer consistência em todas as camadas.

## Detecção por Tipo de Proxy

| Tipo de Proxy | Dificuldade de Detecção | Métodos Primários de Detecção |
|---------------|-------------------------|-------------------------------|
| HTTP Transparente | Trivial | Cabeçalhos HTTP (`Via`, `X-Forwarded-For`) |
| HTTP Anônimo | Fácil | Cabeçalhos HTTP + Reputação de IP |
| HTTP Elite (datacenter) | Médio | Reputação de IP (análise de ASN) |
| SOCKS5 Datacenter | Médio | Reputação de IP (análise de ASN) |
| Proxies residenciais | Difícil | Análise comportamental, padrões de conexão, latência |
| Proxies móveis | Muito difícil | Principalmente comportamental, sinais de rede limitados |
| Proxies rotativos | Difícil | Inconsistências de sessão, padrões de rotação de IP |

## Princípios de Evasão

Evasão eficaz é sobre consistência em todas as camadas de detecção, não sobre aperfeiçoar nenhuma camada individualmente.

Use IPs residenciais ou móveis quando a furtividade importar. Eles são mais difíceis de detectar porque os IPs genuinamente pertencem a ISPs, e o custo premium reflete essa vantagem. Alinhe os sinais de geolocalização do navegador (fuso horário, idioma, localidade) com a localização do IP do proxy. Mantenha persistência de sessão não rotacionando IPs no meio da sessão, o que cria descontinuidades detectáveis. Garanta que seu fingerprint TCP/IP corresponda à alegação do seu User-Agent executando automação no mesmo SO que você está imitando. Use as interações humanizadas do Pydoll para passar na análise comportamental. E sempre teste por vazamentos (WebRTC, DNS, fuso horário) antes de executar automação em escala.

O objetivo não é tornar a detecção impossível, mas sim torná-la cara e incerta. Force o sistema de detecção a usar múltiplos sinais correlacionados, misture-se com padrões de tráfego legítimo e crie negação plausível.

!!! warning "Nenhum Proxy é Indetectável"
    Com recursos suficientes, qualquer proxy pode ser detectado. Mesmo proxies residenciais de primeira linha alcançam aproximadamente 70-90% de taxa de sucesso contra sistemas anti-bot sofisticados como Akamai, Cloudflare Enterprise e DataDome. A questão prática é se a detecção é economicamente viável para o site alvo.

**Próximos passos:**

- [Network Fingerprinting](../fingerprinting/network-fingerprinting.md): Fingerprinting de TCP/IP e TLS em detalhes
- [Browser Fingerprinting](../fingerprinting/browser-fingerprinting.md): Fingerprinting de Canvas, WebGL, HTTP/2
- [Técnicas de Evasão](../fingerprinting/evasion-techniques.md): Estratégia de evasão multicamada
- [Configuração de Proxy](../../features/configuration/proxy.md): Configuração prática de proxy no Pydoll

## Referências

- MaxMind GeoIP2: https://www.maxmind.com/en/geoip2-services-and-databases
- IPQualityScore Proxy Detection: https://www.ipqualityscore.com/proxy-vpn-tor-detection-service
- Spur.us (Anonymous IP Detection): https://spur.us/
- Team Cymru IP to ASN Mapping: https://www.team-cymru.com/ip-asn-mapping
- Salesforce Engineering: TLS Fingerprinting with JA3 and JA3S - https://engineering.salesforce.com/tls-fingerprinting-with-ja3-and-ja3s-247362855967/
- Akamai: Passive Fingerprinting of HTTP/2 Clients (Black Hat EU 2017) - https://blackhat.com/docs/eu-17/materials/eu-17-Shuster-Passive-Fingerprinting-Of-HTTP2-Clients-wp.pdf
- Incolumitas: TCP/IP Fingerprinting for VPN and Proxy Detection - https://incolumitas.com/2021/03/13/tcp-ip-fingerprinting-for-vpn-and-proxy-detection/
- Incolumitas: Detecting Proxies and VPNs with Latencies - https://incolumitas.com/2021/06/07/detecting-proxies-and-vpn-with-latencies/
- BrowserLeaks HTTP/2 Fingerprint: https://browserleaks.com/http2
- BrowserLeaks IP: https://browserleaks.com/ip
- RFC 7239: Forwarded HTTP Extension - https://www.rfc-editor.org/rfc/rfc7239.html
- RFC 9110: HTTP Semantics - https://www.rfc-editor.org/rfc/rfc9110.html


================================================
FILE: docs/pt/deep-dive/network/proxy-legal.md
================================================
# Considerações Legais e Éticas

Este documento fornece **informações gerais** sobre o cenário legal e ético do uso de proxies e automação web. As leis variam enormemente por jurisdição e caso de uso. Isto **não é aconselhamento jurídico**. Sempre consulte um advogado qualificado para sua situação específica.

!!! info "Navegação do Módulo"
    - **[← Construindo Proxies](./build-proxy.md)** - Implementação e tópicos avançados
    - **[← Detecção de Proxy](./proxy-detection.md)** - Anonimato e evasão
    - **[← Visão Geral de Rede e Segurança](./index.md)** - Introdução do módulo
    
    Para automação responsável, veja **[Contorno de Captcha Comportamental](../../features/advanced/behavioral-captcha-bypass.md)** e **[Interações Semelhantes a Humanas](../../features/automation/human-interactions.md)**.

!!! danger "Aviso Legal"
    Este documento fornece **apenas informações educacionais**. **Não é aconselhamento jurídico**. As leis relativas a web scraping, automação e uso de proxy variam por jurisdição e estão sujeitas a interpretação. Consulte um advogado qualificado antes de se engajar em atividades que possam ter implicações legais.

## Considerações Legais e Éticas

O uso de proxy situa-se na interseção da privacidade, segurança e conformidade. Entender o cenário legal é essencial para uma automação responsável.

### Conformidade Regulatória

Diferentes jurisdições têm regras variadas sobre o uso de proxy e coleta de dados:

| Região | Regulação Chave | Implicações para Proxy |
|---|---|---|
| **União Europeia** | GDPR | Endereços IP são dados pessoais; nós de saída de proxy na UE devem cumprir |
| **Estados Unidos** | CFAA, Leis Estaduais | Contornar controles de acesso pode violar leis de fraude computacional |
| **China** | Lei de Cibersegurança | Uso de VPN/proxy fortemente regulamentado; apenas serviços aprovados permitidos |
| **Rússia** | Lei de VPN | Provedores de VPN devem se cadastrar e manter registros (logs) da atividade do usuário |
| **Austrália** | Lei de Privacidade | Coleta de dados através de proxies sujeita a princípios de privacidade |

**Considerações específicas do GDPR:**

**Endereços IP como dados pessoais (Artigo 4):**

Ao raspar sites baseados na UE através de proxies:

- O IP da UE do seu proxy é considerado dado pessoal
- Sites devem manuseá-lo de acordo com os requisitos do GDPR
- Você deve ter base legal para a coleta de dados
- Princípio da minimização de dados se aplica

**Bases legais para processamento (Artigo 6):**

1.  **Consentimento** - Difícil de obter para scraping
2.  **Contrato** - Legítimo se você for um cliente
3.  **Obrigação legal** - Raro para casos de uso de scraping
4.  **Interesses vitais** - Não aplicável a scraping
5.  **Tarefa pública** - Não aplicável a scraping
6.  **Interesses legítimos** - Mais aplicável para scraping (requer teste de balanceamento)

### Termos de Serviço e Restrições de Acesso

Proxies não isentam você dos Termos de Serviço (ToS) do site:

**Violações comuns de ToS:**

1.  **Acesso Automatizado**: Muitos sites proíbem bots/scrapers independentemente do IP
2.  **Contorno de Limitação de Taxa (Rate Limiting)**: Usar proxies rotativos para contornar limites de taxa
3.  **Restrições Geográficas**: Contornar geo-bloqueios pode violar acordos de licenciamento de conteúdo
4.  **Compartilhamento de Conta**: Usar proxies para mascarar múltiplos usuários como um só

**Exemplos de precedentes legais:**

```python
# Casos notáveis (simplificado, não é aconselhamento jurídico)
cases = {
    'hiQ Labs v. LinkedIn (2022)': {
        'issue': 'Raspar dados públicos após acesso revogado',
        'outcome': 'Raspar dados publicamente disponíveis geralmente é permitido',
        'caveat': 'Mas contornar barreiras tecnológicas pode violar o CFAA'
    },
    
    'QVC v. Resultly (2020)': {
        'issue': 'Scraping agressivo causando carga no servidor',
        'outcome': 'Requisições excessivas constituem invasão de propriedade (trespass to chattels)',
        'implication': 'Volume e impacto importam, não apenas o acesso técnico'
    }
}
```

### Diretrizes Éticas para Uso de Proxy

Além da conformidade legal, considere estes princípios éticos:

**1. Respeite o robots.txt**
```python
# Mesmo com proxies, honre as diretrizes do site
async def ethical_scraping(url):
    # Checar robots.txt independentemente do anonimato do proxy
    if not is_allowed_by_robots(url):
        return None  # Respeite os desejos do site
```

**2. Limitação de Taxa (Rate Limiting)**
```python
# Não abuse da rotação de proxy para sobrecarregar servidores
MINIMUM_DELAY = 1.0  # segundos entre requisições
MAX_CONCURRENT = 5   # conexões concorrentes por site

# Ruim: Rotacionar proxies para raspar a 1000 req/s
# Bom: Raspagem respeitosa mesmo com rotação de proxy
```

**3. Transparência**
```python
# Identifique-se no User-Agent quando apropriado
headers = {
    'User-Agent': 'MyBot/1.0 (contact@example.com)',  # Identificação honesta
    # Não: 'Mozilla/5.0...'  # Enganoso quando não é um navegador
}
```

**4. Minimização de Dados**
```python
# Colete apenas o que você precisa
# Só porque você pode raspar tudo, não significa que deva
data_to_collect = {
    'product_name': True,
    'price': True,
    'user_emails': False,      # PII - não colete a menos que necessário
    'user_addresses': False,   # PII - preocupações com privacidade
}
```

### Checklist de Conformidade

Antes de implantar automação baseada em proxy:

- [ ] **Revisão Legal**: Consulte aconselhamento jurídico para sua jurisdição
- [ ] **Conformidade com ToS**: Revise os termos de serviço do site alvo
- [ ] **Proteção de Dados**: Garanta conformidade com GDPR/CCPA se manusear dados pessoais
- [ ] **Direitos de Acesso**: Verifique se você tem permissão para acessar os dados
- [ ] **Limitação de Taxa**: Implemente taxas de requisição respeitosas
- [ ] **Tratamento de Erros**: Lide apropriadamente com 429 (Too Many Requests)
- [ ] **Logging**: Mantenha trilhas de auditoria para fins de conformidade
- [ ] **Retenção de Dados**: Implemente políticas apropriadas de retenção/exclusão de dados
- [ ] **Segurança**: Proteja os dados coletados com medidas apropriadas
- [ ] **Transparência**: Seja honesto sobre suas atividades de scraping quando questionado

!!! warning "Isto Não é Aconselhamento Jurídico"
    Esta seção fornece apenas informações gerais. A legalidade do uso de proxy varia por jurisdição, contexto e circunstâncias específicas. Sempre consulte um advogado qualificado para sua situação específica.

!!! tip "Uso Responsável de Proxy"
    O uso de proxy mais defensável é:
    
    - **Transparente**: Você pode explicar por que está fazendo isso
    - **Necessário**: Você tem uma razão legítima (pesquisa, monitoramento, etc.)
    - **Proporcional**: Seus métodos correspondem às suas necessidades (não excessivos)
    - **Documentado**: Você mantém registros de suas atividades
    - **Conforme (Compliant)**: Você segue todas as leis e ToS aplicáveis

### Quando Evitar Proxies

Alguns cenários onde o uso de proxy é problemático:

| Cenário | Risco | Alternativa |
|---|---|---|
| **Sites Bancários/Financeiros** | Detecção de fraude, suspensão de conta | Use apenas acesso legítimo |
| **Portais Governamentais** | Penalidades legais, investigações de segurança | Acesso direto de locais autorizados |
| **Dados de Saúde** | Violações da HIPAA, penalidades severas | Use acesso autorizado via API |
| **Sistemas Corporativos Internos** | Violações de política, demissão | Siga as políticas de TI da empresa |
| **Criação de Contas E-commerce** | Sinalizadores de fraude, banimentos permanentes | Use identidade única e verificada |

## Conclusão

Entender a arquitetura de proxy profundamente permite a você:

**Tomar Decisões Informadas:**
- Escolher o tipo de proxy certo para seu caso de uso
- Entender implicações de segurança
- Identificar quando proxies são necessários vs opcionais

**Solucionar Problemas Efetivamente:**
- Depurar problemas de conexão
- Identificar vazamentos de DNS ou IP
- Diagnosticar problemas de desempenho

**Otimizar Desempenho:**
- Configurar timeouts apropriados
- Implementar pooling de conexão
- Monitorar a saúde do proxy

**Construir Automação Melhor:**
- Combinar proxies com técnicas anti-detecção
- Implementar tratamento robusto de erros
- Escalar o uso de proxy eficientemente

O cenário de proxies é complexo, mas com esta base, você está equipado para navegá-lo com sucesso.

## Leitura Adicional

- **[RFC 1928](https://tools.ietf.org/html/rfc1928)**: Especificação do Protocolo SOCKS5
- **[RFC 1929](https://tools.ietf.org/html/rfc1929)**: Autenticação de Usuário/Senha SOCKS5
- **[RFC 2616](https://tools.ietf.org/html/rfc2616)**: HTTP/1.1 (método CONNECT; obsoleta, substituída pela [RFC 9110](https://www.rfc-editor.org/rfc/rfc9110.html))
- **[RFC 5389](https://tools.ietf.org/html/rfc5389)**: Protocolo STUN
- **[RFC 9298](https://tools.ietf.org/html/rfc9298)**: CONNECT-UDP (proxying HTTP/3)
- **[Guia de Configuração de Proxy](../../features/configuration/proxy.md)**: Uso prático de proxy no Pydoll, autenticação, rotação e testes
- **[Interceptação de Requisições](../../features/network/interception.md)**: Como o Pydoll implementa autenticação de proxy internamente
- **[Análise Profunda das Capacidades de Rede](./network-capabilities.md)**: Como o Pydoll lida com operações de rede

!!! tip "Experimentação"
    A melhor maneira de entender proxies verdadeiramente é:
    
    1. Configurar seu próprio servidor proxy (use o código de [Construindo Proxies](./build-proxy.md))
    2. Capturar tráfego com Wireshark para ver os pacotes brutos
    3. Testar diferentes tipos de proxy com automação real
    4. Criar vazamentos intencionalmente e aprender a detectá-los
    
    A experiência prática solidifica o conhecimento teórico!

================================================
FILE: docs/pt/deep-dive/network/socks-proxies.md
================================================
# Arquitetura do Protocolo SOCKS

SOCKS (SOCKet Secure) é um protocolo de proxy que opera entre as camadas de transporte e aplicação da pilha de rede (comumente descrito como Camada 5 no modelo OSI). Diferente dos proxies HTTP, que analisam e compreendem o tráfego HTTP, os proxies SOCKS encaminham conexões TCP e UDP brutas sem inspecionar seu conteúdo. Esse design agnóstico a protocolo torna o SOCKS a escolha preferida para automação focada em privacidade: o proxy nunca precisa analisar suas requisições, injetar cabeçalhos ou terminar conexões TLS.

Este documento cobre como o SOCKS funciona no nível do protocolo, as diferenças entre SOCKS4 e SOCKS5, o tratamento de autenticação no Chrome, o comportamento de resolução de DNS e a configuração prática no Pydoll.

!!! info "Navegação do Módulo"
    - [Proxies HTTP/HTTPS](./http-proxies.md): Proxy na camada de aplicação
    - [Fundamentos de Rede](./network-fundamentals.md): TCP/IP, UDP, modelo OSI
    - [Visão Geral de Rede e Segurança](./index.md): Introdução do módulo
    - [Detecção de Proxy](./proxy-detection.md): Níveis de anonimato e evasão de detecção
    - [Construindo Proxies](./build-proxy.md): Implementação do SOCKS5 do zero

    Para configuração prática, veja [Configuração de Proxy](../../features/configuration/proxy.md).

## Como o SOCKS Difere dos Proxies HTTP

A diferença fundamental está no que cada proxy pode ver e fazer. Um proxy HTTP opera na camada de aplicação e compreende HTTP: ele pode ler URLs, cabeçalhos, cookies e corpos de requisição (para tráfego não criptografado), modificá-los em trânsito, armazenar respostas em cache e injetar seus próprios cabeçalhos como `Via` e `X-Forwarded-For`. Isso é poderoso para filtragem de conteúdo, mas significa que você precisa confiar no operador do proxy com os dados da sua aplicação.

Um proxy SOCKS opera abaixo da camada de aplicação. Ele vê apenas o endereço de destino, a porta e o volume de dados sendo transferido. Ele não analisa, modifica ou sequer compreende qual protocolo está fluindo através dele. HTTP, HTTPS, FTP, SSH, WebSocket ou qualquer protocolo customizado parecem todos iguais para um proxy SOCKS: apenas bytes sendo retransmitidos entre dois endpoints.

Isso tem uma implicação prática direta. Quando você envia uma requisição HTTPS através de um proxy SOCKS5, o proxy vê `example.com:443` e o fluxo TLS criptografado. Ele não consegue ler a URL, os cabeçalhos, os cookies ou o conteúdo da resposta. Ele não adiciona cabeçalhos identificadores. Ele não precisa terminar o TLS. O túnel criptografado funciona de ponta a ponta entre seu navegador e o servidor de destino.

No entanto, é importante entender o que o SOCKS não fornece. SOCKS é um protocolo de proxy, não um protocolo de criptografia. O nome "SOCKet Secure" refere-se à travessia segura de firewalls, não à segurança criptográfica. Se você enviar tráfego HTTP não criptografado através de um proxy SOCKS5, o operador do proxy pode ler os bytes passando através dele, mesmo que o proxy não tenha sido projetado para inspecioná-los. Para criptografia real, você precisa de TLS/HTTPS sobre SOCKS, ou de um túnel criptografado (SSH, VPN) envolvendo a conexão SOCKS.

!!! note "Modelo de Confiança"
    Com proxies HTTP, você confia no operador do proxy para não registrar seu histórico de navegação, roubar tokens, modificar respostas ou realizar ataques MITM. Com SOCKS5, você confia no proxy apenas para encaminhar pacotes corretamente e não registrar metadados de conexão. A superfície de ataque é menor, mas não é zero.

## SOCKS4 vs SOCKS5

O SOCKS possui duas versões de uso comum. O SOCKS4 foi desenvolvido pela NEC no início dos anos 1990 como um padrão informal sem RFC. O SOCKS5 foi padronizado como RFC 1928 em 1996 para resolver as limitações do SOCKS4.

| Característica | SOCKS4 | SOCKS5 |
|---------|--------|--------|
| Padrão | Sem RFC oficial (de facto, 1992) | RFC 1928 (1996) |
| Autenticação | Apenas identificação (campo USERID, sem senha) | Múltiplos métodos (nenhum, usuário/senha, GSSAPI) |
| Versão IP | Apenas IPv4 | IPv4 e IPv6 |
| Suporte UDP | Não | Sim (comando UDP ASSOCIATE) |
| Resolução DNS | Lado do cliente (extensão SOCKS4A adiciona lado do servidor) | Lado do servidor ao usar nomes de domínio (ATYP=0x03) |
| Suporte a protocolo | Apenas TCP | TCP e UDP |

O SOCKS5 é superior em todos os aspectos práticos. Use SOCKS4 apenas se o proxy não suportar SOCKS5.

## O Handshake SOCKS5

O processo de conexão SOCKS5 segue a RFC 1928 e consiste em três fases: negociação de método, autenticação opcional e a requisição de conexão.

```mermaid
sequenceDiagram
    participant Client
    participant SOCKS5 as SOCKS5 Proxy
    participant Server as Target Server

    Note over Client,SOCKS5: Phase 1: Method Negotiation
    Client->>SOCKS5: Hello [VER=5, NMETHODS, METHODS]
    SOCKS5->>Client: Method Selected [VER=5, METHOD]

    Note over Client,SOCKS5: Phase 2: Authentication (if required)
    Client->>SOCKS5: Auth Request [VER=1, ULEN, UNAME, PLEN, PASSWD]
    SOCKS5->>Client: Auth Response [VER=1, STATUS]

    Note over Client,SOCKS5: Phase 3: Connection Request
    Client->>SOCKS5: Connect [VER=5, CMD=CONNECT, DST.ADDR, DST.PORT]
    SOCKS5->>Server: Establish TCP connection
    Server-->>SOCKS5: Connection established
    SOCKS5->>Client: Reply [VER=5, REP=SUCCESS, BND.ADDR, BND.PORT]

    Note over Client,Server: Data relay (proxied)
    Client->>SOCKS5: Application data
    SOCKS5->>Server: Forward data
    Server->>SOCKS5: Response data
    SOCKS5->>Client: Forward response
```

### Fase 1: Negociação de Método

O cliente abre uma conexão TCP com o proxy e envia uma saudação contendo a versão do protocolo (sempre `0x05` para SOCKS5) e uma lista de métodos de autenticação que ele suporta.

```python
# Client Hello
[
    0x05,        # VER: Protocol version (5)
    0x02,        # NMETHODS: Number of methods offered
    0x00, 0x02   # METHODS: No auth (0x00) and Username/Password (0x02)
]
```

O proxy responde com o método que ele seleciona. Se o proxy exigir autenticação e o cliente tiver oferecido `0x02` (usuário/senha), o proxy o seleciona. Se nenhum método aceitável foi oferecido, o proxy responde com `0xFF` e fecha a conexão.

```python
# Server response
[
    0x05,   # VER: Protocol version (5)
    0x02    # METHOD: Username/Password selected
]
```

Códigos de método definidos pela RFC 1928: `0x00` = sem autenticação, `0x01` = GSSAPI, `0x02` = usuário/senha (RFC 1929), `0x03-0x7F` = atribuídos pela IANA, `0x80-0xFE` = reservados para métodos privados, `0xFF` = nenhum método aceitável.

### Fase 2: Autenticação

Se o proxy selecionou o método `0x02`, o cliente envia as credenciais seguindo a RFC 1929. A subnegociação usa seu próprio número de versão (`0x01`, não `0x05`).

```python
# Client authentication
[
    0x01,              # VER: Subnegotiation version (1)
    len(username),     # ULEN: Username length (max 255)
    *username_bytes,   # UNAME: Username
    len(password),     # PLEN: Password length (max 255)
    *password_bytes    # PASSWD: Password
]

# Server response
[
    0x01,   # VER: Subnegotiation version (1)
    0x00    # STATUS: 0 = success, non-zero = failure
]
```

As credenciais são transmitidas em texto claro durante este handshake. Isso é inerente ao protocolo SOCKS5 (RFC 1929). Para ambientes sensíveis, envolva a conexão SOCKS em um túnel SSH ou VPN.

### Fase 3: Requisição de Conexão

Após a autenticação ser bem-sucedida (ou se nenhuma autenticação foi necessária), o cliente envia uma requisição de conexão especificando o comando, o endereço de destino e a porta.

```python
[
    0x05,          # VER: Protocol version (5)
    0x01,          # CMD: 1=CONNECT, 2=BIND, 3=UDP ASSOCIATE
    0x00,          # RSV: Reserved
    0x03,          # ATYP: 1=IPv4 (4 bytes), 3=Domain (length+name), 4=IPv6 (16 bytes)
    len(domain),   # Domain length (only for ATYP=0x03)
    *domain_bytes, # Domain name
    *port_bytes    # Port (2 bytes, big-endian)
]
```

O tipo de endereço (ATYP) determina o formato: `0x01` significa que 4 bytes de endereço IPv4 seguem, `0x04` significa 16 bytes de IPv6, e `0x03` significa um byte de comprimento seguido pelo nome do domínio. Quando o cliente envia um nome de domínio (ATYP=0x03), o proxy resolve o DNS do seu lado, o que previne vazamentos de DNS para a rede local do cliente.

O proxy conecta ao destino e envia uma resposta:

```python
[
    0x05,       # VER: Protocol version (5)
    0x00,       # REP: 0x00=success, 0x01-0x08=various errors
    0x00,       # RSV: Reserved
    0x01,       # ATYP: Address type of bound address
    *bind_addr, # BND.ADDR: Address the proxy bound to
    *bind_port  # BND.PORT: Port the proxy bound to
]
```

Códigos de resposta: `0x00` sucesso, `0x01` falha geral, `0x02` conexão não permitida, `0x03` rede inacessível, `0x04` host inacessível, `0x05` conexão recusada, `0x06` TTL expirado, `0x07` comando não suportado, `0x08` tipo de endereço não suportado.

Após uma resposta bem-sucedida, o proxy começa a retransmitir dados bidirecionalmente. Todo o handshake SOCKS5 usa um formato binário, o que o torna mais eficiente que o HTTP baseado em texto, mas mais difícil de depurar sem dumps hexadecimais.

## Suporte UDP

O SOCKS5 suporta proxy UDP através do comando `UDP ASSOCIATE` (CMD=0x03). Isso funciona de forma diferente do proxy TCP: o cliente envia uma requisição UDP ASSOCIATE pela conexão de controle TCP, e o proxy responde com um endereço e porta de retransmissão. O cliente então envia datagramas UDP para essa retransmissão, e o proxy os encaminha para seus destinos.

```mermaid
sequenceDiagram
    participant Client
    participant SOCKS5
    participant UDP_Server as UDP Server

    Note over Client,SOCKS5: TCP control connection (handshake + auth)
    Client->>SOCKS5: UDP ASSOCIATE request (CMD=0x03)
    SOCKS5->>Client: Relay address and port

    Note over Client,SOCKS5: UDP data transfer
    Client->>SOCKS5: UDP datagram to relay
    SOCKS5->>UDP_Server: Forward datagram
    UDP_Server->>SOCKS5: Response datagram
    SOCKS5->>Client: Forward response

    Note over Client,SOCKS5: TCP control connection stays open
```

Cada datagrama UDP enviado através da retransmissão inclui um pequeno cabeçalho com o endereço e a porta de destino:

```python
[
    0x00, 0x00,    # RSV: Reserved
    0x00,          # FRAG: Fragment number (0 = no fragmentation)
    0x01,          # ATYP: Address type
    *dst_addr,     # DST.ADDR: Destination address
    *dst_port,     # DST.PORT: Destination port
    *data          # DATA: Application data
]
```

A conexão de controle TCP deve permanecer aberta durante toda a duração da associação UDP. Se ela for fechada, o proxy descarta a retransmissão UDP.

!!! warning "UDP no Chrome"
    O Chrome não utiliza UDP ASSOCIATE do SOCKS5 para nenhum tráfego. Mesmo quando configurado com um proxy SOCKS5, o Chrome apenas faz proxy de conexões TCP. WebRTC, DNS-sobre-UDP e outros tráfegos UDP não são roteados pelo proxy SOCKS5. Isso significa que vazamentos de IP via WebRTC ainda são possíveis com SOCKS5 no Chrome. Use `--force-webrtc-ip-handling-policy=disable_non_proxied_udp` ou `webrtc_leak_protection = True` do Pydoll para mitigar isso. Para mais detalhes, veja [Fundamentos de Rede: WebRTC e Vazamento de IP](./network-fundamentals.md#webrtc-and-ip-leakage).

!!! tip "Alternativas Modernas de Proxy UDP"
    Para cenários que exigem suporte UDP completo além do que a implementação SOCKS5 do Chrome oferece, considere Shadowsocks (protocolo criptografado semelhante ao SOCKS com UDP nativo), WireGuard (VPN com excelente desempenho) ou V2Ray/VMess (framework de proxy flexível com tratamento UDP abrangente).

## Resolução de DNS

Um equívoco comum é que proxies HTTP vazam consultas DNS enquanto proxies SOCKS5 não. A realidade no Chrome é mais nuançada.

Quando o Chrome é configurado com qualquer proxy (HTTP, HTTPS ou SOCKS5), ele envia nomes de host para o proxy em vez de resolver DNS localmente. Para proxies HTTP, o nome do host aparece na requisição `CONNECT host:443`. Para SOCKS5, ele aparece na requisição de conexão com ATYP=0x03 (nome de domínio). Em ambos os casos, o proxy resolve o DNS do seu lado, e o Chrome não faz consultas DNS locais para tráfego direcionado ao proxy.

A verdadeira diferença de privacidade de DNS entre os dois tipos de proxy não é quem resolve o DNS, mas o que o proxy vê na camada de aplicação. Um proxy HTTP vê a URL completa para requisições não criptografadas e o nome do host para requisições CONNECT. Um proxy SOCKS5 vê apenas o nome do host de destino e a porta como parâmetros opacos de conexão.

No entanto, existe uma ressalva importante: o prefetcher de DNS do Chrome pode fazer consultas DNS locais para nomes de host encontrados no conteúdo da página, mesmo quando um proxy está configurado. Isso pode vazar os domínios que você está navegando para o seu resolvedor DNS local. Para prevenir isso, desabilite o prefetching de DNS ou use a flag `--host-resolver-rules="MAP * ~NOTFOUND , EXCLUDE 127.0.0.1"`.

!!! note "`socks5://` vs `socks5h://`"
    Muitas ferramentas fora do Chrome distinguem entre `socks5://` (cliente resolve DNS) e `socks5h://` (proxy resolve DNS, o "h" significa hostname). O Chrome sempre resolve DNS do lado do proxy para SOCKS5, comportando-se como `socks5h://` independentemente de qual esquema você use. Mas se você usar ferramentas como `curl`, Firefox ou bibliotecas Python junto com o Pydoll, a distinção importa: sempre use `socks5h://` para prevenir vazamentos de DNS.

## SOCKS5 e Resistência a MITM

O SOCKS5 é frequentemente descrito como "resistente a MITM". Isso é verdade em um sentido específico: como o SOCKS5 não compreende nem interage com TLS, ele não tem mecanismo para terminar uma conexão TLS e recriptografá-la. Um proxy SOCKS5 simplesmente retransmite bytes criptografados sem modificação.

Um proxy HTTP, por outro lado, pode realizar terminação TLS (MITM) apresentando seu próprio certificado ao cliente, descriptografando o tráfego, inspecionando ou modificando-o, e recriptografando-o em direção ao servidor. Isso exige que o cliente confie no certificado CA do proxy, e é detectável através de certificate pinning e logs de Certificate Transparency. O comportamento normal de um proxy HTTP com HTTPS (usando CONNECT) é criar um túnel transparente sem terminação, mas a possibilidade arquitetônica de MITM existe.

Com SOCKS5, a terminação TLS não é possível no nível do protocolo. O proxy não consegue se inserir no handshake TLS porque ele não analisa os dados da aplicação fluindo através dele. A criptografia de ponta a ponta entre cliente e servidor é preservada por design.

Vale notar que é o TLS que fornece a proteção criptográfica real, não o SOCKS5 em si. Se você enviar HTTP não criptografado através de um proxy SOCKS5, o operador do proxy pode ler tudo. A vantagem de segurança do SOCKS5 é arquitetônica (ele não exige nem permite terminação TLS), não criptográfica.

## TLS e Browser Fingerprinting Através do SOCKS5

Uma limitação importante para entender: o SOCKS5 não altera o fingerprint do seu navegador. O handshake TLS (ClientHello) passa pelo proxy SOCKS5 byte por byte, o que significa que o servidor de destino vê o fingerprint JA3/JA4 exato do seu navegador. O mesmo se aplica aos frames HTTP/2 SETTINGS, à ordenação de cabeçalhos específica do navegador e a todos os outros sinais de fingerprinting na camada de aplicação.

O SOCKS5 oculta seu endereço IP e impede que o proxy injete cabeçalhos identificadores. Ele não ajuda com nenhuma forma de browser fingerprinting ou fingerprinting comportamental. Para uma estratégia completa de evasão, você precisa abordar o fingerprinting em múltiplas camadas. Veja [Técnicas de Evasão](../fingerprinting/evasion-techniques.md) para detalhes.

## Autenticação SOCKS5 no Chrome

O Chrome não suporta autenticação por usuário/senha do SOCKS5. Esta é uma limitação de longa data rastreada como [Chromium Issue #40323993](https://issues.chromium.org/issues/40323993). Quando o Chrome realiza a negociação de método SOCKS5, ele oferece apenas o método `0x00` (sem autenticação). Se o proxy exigir autenticação, a conexão falha silenciosamente.

Isso é fundamentalmente diferente da autenticação de proxy HTTP. Proxies HTTP autenticam via códigos de status HTTP (`407 Proxy Authentication Required`), que o Chrome trata através do domínio Fetch no CDP. O Pydoll intercepta esses eventos `Fetch.authRequired` e responde com as credenciais armazenadas automaticamente. A autenticação SOCKS5, por outro lado, acontece durante um handshake de protocolo binário na camada de sessão, antes que qualquer tráfego HTTP exista. Não há HTTP 407, nenhum evento `Fetch.authRequired` e nenhuma forma de ferramentas baseadas em CDP injetarem credenciais nesse processo.

Configurar `--proxy-server=socks5://user:pass@proxy:1080` não funciona. O Chrome ignora silenciosamente as credenciais embutidas.

### SOCKS5Forwarder do Pydoll

A solução padrão é um proxy forwarder local: um servidor SOCKS5 leve rodando no localhost que aceita conexões não autenticadas do Chrome e as encaminha para o proxy remoto com autenticação completa.

```mermaid
sequenceDiagram
    participant Chrome
    participant Forwarder as Local Forwarder<br/>(127.0.0.1:1081)
    participant Remote as Remote SOCKS5 Proxy<br/>(proxy:1080)
    participant Server as Destination Server

    Note over Chrome,Forwarder: No authentication
    Chrome->>Forwarder: SOCKS5 Hello [methods: 0x00]
    Forwarder->>Chrome: Method selected [0x00]
    Chrome->>Forwarder: CONNECT example.com:443

    Note over Forwarder,Remote: With authentication
    Forwarder->>Remote: SOCKS5 Hello [methods: 0x02]
    Remote->>Forwarder: Method selected [0x02]
    Forwarder->>Remote: Auth [username, password]
    Remote->>Forwarder: Auth OK
    Forwarder->>Remote: CONNECT example.com:443
    Remote->>Server: TCP connection
    Remote->>Forwarder: Connect OK

    Forwarder->>Chrome: Connect OK

    Note over Chrome,Server: Bidirectional data relay
    Chrome->>Forwarder: TLS + application data
    Forwarder->>Remote: Forward
    Remote->>Server: Forward
    Server->>Remote: Response
    Remote->>Forwarder: Forward
    Forwarder->>Chrome: Forward
```

O Pydoll fornece um `SOCKS5Forwarder` integrado no módulo `pydoll.utils`. É uma implementação async pura em Python, sem dependências externas, que lida com o handshake SOCKS5 completo com o proxy remoto, incluindo autenticação por usuário/senha (RFC 1929), tipos de endereço IPv4, IPv6 e domínio.

```python
import asyncio
from pydoll.utils import SOCKS5Forwarder
from pydoll.browser.chromium import Chrome
from pydoll.browser.options import ChromiumOptions

async def main():
    forwarder = SOCKS5Forwarder(
        remote_host='proxy.example.com',
        remote_port=1080,
        username='myuser',
        password='mypass',
        local_port=1081,  # Use 0 for auto-assigned port
    )
    async with forwarder:
        options = ChromiumOptions()
        options.add_argument(f'--proxy-server=socks5://127.0.0.1:{forwarder.local_port}')

        async with Chrome(options=options) as browser:
            tab = await browser.start()
            await tab.go_to('https://httpbin.org/ip')

asyncio.run(main())
```

O forwarder também pode ser executado como ferramenta CLI standalone para testes ou uso com outras aplicações:

```bash
python -m pydoll.utils.socks5_proxy_forwarder \
    --remote-host proxy.example.com \
    --remote-port 1080 \
    --username myuser \
    --password mypass \
    --local-port 1081
```

O forwarder se vincula a `127.0.0.1` por padrão, tornando-o acessível apenas da sua máquina. Nunca vincule a `0.0.0.0` em produção, pois isso exporia um proxy SOCKS5 sem autenticação para a rede. As credenciais nunca são registradas em texto claro nos logs. O forwarder adiciona latência sub-milissegundo, já que toda a comunicação acontece pela interface de loopback local.

!!! tip "Ambientes Restritos"
    Alguns ambientes (contêineres Docker, plataformas serverless, VMs endurecidas) podem restringir a vinculação a portas locais. Use `local_port=0` para deixar o SO atribuir uma porta disponível. Se a vinculação local estiver completamente bloqueada, considere usar um proxy HTTP CONNECT, que o Chrome suporta nativamente com autenticação via ProxyManager do Pydoll.

## Configuração Prática

**SOCKS5 básico (sem autenticação):**

```python
from pydoll.browser.chromium import Chrome
from pydoll.browser.options import ChromiumOptions

options = ChromiumOptions()
options.add_argument('--proxy-server=socks5://proxy.example.com:1080')

async with Chrome(options=options) as browser:
    tab = await browser.start()
    await tab.go_to('https://example.com')
```

**SOCKS5 com autenticação (via SOCKS5Forwarder):**

Veja a [seção do SOCKS5Forwarder](#socks5forwarder-do-pydoll) acima.

**Prevenindo vazamentos:**

Para uma configuração SOCKS5 completa, você também deve prevenir vazamentos de WebRTC e DNS prefetch:

```python
options = ChromiumOptions()
options.add_argument('--proxy-server=socks5://proxy.example.com:1080')
options.webrtc_leak_protection = True  # Prevents WebRTC IP leaks
options.add_argument('--disable-quic')  # Forces HTTP/2 over TCP through proxy
```

**Testando sua configuração:**

Sempre verifique sua configuração de proxy com testes de vazamento. Visite [browserleaks.com/ip](https://browserleaks.com/ip) para confirmar seu IP, [browserleaks.com/webrtc](https://browserleaks.com/webrtc) para verificar vazamentos de WebRTC, e [dnsleaktest.com](https://dnsleaktest.com/) para confirmar que o DNS não está vazando.

## Resumo

O SOCKS5 fornece proxy agnóstico a protocolo com uma superfície de confiança menor que a dos proxies HTTP. Ele não analisa, modifica ou injeta nada no seu tráfego. A resolução de DNS acontece do lado do proxy no Chrome. A criptografia TLS é preservada de ponta a ponta. As principais limitações no Chrome são a falta de autenticação SOCKS5 nativa (resolvida pelo `SOCKS5Forwarder` do Pydoll) e a ausência de proxy UDP (mitigada desabilitando o WebRTC ou usando as flags apropriadas do navegador).

O SOCKS5 não altera o fingerprint TLS do seu navegador, as configurações HTTP/2 ou quaisquer características da camada de aplicação. Para evasão completa, combine SOCKS5 com gerenciamento de browser fingerprint e simulação comportamental.

**Próximos passos:**

- [Detecção de Proxy](./proxy-detection.md): Como até mesmo proxies SOCKS5 podem ser detectados
- [Construindo Proxies](./build-proxy.md): Implemente seu próprio servidor SOCKS5
- [Configuração de Proxy](../../features/configuration/proxy.md): Configuração prática de proxy no Pydoll
- [Técnicas de Evasão](../fingerprinting/evasion-techniques.md): Estratégia de evasão multicamada

## Referências

- RFC 1928: SOCKS Protocol Version 5 (1996) - https://datatracker.ietf.org/doc/html/rfc1928
- RFC 1929: Username/Password Authentication for SOCKS V5 (1996) - https://datatracker.ietf.org/doc/html/rfc1929
- RFC 1961: GSS-API Authentication Method for SOCKS V5 (1996) - https://datatracker.ietf.org/doc/html/rfc1961
- RFC 3089: SOCKS-based IPv6/IPv4 Gateway Mechanism (2001) - https://datatracker.ietf.org/doc/html/rfc3089
- Chromium Proxy Documentation - https://chromium.googlesource.com/chromium/src/+/689912289c/net/docs/proxy.md
- Chromium Issue #40323993: SOCKS5 Authentication - https://issues.chromium.org/issues/40323993
- BrowserLeaks: WebRTC Leak Test - https://browserleaks.com/webrtc
- DNS Leak Test - https://dnsleaktest.com/
- IPLeak: Comprehensive Leak Testing - https://ipleak.net


================================================
FILE: docs/pt/features/advanced/behavioral-captcha-bypass.md
================================================
# Interação com Cloudflare Turnstile

O Pydoll oferece suporte nativo para interagir com captchas Cloudflare Turnstile realizando cliques realistas do navegador. Isso **não é um bypass ou evasão**. Ele simplesmente automatiza a mesma ação de clique que um humano realizaria na caixa de seleção do captcha.

!!! warning "O que esta Funcionalidade Realmente Faz"
    Esta funcionalidade **clica** na caixa de seleção do captcha Cloudflare Turnstile usando interações padrão do navegador. É isso. Não há:
    
    - **NÃO**: Bypass mágico ou evasão
    - **NÃO**: Resolução de desafios (seleção de imagens, quebra-cabeças, etc.)
    - **NÃO**: Manipulação de pontuação ou falsificação de fingerprint
    - **SIM**: Apenas um clique realista no contêiner do captcha
    
    **O sucesso depende inteiramente do seu ambiente** (reputação do IP, fingerprint do navegador, padrões de comportamento). O Pydoll fornece o mecanismo para clicar; seu ambiente determina se o clique é aceito.

!!! info "O que é o Cloudflare Turnstile?"
    O Cloudflare Turnstile é um sistema de captcha moderno que analisa o ambiente do navegador e sinais comportamentais para determinar se você é humano. Ele geralmente aparece como uma caixa de seleção que os usuários devem clicar. O sistema analisa:
    
    - **Reputação do IP**: Seu endereço IP está sinalizado ou é suspeito?
    - **Fingerprint do Navegador**: Seu navegador parece legítimo?
    - **Padrões Comportamentais**: Você se comporta como um humano?
    
    Quando a pontuação de confiança é alta o suficiente, o clique na caixa de seleção é aceito. Quando está muito baixa, o Turnstile pode mostrar um desafio (que o Pydoll **não pode resolver**) ou bloqueá-lo totalmente. Para resolver desafios com imagens ou quebra-cabeças, considere usar o **[CapSolver](https://dashboard.capsolver.com/passport/register?inviteCode=WPhTbOsbXEpc)**.

## Guia Rápido

### Gerenciador de Contexto (Recomendado)

O gerenciador de contexto espera o captcha aparecer, clica nele e espera pela resolução antes de continuar:

```python
import asyncio
from pydoll.browser.chromium import Chrome
from pydoll.browser.options import ChromiumOptions

async def turnstile_example():
    options = ChromiumOptions()
    options.add_argument('--disable-blink-features=AutomationControlled')
    
    async with Chrome(options=options) as browser:
        tab = await browser.start()
        
        # Gerenciador de contexto lida com o captcha automaticamente
        async with tab.expect_and_bypass_cloudflare_captcha():
            await tab.go_to('https://site-with-turnstile.com')
        
        # Este código só roda após o captcha ser clicado
        print("Interação com o captcha Turnstile concluída!")
        
        # Continue com sua automação
        content = await tab.find(id='protected-content')
        print(await content.text)

asyncio.run(turnstile_example())
```

### Processamento em Segundo Plano

Habilite o clique automático do captcha em segundo plano:

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def background_turnstile():
    async with Chrome() as browser:
        tab = await browser.start()
        
        # Habilitar clique automático antes de navegar
        await tab.enable_auto_solve_cloudflare_captcha()
        
        # Navegar para o site protegido
        await tab.go_to('https://site-with-turnstile.com')
        
        # Esperar o captcha ser processado em segundo plano
        await asyncio.sleep(5)
        
        print("Página carregada com manejo de captcha em segundo plano")
        
        # Desabilitar quando não for mais necessário
        await tab.disable_auto_solve_cloudflare_captcha()

asyncio.run(background_turnstile())
```

## Personalizando a Interação com o Captcha

### Como Funciona

O Pydoll detecta automaticamente o Cloudflare Turnstile percorrendo o shadow DOM da página. Ele procura um shadow root contendo `challenges.cloudflare.com`, navega até seu iframe cross-origin, encontra o shadow root interno e clica no elemento checkbox real. Nenhuma configuração manual de seletor é necessária.

### Configuração de Tempo (Timing)

O shadow root do captcha nem sempre aparece imediatamente. Ajuste o timeout para corresponder ao comportamento do site:

```python
async def timing_configuration_example():
    async with Chrome() as browser:
        tab = await browser.start()

        async with tab.expect_and_bypass_cloudflare_captcha(
            time_to_wait_captcha=10   # Esperar até 10 segundos pelo captcha aparecer (padrão: 5)
        ):
            await tab.go_to('https://site-with-slow-turnstile.com')

        print("Interação com o captcha concluída com tempo personalizado!")

asyncio.run(timing_configuration_example())
```

**Referência de Parâmetros:**

| Parâmetro | Tipo | Padrão | Descrição |
|---|---|---|---|
| `time_to_wait_captcha` | `float` | `5` | Segundos máximos para esperar o captcha aparecer |

!!! info "Por que o Tempo Importa"
    Alguns sites carregam o captcha assincronamente. Se o shadow root do Cloudflare não aparecer dentro de `time_to_wait_captcha`, a interação é pulada.

## Outros Sistemas de Captcha

### reCAPTCHA v3 (Invisível)

O reCAPTCHA v3 é **completamente invisível** e **não requer interação**. Apenas navegue normalmente:

```python
async def recaptcha_v3_example():
    options = ChromiumOptions()
    options.add_argument('--disable-blink-features=AutomationControlled')
    
    async with Chrome(options=options) as browser:
        tab = await browser.start()
        
        # Nenhum tratamento especial necessário - apenas navegue
        await tab.go_to('https://site-with-recaptcha-v3.com')
        
        # reCAPTCHA v3 roda em segundo plano, analisando seu comportamento
        await asyncio.sleep(3)
        
        # Continue com o envio do formulário
        submit_button = await tab.find(id='submit-btn')
        await submit_button.click()

asyncio.run(recaptcha_v3_example())
```

!!! note "Fatores de Sucesso do reCAPTCHA v3"
    Como o reCAPTCHA v3 é inteiramente passivo (sem interação), o sucesso depende de:
    
    - **Reputação do IP**: Use proxies residenciais com boa reputação
    - **Fingerprint do Navegador**: Configure preferências de navegador realistas
    - **Padrões Comportamentais**: Passe tempo na página, role naturalmente, digite realisticamente
    
    Se sua pontuação for muito baixa, alguns sites podem mostrar um desafio reCAPTCHA v2 (que o Pydoll **não pode resolver**).

## O que Determina o Sucesso?

O sucesso da interação com o captcha depende **inteiramente do seu ambiente**, não do Pydoll. O sistema de captcha analisa:

### 1. Reputação do IP (Mais Crítico)

| Tipo de IP | Nível de Confiança | Comportamento Esperado |
|---|---|---|
| **IP Residencial (limpo)** | Alto | Geralmente aceito sem desafios |
| **IP Móvel** | Alto | Geralmente aceito sem desafios |
| **IP de Datacenter** | Baixo | Frequentemente bloqueado ou desafiado |
| **IP previamente bloqueado** | Muito Baixo | Quase sempre bloqueado ou desafiado |

!!! danger "Reputação do IP é Tudo"
    **Nenhuma ferramenta pode superar um endereço IP ruim.** Se seu IP estiver sinalizado, você será bloqueado ou desafiado, independentemente de quão realista seu navegador pareça.
    
    Use proxies residenciais com boa reputação para melhores resultados.

### 2. Fingerprint do Navegador

Configure seu navegador para parecer legítimo:

```python
import asyncio
import time
from pydoll.browser.chromium import Chrome
from pydoll.browser.options import ChromiumOptions

async def stealth_configuration():
    options = ChromiumOptions()
    
    # Argumentos de furtividade
    options.add_argument('--disable-blink-features=AutomationControlled')
    options.add_argument('--window-size=1920,1080')
    
    # Preferências de navegador realistas
    current_time = int(time.time())
    options.browser_preferences = {
        'profile': {
            'last_engagement_time': str(current_time - (3 * 60 * 60)),  # 3 horas atrás
            'exited_cleanly': True,
            'exit_type': 'Normal',
        },
        'safebrowsing': {'enabled': True},
    }
    
    async with Chrome(options=options) as browser:
        tab = await browser.start()
        
        async with tab.expect_and_bypass_cloudflare_captcha():
            await tab.go_to('https://site-with-turnstile.com')

asyncio.run(stealth_configuration())
```

### 3. Padrões Comportamentais

Sistemas de captcha analisam como você interage com a página:

```python
async def realistic_behavior():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://site-with-turnstile.com')
        
        # Simular comportamento humano antes do captcha aparecer
        await asyncio.sleep(2)  # Ler conteúdo da página
        await tab.execute_script('window.scrollBy(0, 300)')  # Rolar
        await asyncio.sleep(1)
        
        # Agora interagir com o captcha
        async with tab.expect_and_bypass_cloudflare_captcha():
            # A interação com o captcha acontece aqui
            pass
        
        print("Captcha passado com comportamento realista!")

asyncio.run(realistic_behavior())
```

!!! tip "Fingerprinting Comportamental"
    Para um entendimento aprofundado de como os padrões comportamentais afetam o sucesso do captcha, veja **[Fingerprinting Comportamental](../../deep-dive/fingerprinting/behavioral-fingerprinting.md)**. Este guia explica:
    
    - Padrões de movimento do mouse e detecção
    - Análise de tempo de pressionamento de teclas
    - Física do comportamento de rolagem
    - Análise de sequência de eventos
    
    Entender esses conceitos pode ajudá-lo a construir uma automação mais realista que alcança taxas de sucesso mais altas.

## Solução de Problemas

### Captcha Não Está Sendo Clicado

**Sintomas**: O captcha aparece, mas nunca é clicado, e a página permanece no desafio.

**Causas Possíveis:**

1.  **Tempo muito curto**: O captcha ainda não carregou quando o Pydoll tenta clicar
2.  **Shadow root não encontrado**: O shadow root do Cloudflare Turnstile ainda não apareceu no DOM

**Soluções:**

```python
async def troubleshooting_example():
    async with Chrome() as browser:
        tab = await browser.start()

        # Aumentar o tempo de espera pelo captcha
        async with tab.expect_and_bypass_cloudflare_captcha(
            time_to_wait_captcha=15  # Mais tempo para encontrar o captcha
        ):
            await tab.go_to('https://problematic-site.com')

asyncio.run(troubleshooting_example())
```

### Captcha Clicado, mas Mostra Desafio

**Sintomas**: A caixa de seleção mostra a marca de verificação brevemente, depois apresenta um desafio de imagem/quebra-cabeça.

**Causa Raiz**: A pontuação de confiança do seu ambiente está muito baixa.

**Soluções:**

- Use proxies residenciais com boa reputação
- Configure um fingerprint de navegador realista
- Adicione padrões comportamentais mais realistas (rolagem, movimento do mouse, atrasos)
- **Nota**: O Pydoll não pode resolver o desafio em si. Se você precisa de resolução automática de captchas, considere integrar com o **[CapSolver](https://dashboard.capsolver.com/passport/register?inviteCode=WPhTbOsbXEpc)**

### "Acesso Negado" ou Bloqueio Imediato

**Sintomas**: O site mostra imediatamente "Acesso Negado" ou bloqueia você sem mostrar o captcha.

**Causa Raiz**: **Seu endereço IP está sinalizado.**

**Soluções:**

- Use um proxy residencial diferente com boa reputação
- Rotacione IPs entre as requisições
- Teste seu IP em `https://www.cloudflare.com/cdn-cgi/trace`
- **Nota**: Nenhuma configuração de navegador corrigirá um IP sinalizado

### Funciona Localmente, mas Falha no Docker/CI

**Sintomas**: A interação com o captcha funciona na sua máquina, mas falha em ambientes Docker/CI.

**Causa Raiz**: IPs de datacenter são examinados de perto pelos sistemas de captcha.

**Soluções:**

1.  **Execute o navegador com um display virtual (Xvfb)** (para renderização completa):
    ```dockerfile
    FROM python:3.11-slim
   
    RUN apt-get update && apt-get install -y \
        chromium \
        chromium-driver \
        xvfb \
        && rm -rf /var/lib/apt/lists/*
   
    ENV DISPLAY=:99
   
    CMD Xvfb :99 -screen 0 1920x1080x24 & python your_script.py
    ```

2.  **Use proxy residencial** mesmo em CI/CD:
    ```python
    options = ChromiumOptions()
    options.add_argument('--proxy-server=http://user:pass@residential-proxy.com:8080')
    ```

## Melhores Práticas

1.  **Use proxies residenciais**: A reputação do IP é o fator mais crítico
2.  **Configure opções de furtividade**: Remova indicadores de automação
3.  **Adicione padrões comportamentais**: Role, espere, mova o mouse antes de clicar
4.  **Ajuste o tempo**: Dê tempo ao captcha para carregar antes de tentar clicar
5.  **Lide com falhas graciosamente**: Tenha lógica de fallback para quando o captcha não puder ser passado
6.  **Teste seu ambiente**: Verifique a reputação do IP e o fingerprint do navegador antes da automação

## Diretrizes Éticas

!!! danger "Termos de Serviço e Conformidade Legal"
    Interagir com captchas pode violar os Termos de Serviço de um site, mesmo que tecnicamente possível. **Sempre verifique e respeite os ToS** antes de automatizar qualquer site.
    
    Esta funcionalidade é fornecida **apenas para fins legítimos de automação**:
    
    **Casos de uso apropriados:**
    - Teste automatizado de suas próprias aplicações
    - Serviços de monitoramento que você tem permissão para monitorar
    - Pesquisa e análise de segurança com autorização adequada
    
    **Casos de uso inapropriados:**
    - Raspagem de conteúdo que você não tem permissão para acessar
    - Contornar paywalls ou sistemas de assinatura
    - Ataques de negação de serviço (Denial-of-Service) ou raspagem agressiva
    - Qualquer atividade que viole os Termos de Serviço

## Veja Também

- **[Opções do Navegador](../configuration/browser-options.md)** - Configuração de furtividade
- **[Preferências do Navegador](../configuration/browser-preferences.md)** - Fingerprinting avançado
- **[Configuração de Proxy](../configuration/proxy.md)** - Configurando proxies
- **[Fingerprinting Comportamental](../../deep-dive/fingerprinting/behavioral-fingerprinting.md)** - Entendendo a detecção comportamental
- **[Interações Semelhantes a Humanas](../automation/human-interactions.md)** - Padrões de comportamento realistas

---

**Lembre-se**: O Pydoll fornece o mecanismo para clicar em captchas, mas seu ambiente (IP, fingerprint, comportamento) determina o sucesso. Esta não é uma solução mágica, é uma ferramenta que funciona quando usada no ambiente certo com a configuração adequada.

================================================
FILE: docs/pt/features/advanced/decorators.md
================================================
# Decorator Retry

Web scraping é inerentemente imprevisível. Redes falham, páginas carregam lentamente, elementos aparecem e desaparecem, limites de taxa entram em ação e CAPTCHAs surgem inesperadamente. O decorator `@retry` fornece uma solução robusta e testada em produção para lidar com essas falhas inevitáveis de forma elegante.

## Por Que Usar o Decorator Retry?

No scraping em produção, falhas não são exceções—são a norma. Em vez de deixar todo o seu trabalho de scraping travar por causa de uma falha temporária de rede ou um elemento ausente, o decorator retry permite que você:

- **Recupere-se automaticamente** de falhas transitórias
- **Implemente estratégias sofisticadas de retry** com backoff exponencial
- **Execute lógica de recuperação** antes de tentar novamente (atualizar página, trocar proxy, reiniciar navegador)
- **Mantenha sua lógica de negócio limpa** sem poluí-la com código de tratamento de erros

## Início Rápido

```python
import asyncio
from pydoll.browser.chromium import Chrome
from pydoll.decorators import retry
from pydoll.exceptions import WaitElementTimeout, NetworkError

@retry(max_retries=3, exceptions=[WaitElementTimeout, NetworkError])
async def scrape_product_page(url: str):
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to(url)
        
        # Isso pode falhar devido a problemas de rede ou carregamento lento
        product_title = await tab.find(class_name='product-title', timeout=5)
        return await product_title.text

asyncio.run(scrape_product_page('https://example.com/product/123'))
```

Se `scrape_product_page` falhar com `WaitElementTimeout` ou `NetworkError`, ela automaticamente tentará novamente até 3 vezes antes de desistir.

## Boa Prática: Sempre Especifique Exceções

!!! warning "Boa Prática Crítica"
    **SEMPRE** especifique quais exceções devem acionar um retry. Usar o padrão `exceptions=Exception` vai capturar **tudo**, incluindo bugs no seu código que deveriam falhar imediatamente.

**Ruim (captura tudo, incluindo bugs):**

```python
@retry(max_retries=3)  # NÃO FAÇA ISSO
async def scrape_data():
    data = response['items'][0]  # Se 'items' não existir, retries não vão ajudar!
    return data
```

**Bom (só tenta novamente em falhas esperadas):**

```python
from pydoll.exceptions import ElementNotFound, WaitElementTimeout, NetworkError

@retry(
    max_retries=3,
    exceptions=[ElementNotFound, WaitElementTimeout, NetworkError]
)
async def scrape_data():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com')
        return await tab.find(id='data-container', timeout=10)
```

Ao especificar exceções, você garante que:

- **Erros de lógica falham rapidamente** (typos, seletores errados, bugs de código)
- **Apenas erros recuperáveis são retentados** (problemas de rede, timeouts, elementos ausentes)
- **Depuração é mais fácil** (você sabe exatamente o que deu errado)

## Parâmetros

### max_retries

Número máximo de tentativas de retry antes de desistir.

```python
from pydoll.exceptions import WaitElementTimeout

@retry(max_retries=5, exceptions=[WaitElementTimeout])
async def fetch_data():
    # Tentará até 5 vezes no total
    pass
```

### exceptions

Tipos de exceção que devem acionar um retry. Pode ser uma única exceção ou uma lista.

```python
from pydoll.exceptions import (
    ElementNotFound,
    WaitElementTimeout,
    NetworkError,
    ElementNotInteractable
)

# Exceção única
@retry(exceptions=[WaitElementTimeout])
async def example1():
    pass

# Múltiplas exceções
@retry(exceptions=[WaitElementTimeout, NetworkError, ElementNotFound, ElementNotInteractable])
async def example2():
    pass
```

!!! tip "Exceções Comuns de Scraping"
    Para web scraping com Pydoll, você normalmente vai querer retry em:

    - `WaitElementTimeout` - Timeout esperando elemento aparecer
    - `ElementNotFound` - Elemento não existe no DOM
    - `ElementNotVisible` - Elemento existe mas não está visível
    - `ElementNotInteractable` - Elemento não pode receber interação
    - `NetworkError` - Problemas de conectividade de rede
    - `ConnectionFailed` - Falha ao conectar ao navegador
    - `PageLoadTimeout` - Timeout no carregamento de página
    - `ClickIntercepted` - Clique interceptado por outro elemento

### delay

Tempo de espera entre tentativas de retry (em segundos).

```python
from pydoll.exceptions import WaitElementTimeout

@retry(max_retries=3, exceptions=[WaitElementTimeout], delay=2.0)
async def scrape_with_delay():
    # Espera 2 segundos entre cada retry
    pass
```

### exponential_backoff

Quando `True`, aumenta o delay exponencialmente com cada tentativa de retry.

```python
from pydoll.exceptions import NetworkError

@retry(
    max_retries=5,
    exceptions=[NetworkError],
    delay=1.0,
    exponential_backoff=True
)
async def scrape_with_backoff():
    # Tentativa 1: falha → espera 1 segundo
    # Tentativa 2: falha → espera 2 segundos
    # Tentativa 3: falha → espera 4 segundos
    # Tentativa 4: falha → espera 8 segundos
    # Tentativa 5: falha → lança exceção
    pass
```

**O que é Exponential Backoff?**

Exponential backoff é uma estratégia de retry onde o tempo de espera entre tentativas aumenta exponencialmente. Em vez de bombardear um servidor com requisições a cada segundo, você dá progressivamente mais tempo para ele se recuperar:

- **Tentativa 1**: Espera `delay` segundos (ex: 1s)
- **Tentativa 2**: Espera `delay * 2` segundos (ex: 2s)
- **Tentativa 3**: Espera `delay * 4` segundos (ex: 4s)
- **Tentativa 4**: Espera `delay * 8` segundos (ex: 8s)

Isso é especialmente útil quando:

- Lidando com **limites de taxa** (dê tempo ao servidor para resetar)
- Lidando com **sobrecarga temporária do servidor** (não piore a situação)
- Esperando **conteúdo dinâmico de carregamento lento**
- Evitando **detecção como bot** (padrões de retry com aparência natural)

### on_retry

Uma função callback executada após cada tentativa falhada, antes do próximo retry. Deve ser uma **função async**.

```python
from pydoll.exceptions import WaitElementTimeout

@retry(
    max_retries=3,
    exceptions=[WaitElementTimeout],
    on_retry=my_recovery_function
)
async def scrape_data():
    pass
```

O callback pode ser:

- **Uma função async standalone**
- **Um método de classe** (recebe `self` automaticamente)

## O Callback on_retry: Seu Mecanismo de Recuperação

O callback `on_retry` é onde a verdadeira mágica acontece. Esta é sua oportunidade de **restaurar o estado da aplicação** antes da próxima tentativa de retry.

### Função Standalone

```python
import asyncio
from pydoll.decorators import retry
from pydoll.exceptions import WaitElementTimeout

async def log_retry():
    print("Tentativa de retry falhou, esperando antes da próxima tentativa...")
    await asyncio.sleep(1)

@retry(max_retries=3, exceptions=[WaitElementTimeout], on_retry=log_retry)
async def scrape_page():
    # Sua lógica de scraping
    pass
```

### Método de Classe

Ao usar o decorator dentro de uma classe, o callback pode ser um método de classe. Ele receberá automaticamente `self` como primeiro argumento.

```python
import asyncio
from pydoll.decorators import retry
from pydoll.exceptions import WaitElementTimeout

class DataCollector:
    def __init__(self):
        self.retry_count = 0
    
    # IMPORTANTE: Defina o callback ANTES do método decorado
    async def log_retry(self):
        self.retry_count += 1
        print(f"Tentativa {self.retry_count} falhou, tentando novamente...")
        await asyncio.sleep(1)
    
    @retry(
        max_retries=3,
        exceptions=[WaitElementTimeout],
        on_retry=log_retry  # Sem prefixo 'self.' necessário
    )
    async def fetch_data(self):
        # Sua lógica de scraping aqui
        pass
```

!!! warning "Ordem de Definição de Métodos Importa"
    Ao usar `on_retry` com métodos de classe, **você deve definir o método callback ANTES do método decorado** na definição da sua classe. Python precisa saber sobre o callback quando o decorator é aplicado.

    **Errado (vai falhar):**

    ```python
    class Scraper:
        @retry(on_retry=handle_retry)  # handle_retry ainda não existe!
        async def scrape(self):
            pass
        
        async def handle_retry(self):  # Definido muito tarde
            pass
    ```

    **Correto:**

    ```python
    class Scraper:
        async def handle_retry(self):  # Definido primeiro
            pass
        
        @retry(on_retry=handle_retry)  # Agora existe
        async def scrape(self):
            pass
    ```

## Casos de Uso do Mundo Real

### 1. Atualização de Página e Recuperação de Estado

**Este é o uso mais poderoso do `on_retry`**: recuperar de falhas atualizando a página e restaurando o estado da sua aplicação. Este exemplo demonstra por que o decorator retry é tão valioso para scraping em produção.

```python
from pydoll.browser.chromium import Chrome
from pydoll.decorators import retry
from pydoll.exceptions import ElementNotFound, WaitElementTimeout
from pydoll.constants import Key
import asyncio

class DataScraper:
    def __init__(self):
        self.browser = None
        self.tab = None
        self.current_page = 1
    
    async def recover_from_failure(self):
        """Atualizar página e restaurar estado antes do retry"""
        print(f"Recuperando... atualizando página {self.current_page}")
        
        if self.tab:
            # Atualiza a página para recuperar de elementos obsoletos ou estado ruim
            await self.tab.refresh()
            await asyncio.sleep(2)  # Esperar a página carregar
            
            # Restaurar estado: navegar de volta para a página correta
            if self.current_page > 1:
                page_input = await self.tab.find(id='page-number')
                await page_input.insert_text(str(self.current_page))
                await self.tab.keyboard.press(Key.ENTER)
                await asyncio.sleep(1)
    
    @retry(
        max_retries=3,
        exceptions=[ElementNotFound, WaitElementTimeout],
        on_retry=recover_from_failure,
        delay=1.0
    )
    async def scrape_page_data(self):
        """Fazer scraping dos dados da página atual"""
        if not self.browser:
            self.browser = Chrome()
            self.tab = await self.browser.start()
            await self.tab.go_to('https://example.com/data')
        
        # Navegar para página específica
        page_input = await self.tab.find(id='page-number')
        await page_input.insert_text(str(self.current_page))
        await self.tab.keyboard.press(Key.ENTER)
        await asyncio.sleep(1)
        
        # Fazer scraping dos dados (pode falhar se elementos ficarem obsoletos)
        items = await self.tab.find(class_name='data-item', find_all=True)
        return [await item.text for item in items]
    
    async def scrape_multiple_pages(self, start_page: int, end_page: int):
        """Fazer scraping de múltiplas páginas com retry automático em falhas"""
        results = []
        for page_num in range(start_page, end_page + 1):
            self.current_page = page_num
            data = await self.scrape_page_data()
            results.extend(data)
        return results

# Uso
async def main():
    scraper = DataScraper()
    try:
        # Fazer scraping das páginas 1-10 com recuperação automática em falhas
        all_data = await scraper.scrape_multiple_pages(1, 10)
        print(f"Coletados {len(all_data)} itens")
    finally:
        if scraper.browser:
            await scraper.browser.stop()
```

**O que torna isso poderoso:**

- `recover_from_failure()` realmente **restaura o estado** atualizando e navegando de volta
- O método `scrape_page_data()` fica limpo, focado apenas na lógica de scraping
- Se elementos ficarem obsoletos ou desaparecerem, o mecanismo de retry lida com a recuperação automaticamente
- O navegador persiste entre as tentativas via `self.browser` e `self.tab`

### 2. Recuperação de Modal de Diálogo

Às vezes um modal ou overlay aparece inesperadamente e bloqueia sua automação. Feche-o e tente novamente.

```python
import asyncio
from pydoll.browser.chromium import Chrome
from pydoll.decorators import retry
from pydoll.exceptions import ElementNotFound

class ModalAwareScraper:
    def __init__(self):
        self.tab = None
    
    async def close_modals(self):
        """Fechar quaisquer modals bloqueadores antes do retry"""
        print("Verificando modals bloqueadores...")
        
        # Tentar encontrar e fechar modals comuns
        modal_close = await self.tab.find(
            class_name='modal-close',
            timeout=2,
            raise_exc=False
        )
        if modal_close:
            print("Modal encontrado, fechando...")
            await modal_close.click()
            await asyncio.sleep(0.5)
    
    @retry(
        max_retries=3,
        exceptions=[ElementNotFound],
        on_retry=close_modals,
        delay=0.5
    )
    async def click_button(self, button_id: str):
        button = await self.tab.find(id=button_id)
        await button.click()
```

### 3. Reinício de Navegador e Rotação de Proxy

Para trabalhos pesados de scraping, você pode precisar reiniciar completamente o navegador e trocar proxies após falhas.

```python
import asyncio
from pydoll.browser.chromium import Chrome
from pydoll.browser.options import ChromiumOptions
from pydoll.decorators import retry
from pydoll.exceptions import NetworkError, PageLoadTimeout

class RobustScraper:
    def __init__(self):
        self.browser = None
        self.tab = None
        self.proxy_list = [
            'proxy1.example.com:8080',
            'proxy2.example.com:8080',
            'proxy3.example.com:8080',
        ]
        self.current_proxy_index = 0
    
    async def restart_with_new_proxy(self):
        """Reiniciar navegador com um proxy diferente"""
        print("Reiniciando navegador com novo proxy...")
        
        # Fechar navegador atual
        if self.browser:
            await self.browser.stop()
            await asyncio.sleep(2)
        
        # Rotacionar para o próximo proxy
        self.current_proxy_index = (self.current_proxy_index + 1) % len(self.proxy_list)
        proxy = self.proxy_list[self.current_proxy_index]
        
        print(f"Usando proxy: {proxy}")
        
        # Iniciar novo navegador com novo proxy
        options = ChromiumOptions()
        options.add_argument(f'--proxy-server={proxy}')
        
        self.browser = Chrome(options=options)
        self.tab = await self.browser.start()
    
    @retry(
        max_retries=3,
        exceptions=[NetworkError, PageLoadTimeout],
        on_retry=restart_with_new_proxy,
        delay=5.0,
        exponential_backoff=True
    )
    async def scrape_protected_site(self, url: str):
        if not self.browser:
            await self.restart_with_new_proxy()
        
        await self.tab.go_to(url)
        await asyncio.sleep(3)
        
        # Sua lógica de scraping aqui
        content = await self.tab.find(id='content')
        return await content.text
```

### 4. Detecção de Ociosidade da Rede com Retry

Esperar que toda atividade de rede seja concluída, com lógica de retry se a página nunca estabilizar.

```python
import asyncio
from pydoll.browser.chromium import Chrome
from pydoll.decorators import retry
from pydoll.exceptions import TimeoutException

class NetworkAwareScraper:
    def __init__(self):
        self.tab = None
    
    async def reload_page(self):
        """Recarregar página se a rede nunca estabilizou"""
        print("Página não estabilizou, recarregando...")
        if self.tab:
            await self.tab.refresh()
            await asyncio.sleep(2)
    
    @retry(
        max_retries=2,
        exceptions=[TimeoutException],
        on_retry=reload_page,
        delay=3.0
    )
    async def wait_for_page_ready(self):
        """Esperar todas as requisições de rede completarem"""
        await self.tab.enable_network_events()
        
        # Esperar rede ociosa (sem requisições por 2 segundos)
        idle_time = 0
        max_wait = 10
        
        while idle_time < max_wait:
            # Verificar se há requisições em andamento
            # (Implementação depende do seu rastreamento de eventos)
            await asyncio.sleep(0.5)
            idle_time += 0.5
        
        if idle_time >= max_wait:
            raise TimeoutException("Rede nunca estabilizou")
```

### 5. Detecção e Recuperação de CAPTCHA

Detectar quando um CAPTCHA aparece e tomar a ação apropriada.

```python
import asyncio
from pydoll.browser.chromium import Chrome
from pydoll.decorators import retry
from pydoll.exceptions import ElementNotFound

class CaptchaScraper:
    def __init__(self):
        self.tab = None
        self.captcha_count = 0
    
    async def handle_captcha(self):
        """Lidar com CAPTCHA esperando ou mudando estratégia"""
        self.captcha_count += 1
        print(f"CAPTCHA detectado (contagem: {self.captcha_count})")
        
        if self.captcha_count > 2:
            print("Muitos CAPTCHAs, pode precisar mudar estratégia...")
            # Poderia mudar para uma abordagem diferente aqui
        
        # Esperar mais tempo entre tentativas
        await asyncio.sleep(30)
        
        # Atualizar a página
        await self.tab.refresh()
        await asyncio.sleep(5)
    
    @retry(
        max_retries=3,
        exceptions=[ElementNotFound],
        on_retry=handle_captcha,
        delay=10.0,
        exponential_backoff=True
    )
    async def scrape_protected_content(self, url: str):
        if not self.tab:
            browser = Chrome()
            self.tab = await browser.start()
        
        await self.tab.go_to(url)
        
        # Verificar CAPTCHA
        captcha = await self.tab.find(
            class_name='g-recaptcha',
            timeout=2,
            raise_exc=False
        )
        
        if captcha:
            raise ElementNotFound("CAPTCHA detectado")
        
        # Lógica de scraping normal
        content = await self.tab.find(class_name='article-content')
        return await content.text
```

## Padrões Avançados

### Combinando Múltiplas Estratégias de Recuperação

```python
import asyncio
from pydoll.browser.chromium import Chrome
from pydoll.decorators import retry
from pydoll.exceptions import ElementNotFound, WaitElementTimeout, NetworkError

class AdvancedScraper:
    def __init__(self):
        self.tab = None
        self.attempt = 0
        self.strategies = [
            self.strategy_refresh,
            self.strategy_clear_cache,
            self.strategy_restart_browser,
        ]
    
    async def strategy_refresh(self):
        """Estratégia 1: Atualização simples"""
        print("Estratégia 1: Atualizando página")
        await self.tab.refresh()
        await asyncio.sleep(2)
    
    async def strategy_clear_cache(self):
        """Estratégia 2: Limpar cache e atualizar"""
        print("Estratégia 2: Limpando cache")
        await self.tab.execute_command('Network.clearBrowserCache')
        await self.tab.refresh()
        await asyncio.sleep(3)
    
    async def strategy_restart_browser(self):
        """Estratégia 3: Reinício completo do navegador"""
        print("Estratégia 3: Reiniciando navegador")
        if self.tab:
            await self.tab._browser.stop()
        
        browser = Chrome()
        self.tab = await browser.start()
    
    async def adaptive_recovery(self):
        """Tentar diferentes estratégias de recuperação baseado no número da tentativa"""
        strategy_index = min(self.attempt, len(self.strategies) - 1)
        strategy = self.strategies[strategy_index]
        
        print(f"Tentativa {self.attempt + 1}: Usando {strategy.__name__}")
        await strategy()
        
        self.attempt += 1
    
    @retry(
        max_retries=3,
        exceptions=[ElementNotFound, WaitElementTimeout, NetworkError],
        on_retry=adaptive_recovery,
        delay=2.0
    )
    async def scrape_with_adaptive_retry(self, url: str):
        await self.tab.go_to(url)
        return await self.tab.find(id='target-content')
```

### Exceção Customizada para Falha Específica

```python
import asyncio
from pydoll.decorators import retry
from pydoll.exceptions import PydollException

class RateLimitError(PydollException):
    """Lançado quando limite de taxa é detectado"""
    message = "Limite de taxa da API excedido"

class APIScraper:
    """Fetch JSON from an API through the browser tab, retrying on HTTP 429."""

    def __init__(self, tab=None):
        # Tab whose `request` interface performs the HTTP calls; assign a
        # started tab before calling fetch_api_data().
        self.tab = tab

    async def wait_for_rate_limit_reset(self):
        """Pause for 60 seconds; registered below as the `on_retry` callback."""
        print("Limite de taxa detectado, esperando 60 segundos...")
        await asyncio.sleep(60)

    @retry(
        max_retries=5,
        exceptions=[RateLimitError],
        on_retry=wait_for_rate_limit_reset,
        delay=10.0,
        exponential_backoff=True
    )
    async def fetch_api_data(self, endpoint: str):
        """Request `endpoint` and return the decoded JSON body.

        Args:
            endpoint: URL passed to `self.tab.request.get`.

        Returns:
            Whatever `response.json()` returns for the response.

        Raises:
            RateLimitError: when the response status code is 429, which is
                the exception type the `@retry` decorator above is
                configured to retry on.
        """
        response = await self.tab.request.get(endpoint)

        # The response object exposes the HTTP status as `status_code`.
        if response.status_code == 429:  # Too Many Requests
            raise RateLimitError("Limite de taxa da API excedido")

        return response.json()
```

## Resumo de Melhores Práticas

1. **Sempre especifique exceções explicitamente** - Nunca use o padrão `exceptions=Exception`
2. **Use exponential backoff para serviços externos** - Dê tempo aos servidores para se recuperarem
3. **Mantenha contagens de retry razoáveis** - Geralmente 3-5 tentativas são suficientes
4. **Registre tentativas de retry** - Use `on_retry` para registrar o que está acontecendo
5. **Defina callbacks antes dos métodos decorados** - Ordem importa em definições de classe
6. **Faça callbacks async** - O decorator requer callbacks async
7. **Restaure estado nos callbacks** - Use `on_retry` para navegar de volta para onde você estava
8. **Considere o custo dos retries** - Cada retry consome tempo e recursos
9. **Combine com outros tratamentos de erro** - Retries não substituem blocos try/except
10. **Teste sua lógica de retry** - Certifique-se de que callbacks de recuperação realmente funcionam

## Saiba Mais

- **[Tratamento de Exceções](../core-concepts.md#error-handling)** - Entendendo exceções do Pydoll
- **[Eventos de Rede](../network/monitoring.md)** - Rastrear e lidar com falhas de rede
- **[Opções do Navegador](../configuration/browser-options.md)** - Configurar proxies e outras configurações
- **[Sistema de Eventos](event-system.md)** - Construir estratégias de retry reativas

O decorator retry é uma ferramenta poderosa que transforma scripts de scraping frágeis em aplicações prontas para produção. Ao combiná-lo com estratégias de recuperação bem pensadas, você pode construir scrapers que lidam graciosamente com o caos da web real.


================================================
FILE: docs/pt/features/advanced/event-system.md
================================================
# Sistema de Eventos

O sistema de eventos do Pydoll permite que você ouça e reaja às atividades do navegador em tempo real. Isso é essencial para construir automações dinâmicas, monitorar requisições de rede, detectar mudanças na página e criar fluxos de trabalho reativos.

!!! info "Análise Profunda Disponível"
    Este guia foca no uso prático. Para detalhes arquitetônicos e implementação interna, veja a [Análise Profunda da Arquitetura de Eventos](../../deep-dive/event-architecture.md).

## Pré-requisitos

Antes de trabalhar com eventos, você precisa habilitar o domínio CDP correspondente:

```python
from pydoll.browser.chromium import Chrome

async with Chrome() as browser:
    tab = await browser.start()
    
    # Habilite o domínio antes de ouvir os eventos
    await tab.enable_page_events()     # Para eventos de ciclo de vida da página
    await tab.enable_network_events()  # Para atividade de rede
    await tab.enable_dom_events()      # Para mudanças no DOM
```

!!! warning "Eventos Não Serão Disparados Sem Habilitar"
    Se você registrar um callback mas esquecer de habilitar o domínio, seu callback nunca será acionado. Sempre habilite o domínio primeiro!

## Escuta Básica de Eventos

O método `on()` registra ouvintes de eventos:

```python
from pydoll.protocol.page.events import PageEvent, LoadEventFiredEvent

async def handle_page_load(event: LoadEventFiredEvent):
    print(f"Página carregada em {event['params']['timestamp']}")

# Registrar o callback
await tab.enable_page_events()
callback_id = await tab.on(PageEvent.LOAD_EVENT_FIRED, handle_page_load)
```

### Estrutura do Evento

Todos os eventos seguem a mesma estrutura:

```python
{
    'method': 'Page.loadEventFired',  # Nome do evento
    'params': {                        # Dados específicos do evento
        'timestamp': 123456.789
    }
}
```

Acesse os dados do evento através de `event['params']`:

```python
from pydoll.protocol.network.events import RequestWillBeSentEvent

async def handle_request(event: RequestWillBeSentEvent):
    url = event['params']['request']['url']
    method = event['params']['request']['method']
    print(f"{method} {url}")
```

### Usando Dicas de Tipo (Type Hints) para Melhor Suporte da IDE

Use dicas de tipo com os tipos de parâmetros de evento para obter autocompletar para as chaves do evento:

```python
from pydoll.protocol.network.events import NetworkEvent, RequestWillBeSentEvent
from pydoll.protocol.page.events import PageEvent, LoadEventFiredEvent

# Com dicas de tipo - a IDE conhece todas as chaves disponíveis!
async def handle_request(event: RequestWillBeSentEvent):
    # A IDE irá autocompletar 'params', 'request', 'url', etc.
    url = event['params']['request']['url']
    method = event['params']['request']['method']
    timestamp = event['params']['timestamp']
    print(f"{method} {url} em {timestamp}")

async def handle_load(event: LoadEventFiredEvent):
    # A IDE sabe que este evento tem 'timestamp' em params
    timestamp = event['params']['timestamp']
    print(f"Página carregada em {timestamp}")

await tab.enable_network_events()
await tab.on(NetworkEvent.REQUEST_WILL_BE_SENT, handle_request)

await tab.enable_page_events()
await tab.on(PageEvent.LOAD_EVENT_FIRED, handle_load)
```

!!! tip "Dicas de Tipo para Parâmetros de Evento"
    Todos os tipos de evento são definidos em `pydoll.protocol.<domain>.events`. Usá-los oferece a você:
    
    - **Autocompletar**: A IDE sugere chaves disponíveis em `event['params']`
    - **Segurança de tipo**: Pega erros de digitação antes de rodar o código
    - **Documentação**: Veja quais dados cada evento fornece
    
    Os tipos de evento seguem o padrão: `<EventName>Event` (ex: `RequestWillBeSentEvent`, `ResponseReceivedEvent`)

## Domínios de Eventos Comuns

### Eventos de Página (Page)

Monitore o ciclo de vida da página e diálogos:

```python
from pydoll.protocol.page.events import PageEvent, JavascriptDialogOpeningEvent

await tab.enable_page_events()

# Página carregada
await tab.on(PageEvent.LOAD_EVENT_FIRED, lambda e: print("Página carregada!"))

# DOM pronto
await tab.on(PageEvent.DOM_CONTENT_EVENT_FIRED, lambda e: print("DOM pronto!"))

# Diálogo JavaScript
async def handle_dialog(event: JavascriptDialogOpeningEvent):
    message = event['params']['message']
    dialog_type = event['params']['type']
    print(f"Diálogo ({dialog_type}): {message}")
    
    # Lidar com isso automaticamente
    if await tab.has_dialog():
        await tab.handle_dialog(accept=True)

await tab.on(PageEvent.JAVASCRIPT_DIALOG_OPENING, handle_dialog)
```

### Eventos de Rede (Network)

Monitore requisições e respostas:

```python
from pydoll.protocol.network.events import (
    NetworkEvent,
    RequestWillBeSentEvent,
    ResponseReceivedEvent,
    LoadingFailedEvent
)

await tab.enable_network_events()

# Rastrear requisições
async def log_request(event: RequestWillBeSentEvent):
    request = event['params']['request']
    print(f"→ {request['method']} {request['url']}")

await tab.on(NetworkEvent.REQUEST_WILL_BE_SENT, log_request)

# Rastrear respostas
async def log_response(event: ResponseReceivedEvent):
    response = event['params']['response']
    print(f"← {response['status']} {response['url']}")

await tab.on(NetworkEvent.RESPONSE_RECEIVED, log_response)

# Rastrear falhas
async def log_failure(event: LoadingFailedEvent):
    """Print the resource type and error text of a failed request.

    The loading-failed event does not carry the request URL:
    `params['type']` is the resource type (e.g. Document, Script, XHR).
    To report the URL, correlate `params['requestId']` with the URL seen
    in the matching request event.
    """
    resource_type = event['params']['type']
    error = event['params']['errorText']
    print(f"[FALHOU] {resource_type} - {error}")

await tab.on(NetworkEvent.LOADING_FAILED, log_failure)
```

### Eventos DOM

Reaja a mudanças no DOM:

```python
from pydoll.protocol.dom.events import DomEvent, AttributeModifiedEvent

await tab.enable_dom_events()

# Rastrear mudanças de atributo
async def on_attribute_change(event: AttributeModifiedEvent):
    node_id = event['params']['nodeId']
    attr_name = event['params']['name']
    attr_value = event['params']['value']
    print(f"Nó {node_id}: {attr_name}={attr_value}")

await tab.on(DomEvent.ATTRIBUTE_MODIFIED, on_attribute_change)

# Rastrear atualizações do documento
await tab.on(DomEvent.DOCUMENT_UPDATED, lambda e: print("Documento atualizado!"))
```

## Callbacks Temporários

Use `temporary=True` para ouvintes de uma única vez:

```python
from pydoll.protocol.page.events import PageEvent

# Isso disparará apenas uma vez e depois se auto-removerá
await tab.on(
    PageEvent.LOAD_EVENT_FIRED,
    lambda e: print("Primeiro carregamento!"),
    temporary=True
)

await tab.go_to("https://example.com")  # Dispara o callback
await tab.refresh()                      # Callback não disparará novamente
```

!!! tip "Perfeito para Configuração Única"
    Callbacks temporários são ideais para tarefas de inicialização que devem acontecer apenas uma vez.

## Acessando a Aba (Tab) nos Callbacks

Use `functools.partial` para passar a aba para seus callbacks:

```python
from functools import partial
from pydoll.protocol.network.events import NetworkEvent, ResponseReceivedEvent

async def process_response(tab, event: ResponseReceivedEvent):
    # Agora podemos usar o objeto tab!
    request_id = event['params']['requestId']
    
    # Obter corpo da resposta
    body = await tab.get_network_response_body(request_id)
    print(f"Corpo da resposta: {body[:100]}...")

await tab.enable_network_events()
await tab.on(
    NetworkEvent.RESPONSE_RECEIVED,
    partial(process_response, tab)
)
```

!!! info "Por que Usar Partial?"
    O sistema de eventos passa apenas os dados do evento para os callbacks. `partial` permite que você vincule parâmetros adicionais, como a instância da aba.

## Gerenciando Callbacks

### Removendo Callbacks

```python
from pydoll.protocol.page.events import PageEvent

# Salvar o ID do callback
callback_id = await tab.on(PageEvent.LOAD_EVENT_FIRED, my_callback)

# Removê-lo mais tarde
await tab.remove_callback(callback_id)
```

### Limpando Todos os Callbacks

```python
# Remover todos os callbacks registrados para esta aba
await tab.clear_callbacks()
```

## Exemplos Práticos

### Monitorar Chamadas de API

```python
import asyncio
from functools import partial
from pydoll.protocol.network.events import NetworkEvent, ResponseReceivedEvent

async def monitor_api_calls(tab):
    collected_data = []
    
    # Dica de tipo ajuda a IDE a autocompletar chaves de evento
    async def capture_api_response(tab, data_list, event: ResponseReceivedEvent):
        url = event['params']['response']['url']
        
        # Filtrar apenas chamadas de API
        if '/api/' not in url:
            return
        
        request_id = event['params']['requestId']
        body = await tab.get_network_response_body(request_id)
        
        data_list.append({
            'url': url,
            'body': body,
            'status': event['params']['response']['status']
        })
        print(f"Capturada chamada de API: {url}")
    
    await tab.enable_network_events()
    await tab.on(
        NetworkEvent.RESPONSE_RECEIVED,
        partial(capture_api_response, tab, collected_data)
    )
    
    # Navegar e coletar
    await tab.go_to("https://example.com")
    await asyncio.sleep(3)  # Esperar requisições completarem
    
    return collected_data
```

### Esperar por Evento Específico

```python
import asyncio
from pydoll.protocol.page.events import PageEvent, FrameNavigatedEvent

async def wait_for_navigation():
    navigation_done = asyncio.Event()
    
    async def on_navigated(event: FrameNavigatedEvent):
        navigation_done.set()
    
    await tab.enable_page_events()
    await tab.on(PageEvent.FRAME_NAVIGATED, on_navigated, temporary=True)
    
    # Disparar navegação
    button = await tab.find(id='next-page')
    await button.click()
    
    # Esperar completar
    await navigation_done.wait()
    print("Navegação concluída!")
```

### Detecção de Ociosidade da Rede (Network Idle)

```python
import asyncio
from pydoll.protocol.network.events import (
    NetworkEvent,
    RequestWillBeSentEvent,
    LoadingFinishedEvent,
    LoadingFailedEvent
)

async def wait_for_network_idle(tab, timeout=5):
    """Wait until every tracked request has finished, or `timeout` elapses.

    Requests are tracked by `requestId` from the moment the listeners are
    attached. The function prints the outcome and always removes its
    callbacks before returning.

    Args:
        tab: Tab to observe; network events are enabled on it.
        timeout: Maximum number of seconds to wait for the idle signal.
    """
    pending = set()
    idle_event = asyncio.Event()

    async def on_request(event: RequestWillBeSentEvent):
        # Track by id rather than by counter: a redirect re-emits this event
        # with the same requestId, which would otherwise be counted twice
        # while only one finish event ever arrives.
        pending.add(event['params']['requestId'])

    async def on_finished(event: LoadingFinishedEvent | LoadingFailedEvent):
        request_id = event['params']['requestId']
        if request_id not in pending:
            # Request started before the listeners were attached; ignoring
            # it keeps the bookkeeping from drifting below zero.
            return

        pending.discard(request_id)
        if not pending:
            idle_event.set()

    await tab.enable_network_events()
    req_id = await tab.on(NetworkEvent.REQUEST_WILL_BE_SENT, on_request)
    fin_id = await tab.on(NetworkEvent.LOADING_FINISHED, on_finished)
    fail_id = await tab.on(NetworkEvent.LOADING_FAILED, on_finished)

    try:
        await asyncio.wait_for(idle_event.wait(), timeout=timeout)
        print("Rede está ociosa!")
    except asyncio.TimeoutError:
        print(f"Rede ainda ativa após {timeout}s")
    finally:
        # Cleanup: detach all three listeners even on timeout/cancellation.
        await tab.remove_callback(req_id)
        await tab.remove_callback(fin_id)
        await tab.remove_callback(fail_id)
```

### Raspagem de Conteúdo Dinâmico

```python
import asyncio
import json
from functools import partial
from pydoll.protocol.network.events import NetworkEvent, ResponseReceivedEvent

async def scrape_infinite_scroll(tab, max_items=100, max_idle_scrolls=5):
    """Collect items from '/products' responses while scrolling the page.

    Args:
        tab: Tab used for navigation, scrolling and response bodies.
        max_items: Upper bound on the number of items returned.
        max_idle_scrolls: Number of consecutive scrolls that yield no new
            items after which scrolling stops. Without this bound the loop
            would never end on a site holding fewer than `max_items` items.

    Returns:
        A list with at most `max_items` collected items.
    """
    items = []

    async def capture_products(tab, items_list, event: ResponseReceivedEvent):
        url = event['params']['response']['url']

        # Only responses from the products endpoint are of interest.
        if '/products' not in url:
            return

        request_id = event['params']['requestId']
        body = await tab.get_network_response_body(request_id)

        try:
            data = json.loads(body)
        except json.JSONDecodeError:
            # Matching URL served a non-JSON payload; nothing to collect.
            return

        # Guard against JSON arrays/scalars, where data['items'] would raise.
        if isinstance(data, dict) and 'items' in data:
            items_list.extend(data['items'])
            print(f"Coletados {len(data['items'])} itens (total: {len(items_list)})")

    await tab.enable_network_events()
    callback_id = await tab.on(
        NetworkEvent.RESPONSE_RECEIVED,
        partial(capture_products, tab, items)
    )

    try:
        await tab.go_to("https://example.com/products")

        # Scroll to trigger infinite loading until enough items arrive or
        # the page stops producing new ones.
        idle_scrolls = 0
        while len(items) < max_items and idle_scrolls < max_idle_scrolls:
            count_before = len(items)
            await tab.execute_script("window.scrollTo(0, document.body.scrollHeight)")
            await asyncio.sleep(1)
            idle_scrolls = 0 if len(items) > count_before else idle_scrolls + 1
    finally:
        # Detach the listener so it does not keep firing after we return.
        await tab.remove_callback(callback_id)

    return items[:max_items]
```

## Tabelas de Referência de Eventos

### Domínios Disponíveis

| Domínio | Método de Habilitação | Casos de Uso Comuns |
|---|---|---|
| Page | `enable_page_events()` | Ciclo de vida da página, navegação, diálogos |
| Network | `enable_network_events()` | Monitoramento de requisição/resposta, rastreamento de API |
| DOM | `enable_dom_events()` | Mudanças na estrutura DOM, modificações de atributos |
| Fetch | `enable_fetch_events()` | Interceptação e modificação de requisições |
| Runtime | `enable_runtime_events()` | Mensagens do console, exceções JavaScript |

### Eventos Chave de Página (Page)

| Evento | Quando Dispara | Caso de Uso |
|---|---|---|
| `LOAD_EVENT_FIRED` | Carregamento da página completo | Esperar pelo carregamento completo da página |
| `DOM_CONTENT_EVENT_FIRED` | DOM pronto | Iniciar manipulação do DOM |
| `JAVASCRIPT_DIALOG_OPENING` | Alert/confirm/prompt | Lidar automaticamente com diálogos |
| `FRAME_NAVIGATED` | Navegação completa | Rastrear navegação de SPA |
| `FILE_CHOOSER_OPENED` | Input de arquivo clicado | Uploads automáticos de arquivos |

### Eventos Chave de Rede (Network)

| Evento | Quando Dispara | Caso de Uso |
|---|---|---|
| `REQUEST_WILL_BE_SENT` | Antes da requisição ser enviada | Registrar/modificar requisições de saída |
| `RESPONSE_RECEIVED` | Cabeçalhos da resposta recebidos | Capturar respostas de API |
| `LOADING_FINISHED` | Corpo da resposta carregado | Obter dados completos da resposta |
| `LOADING_FAILED` | Requisição falhou | Rastrear erros e retentativas |
| `WEB_SOCKET_CREATED` | WebSocket aberto | Monitorar conexões em tempo real |

### Eventos Chave do DOM

| Evento | Quando Dispara | Caso de Uso |
|---|---|---|
| `DOCUMENT_UPDATED` | DOM reconstruído | Atualizar referências de elementos |
| `ATTRIBUTE_MODIFIED` | Atributo do elemento mudou | Rastrear mudanças dinâmicas de atributos |
| `CHILD_NODE_INSERTED` | Novo elemento adicionado | Detectar conteúdo adicionado dinamicamente |
| `CHILD_NODE_REMOVED` | Elemento removido | Detectar conteúdo removido |

### Referência de Tipo de Evento

Todos os tipos de evento e suas estruturas de parâmetros são definidos nos módulos de protocolo:

| Domínio | Caminho de Importação | Tipos de Exemplo |
|---|---|---|
| Page | `pydoll.protocol.page.events` | `LoadEventFiredEvent`, `FrameNavigatedEvent`, `JavascriptDialogOpeningEvent` |
| Network | `pydoll.protocol.network.events` | `RequestWillBeSentEvent`, `ResponseReceivedEvent`, `LoadingFinishedEvent` |
| DOM | `pydoll.protocol.dom.events` | `DocumentUpdatedEvent`, `AttributeModifiedEvent`, `ChildNodeInsertedEvent` |
| Fetch | `pydoll.protocol.fetch.events` | `RequestPausedEvent`, `AuthRequiredEvent` |
| Runtime | `pydoll.protocol.runtime.events` | `ConsoleAPICalledEvent`, `ExceptionThrownEvent` |

Cada tipo de evento é um `TypedDict` que define a estrutura exata do evento, incluindo todas as chaves disponíveis no dicionário `params`.

## Melhores Práticas

### 1. Sempre Habilite os Domínios Primeiro

```python
from pydoll.protocol.network.events import NetworkEvent

# Bom
await tab.enable_network_events()
await tab.on(NetworkEvent.RESPONSE_RECEIVED, callback)

# Ruim: callback nunca será disparado
await tab.on(NetworkEvent.RESPONSE_RECEIVED, callback)
await tab.enable_network_events()
```

### 2. Limpe Quando Terminar

```python
from pydoll.protocol.network.events import NetworkEvent

# Habilitar para tarefa específica
await tab.enable_network_events()
callback_id = await tab.on(NetworkEvent.REQUEST_WILL_BE_SENT, log_request)

# Faça seu trabalho...
await tab.go_to("https://example.com")

# Limpar
await tab.remove_callback(callback_id)
await tab.disable_network_events()
```

### 3. Use Filtragem Precoce

```python
from pydoll.protocol.network.events import RequestWillBeSentEvent

# Bom: filtrar cedo
async def handle_api_request(event: RequestWillBeSentEvent):
    url = event['params']['request']['url']
    if '/api/' not in url:
        return  # Sair cedo
    
    # Processar apenas requisições de API
    process_request(event)

# Ruim: processa tudo
async def handle_all_requests(event: RequestWillBeSentEvent):
    url = event['params']['request']['url']
    process_request(event)
    if '/api/' in url:
        do_extra_work(event)
```

### 4. Lide com Erros Graciosamente

```python
from pydoll.protocol.network.events import ResponseReceivedEvent

async def safe_callback(event: ResponseReceivedEvent):
    try:
        request_id = event['params']['requestId']
        body = await tab.get_network_response_body(request_id)
        process_body(body)
    except KeyError:
        # Evento pode não ter requestId
        pass
    except Exception as e:
        print(f"Erro no callback: {e}")
        # Continuar sem quebrar o loop de eventos
```

## Considerações de Desempenho

!!! warning "Eventos de Alta Frequência"
    Eventos DOM podem disparar **muito frequentemente** em páginas dinâmicas. Use filtragem e debouncing para evitar problemas de desempenho.

### Volume de Eventos por Domínio

| Domínio | Frequência de Eventos | Impacto no Desempenho |
|---|---|---|
| Page | Baixa | Mínimo |
| Network | Moderada-Alta | Moderado |
| DOM | Muito Alta | Alto |
| Fetch | Moderada | Moderado |

### Dicas de Otimização

1.  **Habilite apenas o que você precisa**: Não habilite todos os domínios de uma vez
2.  **Use callbacks temporários**: Limpeza automática quando possível
3.  **Filtre cedo**: Verifique condições antes de operações caras
4.  **Desabilite quando terminar**: Libere recursos
5.  **Evite processamento pesado**: Mantenha callbacks rápidos, descarregue o trabalho para tarefas separadas

```python
import asyncio
from pydoll.protocol.network.events import ResponseReceivedEvent

# Bom: callback rápido, descarrega trabalho pesado
async def handle_response(event: ResponseReceivedEvent):
    if should_process(event):
        asyncio.create_task(heavy_processing(event))  # Não bloqueie

# Ruim: bloqueia o loop de eventos
async def handle_response(event: ResponseReceivedEvent):
    await heavy_processing(event)  # Bloqueia outros eventos
```

## Padrões Comuns

### Gerenciador de Contexto para Eventos

```python
from contextlib import asynccontextmanager
from pydoll.protocol.network.events import NetworkEvent, RequestWillBeSentEvent

@asynccontextmanager
async def monitor_requests(tab):
    """Gerenciador de contexto para monitorar requisições durante um bloco."""
    requests = []
    
    async def capture(event: RequestWillBeSentEvent):
        requests.append(event['params']['request'])
    
    await tab.enable_network_events()
    cb_id = await tab.on(NetworkEvent.REQUEST_WILL_BE_SENT, capture)
    
    try:
        yield requests
    finally:
        await tab.remove_callback(cb_id)
        await tab.disable_network_events()

# Uso
async with monitor_requests(tab) as requests:
    await tab.go_to("https://example.com")
    # Todas as requisições são capturadas

print(f"Capturadas {len(requests)} requisições")
```

### Registro Condicional de Eventos

```python
from pydoll.protocol.network.events import NetworkEvent
from pydoll.protocol.dom.events import DomEvent

async def setup_monitoring(tab, track_network=False, track_dom=False):
    """Habilitar apenas o monitoramento especificado."""
    callbacks = []
    
    if track_network:
        await tab.enable_network_events()
        cb = await tab.on(NetworkEvent.REQUEST_WILL_BE_SENT, log_request)
        callbacks.append(('network', cb))
    
    if track_dom:
        await tab.enable_dom_events()
        cb = await tab.on(DomEvent.ATTRIBUTE_MODIFIED, log_dom_change)
        callbacks.append(('dom', cb))
    
    return callbacks
```

## Leitura Adicional

- **[Análise Profunda da Arquitetura de Eventos](../../deep-dive/event-architecture.md)** - Implementação interna e comunicação WebSocket
- **[Monitoramento de Rede](../network/monitoring.md)** - Técnicas avançadas de análise de rede
- **[Automação Reativa](reactive-automation.md)** - Construindo fluxos de trabalho orientados a eventos

!!! tip "Comece Simples"
    Comece com eventos de Página (Page) para entender o básico, depois passe para eventos de Rede (Network) e DOM conforme necessário. O sistema de eventos é poderoso, mas pode ser intimidador no início.

================================================
FILE: docs/pt/features/advanced/remote-connections.md
================================================
# Conexões Remotas e Automação Híbrida

O Pydoll permite que você se conecte a navegadores já em execução via WebSocket, habilitando cenários de controle remoto e automação híbrida. Isso é perfeito para pipelines de CI/CD, ambientes contêinerizados, sessões de depuração e integração do Pydoll com ferramentas CDP existentes.

!!! info "Nenhuma Configuração Necessária"
    Diferente da automação tradicional que inicia navegadores, conexões remotas permitem controlar navegadores que já estão rodando. Nenhum gerenciamento de processo é necessário!

## Por que Conexões Remotas?

Conexões remotas desbloqueiam cenários poderosos de automação:

| Caso de Uso | Benefício |
|---|---|
| **Pipelines de CI/CD** | Conecte-se a contêineres de navegador sem gerenciar processos |
| **Ambientes Docker** | Controle navegadores rodando em contêineres separados |
| **Depuração Remota** | Automatize navegadores em servidores remotos ou VMs |
| **Ferramental Híbrido** | Integre o Pydoll com sua infraestrutura CDP existente |
| **Desenvolvimento** | Anexe ao seu navegador local para testes rápidos |
| **Automação Multi-Ferramenta** | Compartilhe sessões de navegador entre diferentes ferramentas |

## Configurando um Servidor de Navegador Remoto

!!! tip "Já Tem um Serviço de Navegador Remoto?"
    Se você está usando um serviço de navegador na nuvem (BrowserStack, Selenium Grid, LambdaTest, etc.) ou já tem uma instância do Chrome rodando com uma URL WebSocket, você pode **pular esta seção inteira** e ir direto para [Métodos de Conexão](#métodos-de-conexão) para aprender como se conectar com o Pydoll.

Antes de poder se conectar remotamente, você precisa iniciar o Chrome com a depuração habilitada e configurado corretamente para aceitar conexões externas.

### Configuração Básica do Servidor (Linux)

Inicie o Chrome com depuração remota em um servidor:

```bash
# Configuração básica - acessível apenas do localhost
google-chrome \
  --remote-debugging-port=9222 \
  --headless=new \
  --no-sandbox \
  --disable-dev-shm-usage \
  --user-data-dir=/tmp/chrome-profile

# Configuração do servidor - acessível de outras máquinas
google-chrome \
  --remote-debugging-port=9222 \
  --remote-debugging-address=0.0.0.0 \
  --headless=new \
  --no-sandbox \
  --disable-dev-shm-usage \
  --user-data-dir=/tmp/chrome-profile
```

!!! warning "Aviso Crítico de Segurança"
    Usar `--remote-debugging-address=0.0.0.0` torna a porta de depuração acessível de **qualquer interface de rede**. Isso é necessário para conexões remotas, mas cria um risco de segurança significativo se exposto à internet.

### Configuração Recomendada do Servidor

```bash
# Configuração pronta para produção
google-chrome \
  --remote-debugging-port=9222 \
  --remote-debugging-address=0.0.0.0 \
  --headless=new \
  --no-sandbox \
  --disable-dev-shm-usage \
  --disable-gpu \
  --disable-software-rasterizer \
  --disable-extensions \
  --disable-background-networking \
  --disable-background-timer-throttling \
  --disable-client-side-phishing-detection \
  --disable-popup-blocking \
  --disable-prompt-on-repost \
  --disable-sync \
  --metrics-recording-only \
  --no-first-run \
  --safebrowsing-disable-auto-update \
  --user-data-dir=/tmp/chrome-remote-$(date +%s)
```

**Flags chave explicadas:**

| Flag | Propósito |
|---|---|
| `--remote-debugging-port=9222` | Habilita o CDP na porta 9222 |
| `--remote-debugging-address=0.0.0.0` | Permite conexões externas (risco de segurança!) |
| `--headless=new` | Executa sem GUI (modo servidor) |
| `--no-sandbox` | Necessário em Docker/contêineres (trade-off de segurança) |
| `--disable-dev-shm-usage` | Previne problemas de memória /dev/shm em contêineres |
| `--disable-gpu` | Sem aceleração por GPU (recomendado para headless) |
| `--user-data-dir=/tmp/...` | Perfil isolado por instância |

!!! warning "Sobre a Flag --no-sandbox"
    A flag `--no-sandbox` desabilita o sandbox de segurança do Chrome, que isola o processo do navegador do sistema. Esta flag é **necessária** na maioria dos ambientes Docker/contêineres devido a restrições de capacidade do kernel, mas traz implicações de segurança:
    
    - **Risco**: Remove o isolamento entre o navegador e o sistema
    - **Quando usar**: Contêineres Docker, ambientes restritos
    - **Mitigação**: Garanta isolamento em nível de contêiner (namespaces, cgroups) e evite rodar como root
    
    Considere usar `--no-sandbox` apenas quando absolutamente necessário e implemente camadas adicionais de segurança no nível do contêiner.

### Configuração do Docker

Crie um servidor Chrome contêinerizado:

!!! tip "Usando Imagens Prontas"
    Para produção, considere usar imagens oficiais pré-construídas em vez de construir a sua própria:
    
    - **Imagens Selenium**: `selenium/standalone-chrome` (inclui WebDriver)
    - **Zenika Alpine Chrome**: `zenika/alpine-chrome` (leve, ~200MB)
    - **Browserless**: `browserless/chrome` (pronto para produção com monitoramento)
    
    Essas imagens são atualizadas regularmente, testadas em segurança e otimizadas para ambientes de contêiner.

**Dockerfile (Build Personalizado):**
```dockerfile
FROM ubuntu:22.04

# Instalar Chrome
RUN apt-get update && apt-get install -y \
    wget \
    gnupg \
    ca-certificates \
    && wget -q -O - https://dl.google.com/linux/linux_signing_key.pub | apt-key add - \
    && echo "deb [arch=amd64] http://dl.google.com/linux/chrome/deb/ stable main" >> /etc/apt/sources.list.d/google.list \
    && apt-get update \
    && apt-get install -y google-chrome-stable \
    && rm -rf /var/lib/apt/lists/*

# Expor porta de depuração
EXPOSE 9222

# Iniciar Chrome com depuração remota
CMD ["google-chrome", \
     "--remote-debugging-port=9222", \
     "--remote-debugging-address=0.0.0.0", \
     "--headless=new", \
     "--no-sandbox", \
     "--disable-dev-shm-usage", \
     "--disable-gpu", \
     "--user-data-dir=/tmp/chrome-profile"]
```

**docker-compose.yml:**
```yaml
services:
  chrome-server:
    build: .
    ports:
      - "127.0.0.1:9222:9222"
    
    # Descomente a linha abaixo SOMENTE se precisar de acesso remoto
    # E tiver protegido a porta com firewall ou proxy.
    # - "9222:9222"

    shm_size: '2gb'  # Crítico: Chrome usa /dev/shm para memória compartilhada
                      # O shm_size padrão do Docker (64MB) é insuficiente
    restart: unless-stopped
    environment:
      - DISPLAY=:99
    networks:
      - automation-network
    # Opcional: Limites de recursos para produção
    # deploy:
    #   resources:
    #     limits:
    #       cpus: '2'
    #       memory: 4G

  automation-client:
    image: python:3.11
    depends_on:
      - chrome-server
    volumes:
      - ./:/app
    working_dir: /app
    command: python automation_script.py
    environment:
      - CHROME_WS=ws://chrome-server:9222/devtools/browser
    networks:
      - automation-network

networks:
  automation-network:
    driver: bridge
```

**Uso:**
```bash
# Iniciar a stack
docker-compose up -d

# Verificar se o Chrome está rodando
curl http://localhost:9222/json/version

# Conectar do cliente de automação (dentro da rede Docker)
# ws://chrome-server:9222/devtools/browser/...
```

### Serviço Systemd (Servidor Linux)

Crie um serviço Chrome persistente:

**/etc/systemd/system/chrome-remote.service:**
```ini
[Unit]
Description=Chrome Remote Debugging Server
After=network.target

[Service]
Type=simple
User=chrome-user
Group=chrome-user
Environment="DISPLAY=:99"
ExecStart=/usr/bin/google-chrome \
    --remote-debugging-port=9222 \
    --remote-debugging-address=0.0.0.0 \
    --headless=new \
    --no-sandbox \
    --disable-dev-shm-usage \
    --disable-gpu \
    --user-data-dir=/var/lib/chrome-remote
Restart=always
RestartSec=10

[Install]
WantedBy=multi-user.target
```

**Configuração e gerenciamento:**
```bash
# Criar usuário dedicado
sudo useradd -r -s /bin/false chrome-user
sudo mkdir -p /var/lib/chrome-remote
sudo chown chrome-user:chrome-user /var/lib/chrome-remote

# Instalar e habilitar serviço
sudo systemctl daemon-reload
sudo systemctl enable chrome-remote
sudo systemctl start chrome-remote

# Verificar status
sudo systemctl status chrome-remote

# Ver logs
sudo journalctl -u chrome-remote -f

# Reiniciar serviço
sudo systemctl restart chrome-remote
```

### Configuração de Segurança de Rede

#### Regras de Firewall (iptables)

```bash
# Permitir que apenas IPs específicos acessem a porta 9222
sudo iptables -A INPUT -p tcp --dport 9222 -s 192.168.1.100 -j ACCEPT
sudo iptables -A INPUT -p tcp --dport 9222 -j DROP

# Salvar regras
sudo iptables-save > /etc/iptables/rules.v4
```

#### Regras de Firewall (ufw)

```bash
# Negar todo o acesso à porta 9222 por padrão
sudo ufw deny 9222

# Permitir IP específico
sudo ufw allow from 192.168.1.100 to any port 9222

# Permitir sub-rede específica
sudo ufw allow from 192.168.1.0/24 to any port 9222

# Habilitar firewall
sudo ufw enable
```

#### Proxy Reverso Nginx (com Autenticação)

Proteja a depuração do Chrome com autenticação HTTP:

**/etc/nginx/sites-available/chrome-remote:**
```nginx
server {
    listen 80;
    server_name chrome.example.com;

    # Autenticação básica
    auth_basic "Chrome Remote Debugging";
    auth_basic_user_file /etc/nginx/.htpasswd;

    location / {
        proxy_pass http://localhost:9222;
        proxy_http_version 1.1;
        proxy_set_header Upgrade $http_upgrade;
        proxy_set_header Connection "upgrade";
        proxy_set_header Host $host;
        proxy_set_header X-Real-IP $remote_addr;
        proxy_set_header X-Forwarded-For $proxy_add_x_forwarded_for;
        proxy_read_timeout 86400;
    }
}
```

**Configuração:**
```bash
# Criar arquivo de senha
sudo htpasswd -c /etc/nginx/.htpasswd admin

# Habilitar site
sudo ln -s /etc/nginx/sites-available/chrome-remote /etc/nginx/sites-enabled/
sudo nginx -t
sudo systemctl reload nginx

# Conectar com autenticação
# ws://admin:password@chrome.example.com/devtools/browser/...
```

### Conectando de Outro Computador

Uma vez que seu servidor esteja configurado, conecte-se da sua máquina cliente:

```python
import asyncio
import aiohttp
from pydoll.browser.chromium import Chrome

async def connect_to_remote_server():
    """Conectar ao Chrome rodando em um servidor remoto."""
    # IP e porta do servidor
    server_ip = "192.168.1.100"
    server_port = 9222

    async with aiohttp.ClientSession() as session:
        # 1. Consultar o servidor para obter a URL do WebSocket
        url = f"http://{server_ip}:{server_port}/json/version"
        
        async with session.get(url) as response:
            data = await response.json()
            ws_url = data['webSocketDebuggerUrl']
            
            print(f"Informações do servidor:")
            print(f"  Navegador: {data.get('Browser')}")
            print(f"  Protocolo: {data.get('Protocol-Version')}")
            print(f"  WebSocket: {ws_url}")
    
    # 2. Conectar ao navegador
    chrome = Chrome()
    tab = await chrome.connect(ws_url)
    
    print(f"\n[SUCESSO] Conectado ao servidor Chrome remoto!")
    
    # 3. Usar normalmente
    await tab.go_to('https://example.com')
    title = await tab.execute_script('return document.title')
    print(f"Título da página: {title}")
    
    # 4. Limpeza
    await chrome.close()

asyncio.run(connect_to_remote_server())
```

### Testando a Configuração do Seu Servidor

```bash
# 1. Verificar se o Chrome está rodando
ps aux | grep chrome

# 2. Verificar se a porta está escutando
netstat -tulpn | grep 9222
# Ou
ss -tulpn | grep 9222

# 3. Testar acesso local
curl http://localhost:9222/json/version

# 4. Testar acesso remoto (da máquina cliente)
curl http://SERVER_IP:9222/json/version

# 5. Verificar URL do WebSocket
curl http://SERVER_IP:9222/json/version | jq -r '.webSocketDebuggerUrl'

# 6. Listar todos os alvos disponíveis (abas/páginas)
curl http://SERVER_IP:9222/json/list
```

### Configuração de Múltiplas Instâncias

Execute múltiplas instâncias do Chrome em portas diferentes:

```bash
#!/bin/bash
# start-chrome-pool.sh

for port in 9222 9223 9224 9225; do
    google-chrome \
        --remote-debugging-port=$port \
        --remote-debugging-address=0.0.0.0 \
        --headless=new \
        --no-sandbox \
        --disable-dev-shm-usage \
        --user-data-dir=/tmp/chrome-$port &
    
    echo "Iniciado Chrome na porta $port"
done

echo "Pool de Chrome pronto. Portas: 9222-9225"
```

**Cliente Python com pool:**
```python
import asyncio
from pydoll.browser.chromium import Chrome
import aiohttp

async def connect_to_pool(server_ip: str, ports: list[int]):
    """Conectar a múltiplas instâncias do Chrome."""
    tasks = []
    
    for port in ports:
        task = connect_to_instance(server_ip, port)
        tasks.append(task)
    
    results = await asyncio.gather(*tasks)
    return results

async def connect_to_instance(server_ip: str, port: int):
    """Conectar a uma única instância do Chrome."""
    # Obter URL do WebSocket
    async with aiohttp.ClientSession() as session:
        url = f"http://{server_ip}:{port}/json/version"
        async with session.get(url) as response:
            data = await response.json()
            ws_url = data['webSocketDebuggerUrl']
    
    # Conectar
    chrome = Chrome()
    tab = await chrome.connect(ws_url)
    
    # Rodar automação
    await tab.go_to('https://example.com')
    title = await tab.execute_script('return document.title')
    
    print(f"Porta {port}: {title}")
    
    await chrome.close()
    return title

# Uso
asyncio.run(connect_to_pool('192.168.1.100', [9222, 9223, 9224, 9225]))
```

## Métodos de Conexão

O Pydoll oferece duas abordagens para conexões remotas, cada uma adequada para cenários diferentes.

### Método 1: Conexão no Nível do Navegador

Conecte-se a um navegador em execução usando seu endpoint WebSocket e tenha acesso a todas as abas abertas:

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def connect_to_remote_browser():
    chrome = Chrome()
    
    # Conectar ao navegador remoto via WebSocket
    tab = await chrome.connect('ws://localhost:9222/devtools/browser/XXXX')
    
    # A aba retornada é a primeira aba disponível
    print(f"Conectado à aba: {await tab.execute_script('return document.title')}")
    
    # Você pode obter todas as outras abas também
    all_tabs = await chrome.get_opened_tabs()
    print(f"Total de abas disponíveis: {len(all_tabs)}")
    
    # Use a aba normalmente
    await tab.go_to('https://example.com')
    element = await tab.find(id='main-content')
    text = await element.text
    print(f"Conteúdo: {text}")
    
    # Limpeza
    await chrome.close()

asyncio.run(connect_to_remote_browser())
```

!!! tip "Obtendo a URL do WebSocket"
    Inicie o Chrome com a depuração habilitada:
    ```bash
    # Linux/Mac
    google-chrome --remote-debugging-port=9222
    
    # Windows
    "C:\Program Files\Google\Chrome\Application\chrome.exe" --remote-debugging-port=9222
    ```
    
    **Para conexões locais** (mesma máquina):
    
    - Visite `http://localhost:9222/json/version` no seu navegador para obter a URL do WebSocket no campo `webSocketDebuggerUrl`
    - Ou consulte programaticamente como mostrado no exemplo acima usando `aiohttp`
    - Para depuração rápida, você também pode verificar `browser._connection_port` após iniciar uma instância local do navegador
    
    **Para conexões remotas** (máquina diferente):
    
    - Consulte `http://SERVER_IP:9222/json/version` da sua máquina cliente
    - Use a `webSocketDebuggerUrl` da resposta, substituindo `localhost` pelo IP real do servidor, se necessário

### Método 2: Controle Direto de Elemento (Abordagem Híbrida)

Se você já tem sua própria integração CDP ou ferramentas de baixo nível, pode envolver elementos existentes com a API de alto nível do Pydoll:

```python
import asyncio
import json
from pydoll.connection.connection_handler import ConnectionHandler
from pydoll.elements.web_element import WebElement

async def custom_cdp_integration():
    """Use o Pydoll junto com sua implementação CDP personalizada."""
    # Sua configuração CDP existente encontrou um elemento
    page_ws = 'ws://localhost:9222/devtools/page/ABC123'
    
    # Você usou Runtime.evaluate para encontrar um elemento
    # e obteve seu objectId
    element_object_id = '{\"injectedScriptId\":1,\"id\":1}'
    
    # Criar conexão Pydoll
    connection = ConnectionHandler(ws_address=page_ws)
    
    # Envolver o elemento
    button = WebElement(
        object_id=element_object_id,
        connection_handler=connection
    )
    
    # Usar os métodos de alto nível do Pydoll
    await button.wait_until(is_visible=True, timeout=5)
    await button.wait_until(is_interactable=True)
    
    # Clicar com deslocamento realista
    await button.click(offset_x=5, offset_y=5)
    
    # Obter propriedades computadas facilmente
    is_enabled = await button.is_enabled()
    bounds = await button.bounds
    
    print(f"Botão clicado! Habilitado: {is_enabled}, Limites: {bounds}")
    
    # Limpeza
    await connection.close()

asyncio.run(custom_cdp_integration())
```

!!! tip "Formato do Object ID"
    O `objectId` é uma string retornada por comandos CDP como `Runtime.evaluate` ou `DOM.resolveNode`. Geralmente é uma string JSON com campos como `injectedScriptId` e `id`.


!!! info "O Melhor dos Dois Mundos"
    Esta abordagem híbrida permite que você aproveite sua infraestrutura CDP existente enquanto se beneficia da API ergonômica de elementos do Pydoll para interações, esperas e acesso a propriedades.

## Considerações de Segurança

!!! danger "Ambientes de Produção"
    Portas de depuração remota expõem **controle total** sobre o navegador, incluindo:
    
    - Acesso a todas as páginas e dados
    - Capacidade de executar JavaScript arbitrário
    - Acesso a cookies e sessões
    - Acesso ao sistema de arquivos via downloads
    
    **Nunca exponha portas de depuração à internet sem autenticação adequada e segurança de rede!**

### Práticas de Segurança Recomendadas

| Prática | Por quê | Como |
|---|---|---|
| **Túneis SSH** | Criptografa o tráfego e autentica | `ssh -L 9222:localhost:9222 user@host` |
| **VPN** | Segurança em nível de rede | Conectar via VPN corporativa/privada |
| **Regras de Firewall** | Restringir acesso | Permitir apenas IPs específicos |
| **Redes Docker** | Isolamento de contêiner | Usar redes Docker privadas |
| **Sem Exposição Pública** | Prevenir ataques | Nunca fazer bind para `0.0.0.0` em produção sem firewall, túnel ou proxy autenticado protegendo a porta |

## Leitura Adicional

- **[Sistema de Eventos](event-system.md)** - Monitore eventos remotos do navegador
- **[Monitoramento de Rede](../network/monitoring.md)** - Rastreie requisições em navegadores remotos
- **[Opções do Navegador](../configuration/browser-options.md)** - Configure navegadores locais antes de iniciar

!!! tip "Comece Local, Escale Remotamente"
    Desenvolva sua automação localmente com `browser.start()` para iterações rápidas, depois implante com `browser.connect()` para pipelines de CI/CD de produção e ambientes contêinerizados.

================================================
FILE: docs/pt/features/automation/file-operations.md
================================================
# Operações com Arquivos

Uploads de arquivos são um dos aspectos mais desafiadores da automação de navegadores. Ferramentas tradicionais frequentemente têm dificuldades com as caixas de diálogo de arquivo em nível de sistema operacional, exigindo soluções complexas ou bibliotecas externas. O Pydoll oferece duas abordagens diretas para lidar com uploads de arquivos, cada uma adequada para cenários diferentes.

## Métodos de Upload

O Pydoll suporta dois métodos principais para uploads de arquivos:

1.  **Entrada direta de arquivo** (`set_input_files()`): Rápido e direto, funciona com elementos `<input type="file">`
2.  **Gerenciador de contexto de seletor de arquivo** (`expect_file_chooser()`): Intercepta a caixa de diálogo de arquivo, funciona com qualquer gatilho de upload

## Entrada Direta de Arquivo

A abordagem mais simples é usar `set_input_files()` diretamente em elementos de entrada de arquivo. Este método é rápido, confiável e ignora totalmente a caixa de diálogo de arquivo do sistema operacional.

### Uso Básico

```python
import asyncio
from pathlib import Path
from pydoll.browser.chromium import Chrome

async def direct_file_upload():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com/upload')
        
        # Encontrar o elemento de entrada de arquivo
        file_input = await tab.find(tag_name='input', type='file')
        
        # Definir o arquivo diretamente
        file_path = Path('path/to/document.pdf')
        await file_input.set_input_files(file_path)
        
        # Enviar o formulário
        submit_button = await tab.find(id='submit-button')
        await submit_button.click()
        
        print("Arquivo enviado com sucesso!")

asyncio.run(direct_file_upload())
```

!!! tip "Path vs String"
    Embora objetos `Path` do `pathlib` sejam a prática recomendada, por facilitarem a manipulação de caminhos e a compatibilidade entre plataformas, você também pode usar strings simples, se preferir:
    ```python
    await file_input.set_input_files('path/to/document.pdf')  # Também funciona!
    ```

### Múltiplos Arquivos

Para entradas que aceitam múltiplos arquivos (`<input type="file" multiple>`), passe uma lista de caminhos de arquivo:

```python
import asyncio
from pathlib import Path
from pydoll.browser.chromium import Chrome

async def upload_multiple_files():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com/multi-upload')
        
        file_input = await tab.find(tag_name='input', type='file')
        
        # Fazer upload de múltiplos arquivos de uma vez
        files = [
            Path('documents/report.pdf'),
            Path('images/screenshot.png'),
            Path('data/results.csv')
        ]
        await file_input.set_input_files(files)
        
        # Prosseguir normalmente
        upload_btn = await tab.find(id='upload-btn')
        await upload_btn.click()

asyncio.run(upload_multiple_files())
```

### Resolução Dinâmica de Caminho

Objetos `Path` facilitam a construção dinâmica de caminhos e lidam com a compatibilidade entre plataformas:

```python
import asyncio
from pathlib import Path
from pydoll.browser.chromium import Chrome

async def upload_with_dynamic_paths():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com/upload')
        
        file_input = await tab.find(tag_name='input', type='file')
        
        # Construir caminhos dinamicamente
        project_dir = Path(__file__).parent
        file_path = project_dir / 'uploads' / 'data.json'

        await file_input.set_input_files(file_path)
        # Ou usar o diretório home
        user_file = Path.home() / 'Documents' / 'report.pdf'
        await file_input.set_input_files(user_file)

asyncio.run(upload_with_dynamic_paths())
```

!!! tip "Quando Usar a Entrada Direta de Arquivo"
    Use `set_input_files()` quando:
    
    - O input de arquivo está diretamente acessível no DOM
    - Você quer velocidade e simplicidade máximas
    - O upload não dispara uma caixa de diálogo de seletor de arquivo
    - Você está trabalhando com elementos `<input type="file">` padrão

## Gerenciador de Contexto de Seletor de Arquivo

Alguns sites escondem o input de arquivo e usam botões personalizados ou áreas de arrastar e soltar que disparam a caixa de diálogo de seletor de arquivo do sistema operacional. Para esses casos, use o gerenciador de contexto `expect_file_chooser()`.

### Como Funciona

O gerenciador de contexto `expect_file_chooser()`:

1.  Habilita a interceptação do seletor de arquivo
2.  Espera a caixa de diálogo do seletor de arquivo abrir
3.  Define automaticamente os arquivos quando a caixa de diálogo aparece
4.  Limpa os recursos após a conclusão da operação

### Uso Básico

```python
import asyncio
from pathlib import Path
from pydoll.browser.chromium import Chrome

async def file_chooser_upload():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com/custom-upload')
        
        # Preparar o caminho do arquivo
        file_path = Path.cwd() / 'document.pdf'
        
        # Usar gerenciador de contexto para lidar com o seletor de arquivo
        async with tab.expect_file_chooser(files=file_path):
            # Clicar no botão de upload personalizado
            upload_button = await tab.find(class_name='custom-upload-btn')
            await upload_button.click()
            # O arquivo é definido automaticamente quando a caixa de diálogo abre
        
        # Continuar com sua automação
        print("Arquivo selecionado via seletor!")

asyncio.run(file_chooser_upload())
```

### Múltiplos Arquivos com Seletor de Arquivo

```python
import asyncio
from pathlib import Path
from pydoll.browser.chromium import Chrome

async def multiple_files_chooser():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com/gallery-upload')
        
        # Preparar múltiplos arquivos
        photos_dir = Path.home() / 'photos'
        files = [
            photos_dir / 'img1.jpg',
            photos_dir / 'img2.jpg',
            photos_dir / 'img3.jpg'
        ]
        
        async with tab.expect_file_chooser(files=files):
            # Disparar upload via botão personalizado
            add_photos_btn = await tab.find(text='Add Photos')
            await add_photos_btn.click()
        
        print(f"{len(files)} arquivos selecionados!")

asyncio.run(multiple_files_chooser())
```

### Seleção Dinâmica de Arquivos

```python
import asyncio
from pathlib import Path
from pydoll.browser.chromium import Chrome

async def dynamic_file_selection():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com/batch-upload')
        
        # Encontrar todos os arquivos CSV em um diretório usando Path.glob()
        data_dir = Path('data')
        csv_files = list(data_dir.glob('*.csv'))
        
        async with tab.expect_file_chooser(files=csv_files):
            upload_area = await tab.find(class_name='drop-zone')
            await upload_area.click()
        
        print(f"Selecionados {len(csv_files)} arquivos CSV")

asyncio.run(dynamic_file_selection())
```

!!! tip "Quando Usar o Seletor de Arquivo"
    Use `expect_file_chooser()` quando:
    
    - O input de arquivo está oculto ou não diretamente acessível
    - Botões personalizados disparam a caixa de diálogo do seletor de arquivo
    - Trabalhando com áreas de upload de arrastar e soltar
    - O site usa JavaScript para abrir caixas de diálogo de arquivo

## Comparação: Direto vs Seletor de Arquivo

| Característica | `set_input_files()` | `expect_file_chooser()` |
|---|---|---|
| **Velocidade** | ⚡ Instantâneo | 🕐 Espera pela caixa de diálogo |
| **Complexidade** | Simples | Requer gerenciador de contexto |
| **Requisitos** | Input de arquivo visível | Qualquer gatilho de upload |
| **Caso de Uso** | Formulários padrão | UIs de upload personalizadas |
| **Tratamento de Eventos** | Não necessário | Usa eventos de página |

## Exemplo Completo

Aqui está um exemplo abrangente combinando ambas as abordagens:

```python
import asyncio
from pathlib import Path
from pydoll.browser.chromium import Chrome

async def comprehensive_upload_example():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com/upload-form')
        
        # Cenário 1: Entrada direta para foto de perfil (arquivo único)
        avatar_input = await tab.find(id='avatar-upload')
        avatar_path = Path.home() / 'Pictures' / 'profile.jpg'
        await avatar_input.set_input_files(avatar_path)
        
        # Esperar um pouco para a pré-visualização carregar
        await asyncio.sleep(1)
        
        # Cenário 2: Seletor de arquivo para upload de documento
        document_path = Path.cwd() / 'documents' / 'resume.pdf'
        async with tab.expect_file_chooser(files=document_path):
            # Botão estilizado personalizado que dispara o seletor de arquivo
            upload_btn = await tab.find(class_name='btn-upload-document')
            await upload_btn.click()
        
        # Esperar pela confirmação do upload
        await asyncio.sleep(2)
        
        # Cenário 3: Múltiplos arquivos via seletor de arquivo
        certs_dir = Path('certs')
        certificates = [
            certs_dir / 'certificate1.pdf',
            certs_dir / 'certificate2.pdf',
            certs_dir / 'certificate3.pdf'
        ]
        async with tab.expect_file_chooser(files=certificates):
            add_certs_btn = await tab.find(text='Add Certificates')
            await add_certs_btn.click()
        
        # Enviar o formulário completo
        submit_button = await tab.find(type='submit')
        await submit_button.click()
        
        # Esperar pela mensagem de sucesso
        success_msg = await tab.find(class_name='success-message', timeout=10)
        message_text = await success_msg.text
        print(f"Resultado do upload: {message_text}")

asyncio.run(comprehensive_upload_example())
```

!!! info "Resumo dos Métodos"
    Este exemplo demonstra a flexibilidade do sistema de upload de arquivos do Pydoll:
    
    - **Arquivos únicos**: Passe `Path` ou `str` diretamente (não precisa de lista)
    - **Múltiplos arquivos**: Passe uma lista de objetos `Path` ou `str`
    - **Entrada direta**: Rápido para elementos `<input>` visíveis
    - **Seletor de arquivo**: Funciona com botões de upload personalizados e inputs ocultos

## Aprenda Mais

Para um entendimento mais profundo dos mecanismos de upload de arquivos:

- **[Sistema de Eventos](../advanced/event-system.md)**: Aprenda sobre os eventos de página usados pelo `expect_file_chooser()`
- **[Análise Profunda: Domínio da Aba](../../deep-dive/tab-domain.md#file-chooser-handling)**: Detalhes técnicos sobre a interceptação do seletor de arquivo
- **[Análise Profunda: Sistema de Eventos](../../deep-dive/event-system.md#file-chooser-events)**: Como os eventos do seletor de arquivo funcionam internamente

As operações com arquivos no Pydoll eliminam um dos maiores pontos problemáticos na automação de navegadores, fornecendo métodos limpos e confiáveis tanto para cenários de upload simples quanto complexos.

================================================
FILE: docs/pt/features/automation/human-interactions.md
================================================
# Interações Semelhantes a Humanas

Um dos principais diferenciais entre uma automação bem-sucedida e bots facilmente detectados é o quão realistas são as interações. O Pydoll fornece ferramentas sofisticadas para tornar sua automação praticamente indistinguível do comportamento humano.

!!! info "Status das Funcionalidades"
    **Já Implementado:**

    - **Teclado Humanizado**: Velocidade de digitação variável, erros realistas com correção automática (passe `humanize=True`)
    - **Scroll Humanizado**: Rolagem baseada em física com momentum, fricção, jitter e overshoot (passe `humanize=True`)
    - **Mouse Humanizado**: Trajetórias com curvas de Bezier, temporização pela Lei de Fitts, velocidade minimum-jerk, tremor e overshoot (passe `humanize=True`)

    **Em Breve:**

    - **Deslocamentos de clique aleatórios automáticos**: Parâmetro opcional para randomizar automaticamente as posições de clique dentro dos elementos
    - **Comportamento de hover**: Atrasos e movimentos realistas ao passar o mouse sobre elementos

## Por que Interações Semelhantes a Humanas Importam

Sites modernos empregam técnicas sofisticadas de detecção de bots:

- **Análise de tempo de eventos**: Detectando ações impossivelmente rápidas ou perfeitamente cronometradas
- **Rastreamento de movimento do mouse**: Identificando movimentos em linha reta ou teletransporte instantâneo
- **Padrões de teclado**: Percebendo inserção de texto instantânea sem pressionamentos de tecla individuais
- **Posições de clique**: Detectando cliques sempre no centro exato dos elementos
- **Sequências de ação**: Identificando padrões não humanos no comportamento do usuário

O Pydoll ajuda você a evitar a detecção, fornecendo métodos de interação realistas que imitam o comportamento real do usuário.

## Movimento Realista do Mouse

A API de Mouse (`tab.mouse`) fornece controle humanizado do cursor com múltiplas camadas de realismo. Quando `humanize=True`, os movimentos do mouse seguem trajetórias naturais com curvas de Bezier, temporização pela Lei de Fitts, perfis de velocidade minimum-jerk, tremor fisiológico e correção de overshoot.

```python
from pydoll.browser.chromium import Chrome

async with Chrome() as browser:
    tab = await browser.start()
    await tab.go_to('https://example.com')

    # Mover com trajetória curva natural
    await tab.mouse.move(500, 300, humanize=True)

    # Clicar com movimento, deslocamento e temporização realistas
    await tab.mouse.click(500, 300, humanize=True)

    # Arrastar com movimento natural
    await tab.mouse.drag(100, 200, 500, 400, humanize=True)
```

Técnicas aplicadas durante operações humanizadas do mouse:

- **Trajetórias com curvas de Bezier**: Trajetórias curvas com pontos de controle assimétricos (mais curvatura no início do movimento)
- **Temporização pela Lei de Fitts**: A duração do movimento escala com a distância: `MT = a + b × log₂(D/W + 1)`
- **Velocidade minimum-jerk**: Perfil de velocidade em forma de sino, início lento, pico no meio, fim lento
- **Tremor fisiológico**: Ruído gaussiano (σ ≈ 1px) escalado inversamente com a velocidade
- **Overshoot e correção**: ~70% de chance de ultrapassar o alvo em 3–12% em movimentos rápidos, corrigindo a posição em seguida

!!! info "Documentação Dedicada de Controle do Mouse"
    Para documentação completa sobre controle do mouse, incluindo todos os métodos, configuração personalizada de temporização, rastreamento de posição e modo debug, veja **[Controle do Mouse](mouse-control.md)**.

## Cliques Realistas

### Clique Básico com Eventos de Mouse Simulados

O método `click()` simula eventos reais de pressionar e soltar o mouse, diferentemente de cliques baseados em JavaScript:

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def realistic_clicking():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com')
        
        button = await tab.find(id="submit-button")
        
        # Clique realista básico
        await button.click()
        
        # O clique inclui:
        # - Movimento do mouse até o elemento
        # - Evento de pressionar o mouse
        # - Tempo de espera (hold) configurável
        # - Evento de soltar o mouse

asyncio.run(realistic_clicking())
```

### Clique com Deslocamento de Posição (Offset)

Usuários reais raramente clicam no centro exato dos elementos. Use deslocamentos para variar as posições dos cliques:

!!! info "Estado Atual: Cálculo Manual de Deslocamento"
    Atualmente, você deve calcular manualmente e randomizar os deslocamentos de clique para cada interação. Versões futuras incluirão um parâmetro opcional para randomizar automaticamente as posições de clique dentro dos limites do elemento.

```python
import asyncio
import random
from pydoll.browser.chromium import Chrome

async def click_with_offset():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com/form')
        
        submit_button = await tab.find(tag_name="button", type="submit")
        
        # Clicar ligeiramente fora do centro (mais natural)
        await submit_button.click(
            x_offset=5,   # 5 pixels à direita do centro
            y_offset=-3   # 3 pixels acima do centro
        )
        
        # Atualmente: Varie manualmente o deslocamento para cada clique para parecer mais humano
        for item in await tab.find(class_name="clickable-item", find_all=True):
            offset_x = random.randint(-10, 10)
            offset_y = random.randint(-10, 10)
            await item.click(x_offset=offset_x, y_offset=offset_y)
            await asyncio.sleep(random.uniform(0.5, 2.0))

asyncio.run(click_with_offset())
```

### Tempo de Espera (Hold) do Clique Ajustável

Varie a duração do pressionamento do botão do mouse para simular diferentes estilos de clique:

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def variable_hold_time():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com')
        
        button = await tab.find(class_name="action-button")
        
        # Clique rápido (padrão é 0.1s)
        await button.click(hold_time=0.05)
        
        # Clique normal
        await button.click(hold_time=0.1)
        
        # Clique mais lento e deliberado
        await button.click(hold_time=0.2)
        
        # Simular hesitação do usuário
        await asyncio.sleep(0.8)
        await button.click(hold_time=0.15)

asyncio.run(variable_hold_time())
```

### Quando Usar click() vs click_using_js()

Entender a diferença é crucial para evitar detecção:

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def click_methods_comparison():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com')
        
        button = await tab.find(id="interactive-button")
        
        # Método 1: click() - Simula eventos reais do mouse
        # Dispara todos os eventos do mouse (mousedown, mouseup, click)
        # Respeita o posicionamento do elemento
        # Mais realista e mais difícil de detectar
        # Requer que o elemento esteja visível e dentro da viewport
        await button.click()
        
        # Método 2: click_using_js() - Usa JavaScript click()
        # Funciona em elementos ocultos
        # Execução mais rápida
        # Contorna sobreposições visuais
        # Pode ser detectado como automação
        # Não dispara a mesma sequência de eventos de um usuário real
        await button.click_using_js()

asyncio.run(click_methods_comparison())
```

!!! tip "Melhor Prática: Prefira Eventos do Mouse"
    Use `click()` para interações voltadas ao usuário para manter o realismo. Reserve `click_using_js()` para operações de backend, elementos ocultos, ou quando a velocidade é crítica e a detecção não é uma preocupação.

## Entrada de Texto Realista

A API de teclado do Pydoll fornece dois modos de digitação para equilibrar velocidade e furtividade.

!!! info "Entendendo os Modos de Digitação"
    | Modo | Parâmetros | Comportamento | Caso de Uso |
    |------|------------|---------------|-------------|
    | **Padrão (Rápido)** | `humanize=False` | Intervalos fixos de 50ms, sem erros | Cenários de velocidade, baixo risco (padrão) |
    | **Humanizado** | `humanize=True` | Timing variável, ~2% de taxa de erros com correção automática | **Evasão anti-bot** |

    O parâmetro `interval` está obsoleto. Passe `humanize=True` para digitação realista.

### Digitação Natural com Humanização

Quando `humanize=True` é passado, `type_text()` usa modo humanizado, simulando digitação humana realista com velocidades variáveis e erros ocasionais que são corrigidos automaticamente:

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def natural_typing():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com/login')
        
        username_field = await tab.find(id="username")
        password_field = await tab.find(id="password")

        # Velocidade variável: 30-120ms entre teclas
        # ~2% de taxa de erros com comportamento de correção realista
        await username_field.type_text("john.doe@example.com", humanize=True)
        await password_field.type_text("MyC0mpl3xP@ssw0rd!", humanize=True)

asyncio.run(natural_typing())
```

### Entrada Rápida para Campos Não Visíveis

Para campos que não exigem realismo (como campos ocultos ou operações de backend), use `insert_text()`:

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def fast_vs_realistic_input():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com/form')
        
        # Digitação realista para campos visíveis
        username = await tab.find(id="username")
        await username.click()
        await username.type_text("john_doe", interval=0.12)
        
        # Inserção rápida para campos ocultos ou de backend
        hidden_field = await tab.find(id="hidden-token")
        await hidden_field.insert_text("very-long-generated-token-12345678")
        
        # Digitação realista para campos que importam
        comment = await tab.find(id="comment-box")
        await comment.click()
        await comment.type_text("This looks like human input!", interval=0.15)

asyncio.run(fast_vs_realistic_input())
```

!!! info "Controle Avançado de Teclado"
    Para documentação abrangente sobre controle de teclado, incluindo teclas especiais, combinações de teclas, modificadores e tabelas de referência completas de teclas, veja **[Controle de Teclado](keyboard-control.md)**.

## Rolagem Realista da Página

O Pydoll fornece uma API dedicada de scroll que aguarda a conclusão da rolagem antes de prosseguir, tornando suas automações mais realistas e confiáveis.

!!! info "Entendendo os Modos de Scroll"
    A API de scroll do Pydoll oferece **três modos distintos**:

    | Modo | Parâmetros | Comportamento | Caso de Uso |
    |------|------------|---------------|-------------|
    | **Suave (Padrão)** | `smooth=True` | Animação CSS, previsível | Simulação de navegação geral (padrão) |
    | **Humanizado** | `humanize=True` | Motor de física com momentum, jitter, overshoot | **Evasão anti-bot** |
    | **Instantâneo** | `smooth=False` | Teletransporta para a posição imediatamente | Operações focadas em velocidade |

    Passe `humanize=True` para rolagem humanizada baseada em física para evasão anti-bot.

### Rolagem Básica por Direção

Use o método `scroll.by()` para rolar a página em qualquer direção com controle preciso:

```python
import asyncio
from pydoll.browser.chromium import Chrome
from pydoll.constants import ScrollPosition

async def basic_scrolling():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com/long-page')
        
        # Humanizado - motor de física com curvas de Bezier
        # Inclui: momentum, fricção, jitter, micro-pausas, overshoot
        await tab.scroll.by(ScrollPosition.DOWN, 500, humanize=True)
        await tab.scroll.by(ScrollPosition.UP, 300, humanize=True)

        # Animação CSS - visual agradável mas timing previsível
        await tab.scroll.by(ScrollPosition.DOWN, 500, humanize=False, smooth=True)

        # Teletransporta instantaneamente - mais rápido mas facilmente detectável
        await tab.scroll.by(ScrollPosition.DOWN, 1000, humanize=False, smooth=False)

asyncio.run(basic_scrolling())
```

### Rolagem para Posições Específicas

Navegue para o topo ou o final da página com controle sobre o realismo:

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def scroll_to_positions():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com/article')
        
        # Ler o início do artigo
        await asyncio.sleep(2.0)
        
        # Scroll humanizado (motor de física, evasão anti-bot)
        await tab.scroll.to_bottom(humanize=True)
        await asyncio.sleep(1.5)
        await tab.scroll.to_top(humanize=True)

        # Scroll suave CSS (animação previsível)
        await tab.scroll.to_bottom(humanize=False, smooth=True)
        await asyncio.sleep(1.5)
        await tab.scroll.to_top(humanize=False, smooth=True)

asyncio.run(scroll_to_positions())
```

!!! tip "Escolhendo o Modo Certo"
    - **`humanize=True`**: Melhor para evasão anti-bot
    - **Padrão** (`smooth=True`): Bom para demos, screenshots e automação geral
    - **`smooth=False`**: Velocidade máxima quando a furtividade não é uma preocupação

### Padrões de Rolagem Semelhantes a Humanos

O motor de scroll do Pydoll usa **Curvas de Bezier Cúbicas** para simular a física da rolagem humana. Isso inclui:

- **Momentum**: Explosão inicial de velocidade seguida de desaceleração gradual.
- **Fricção**: Desaceleração natural baseada em "resistência física".
- **Micro-pausas**: Breves paradas durante scrolls longos, imitando leitura ou movimento dos olhos.
- **Overshoot**: Rolagem ocasional além do alvo e correção de volta.

Este comportamento é automaticamente habilitado quando você usa `humanize=True`.

```python
import asyncio
import random
from pydoll.browser.chromium import Chrome
from pydoll.constants import ScrollPosition

async def human_like_scrolling():
    """Simular padrões de rolagem naturais ao ler um artigo."""
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com/article')
        
        # Usuário começa a ler do topo
        await asyncio.sleep(random.uniform(2.0, 4.0))
        
        # Rolar gradualmente enquanto lê
        # O motor de scroll cuida da física (aceleração/desaceleração)
        for _ in range(random.randint(5, 8)):
            # Distâncias de rolagem variadas (simula velocidade de leitura)
            scroll_distance = random.randint(300, 600)
            await tab.scroll.by(
                ScrollPosition.DOWN, 
                scroll_distance, 
                humanize=True  # Habilita física com curvas de Bezier
            )
            
            # Pausar para "ler" o conteúdo
            await asyncio.sleep(random.uniform(2.0, 5.0))
        
        # Scroll rápido para verificar o final
        await tab.scroll.to_bottom(humanize=True)
        await asyncio.sleep(random.uniform(1.0, 2.0))
        
        # Voltar ao topo para reler algo
        await tab.scroll.to_top(humanize=True)

asyncio.run(human_like_scrolling())
```

### Rolando Elementos para a Visão

Use `scroll_into_view()` para garantir que elementos estejam visíveis antes de capturar screenshots da página:

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def scroll_for_screenshots():
    """Rolar elementos para a visão antes de capturar screenshots da página."""
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com/product')
        
        # Rolar para seção de preços antes de tirar screenshot da página completa
        pricing_section = await tab.find(id="pricing")
        await pricing_section.scroll_into_view()
        await tab.take_screenshot(path="page_with_pricing.png")
        
        # Rolar para seção de avaliações antes do screenshot
        reviews = await tab.find(class_name="reviews")
        await reviews.scroll_into_view()
        await tab.take_screenshot(path="page_with_reviews.png")
        
        # Rolar para rodapé para capturar estado completo da página
        footer = await tab.find(tag_name="footer")
        await footer.scroll_into_view()
        await tab.take_screenshot(path="page_with_footer.png")
        
        # Nota: click() já rola automaticamente, então não é necessário:
        # await button.scroll_into_view()  # Desnecessário!
        # await button.click()  # Isso já rola o botão para a visão

asyncio.run(scroll_for_screenshots())
```

### Detectando Conteúdo de Scroll Infinito

Implemente padrões de rolagem para carregar conteúdo lazy-loaded:

```python
import asyncio
import random
from pydoll.browser.chromium import Chrome
from pydoll.constants import ScrollPosition

async def infinite_scroll_loading():
    """Carregar conteúdo em páginas com scroll infinito."""
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com/feed')
        
        items_loaded = 0
        max_scrolls = 10
        
        for scroll_num in range(max_scrolls):
            # Rolar até o final para acionar carregamento
            await tab.scroll.to_bottom(smooth=True)
            
            # Aguardar o conteúdo carregar
            await asyncio.sleep(random.uniform(2.0, 3.0))
            
            # Verificar se novos itens foram carregados
            items = await tab.find(class_name="feed-item", find_all=True)
            new_count = len(items)
            
            if new_count == items_loaded:
                print("Sem mais conteúdo para carregar")
                break
            
            items_loaded = new_count
            print(f"Rolagem {scroll_num + 1}: {items_loaded} itens carregados")
            
            # Pequena rolagem para cima (comportamento humano)
            if random.random() > 0.7:
                await tab.scroll.by(ScrollPosition.UP, 200, smooth=True)
                await asyncio.sleep(random.uniform(0.5, 1.0))

asyncio.run(infinite_scroll_loading())
```

!!! success "Espera Automática pela Conclusão"
    Diferentemente de `execute_script("window.scrollBy(...)")` que retorna imediatamente, a API `scroll` usa o parâmetro `awaitPromise` do CDP para aguardar o evento `scrollend` do navegador. Isso garante que suas ações subsequentes só executem após a rolagem terminar completamente.

## Combinando Técnicas para Máximo Realismo

### Exemplo Completo de Preenchimento de Formulário

Aqui está um exemplo abrangente combinando todas as técnicas de interação semelhantes a humanas. **Isso demonstra a abordagem manual atual** para alcançar o máximo realismo. Versões futuras automatizarão muito dessa aleatorização:

```python
import asyncio
import random
from pydoll.browser.chromium import Chrome
from pydoll.constants import Key

async def human_like_form_filling():
    """Preencher um formulário com máximo realismo para evitar detecção."""
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com/registration')
        
        # Esperar um pouco (usuário lendo a página)
        await asyncio.sleep(random.uniform(1.5, 3.0))
        
        # Preencher o primeiro nome com velocidade de digitação variável
        first_name = await tab.find(id="first-name")
        await first_name.click(
            x_offset=random.randint(-5, 5),
            y_offset=random.randint(-5, 5)
        )
        await asyncio.sleep(random.uniform(0.2, 0.5))
        
        # Digitação manual caractere por caractere com atrasos aleatórios
        # (`type_text(..., humanize=True)` já automatiza esse comportamento)
        name_text = "John"
        for char in name_text:
            await first_name.type_text(char, interval=0)
            await asyncio.sleep(random.uniform(0.08, 0.22))
        
        # Tab para o próximo campo
        await asyncio.sleep(random.uniform(0.3, 0.8))
        await first_name.press_keyboard_key(Key.TAB)
        
        # Preencher o sobrenome
        await asyncio.sleep(random.uniform(0.2, 0.5))
        last_name = await tab.find(id="last-name")
        await last_name.type_text("Doe", interval=random.uniform(0.1, 0.18))
        
        # Tab para o email
        await asyncio.sleep(random.uniform(0.4, 1.0))
        await last_name.press_keyboard_key(Key.TAB)
        
        # Preencher email com pausas realistas
        await asyncio.sleep(random.uniform(0.2, 0.5))
        email = await tab.find(id="email")
        
        email_text = "john.doe@example.com"
        for i, char in enumerate(email_text):
            await email.type_text(char, interval=0)
            # Pausa mais longa nos símbolos @ e . (natural)
            if char in ['@', '.']:
                await asyncio.sleep(random.uniform(0.2, 0.4))
            else:
                await asyncio.sleep(random.uniform(0.08, 0.2))
        
        # Simular usuário revisando o que digitou
        await asyncio.sleep(random.uniform(1.0, 2.5))
        
        # Aceitar checkbox de termos com deslocamento
        terms_checkbox = await tab.find(id="accept-terms")
        await terms_checkbox.click(
            x_offset=random.randint(-3, 3),
            y_offset=random.randint(-3, 3),
            hold_time=random.uniform(0.08, 0.15)
        )
        
        # Pausar antes de enviar (usuário revisando formulário)
        await asyncio.sleep(random.uniform(1.5, 3.0))
        
        # Clicar em enviar com parâmetros realistas
        submit_button = await tab.find(tag_name="button", type="submit")
        await submit_button.click(
            x_offset=random.randint(-8, 8),
            y_offset=random.randint(-5, 5),
            hold_time=random.uniform(0.1, 0.2)
        )
        
        print("Formulário enviado com comportamento semelhante ao humano")

asyncio.run(human_like_form_filling())
```

## Melhores Práticas para Evitar Detecção

!!! tip "Aleatorização Manual Atualmente Necessária"
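    As seguintes melhores práticas representam o **estado atual do Pydoll** para os pontos que ainda não são automatizados, como atrasos entre ações e deslocamentos de clique, nos quais você deve implementar a aleatorização manualmente. Digitação, rolagem e movimento do mouse já contam com `humanize=True`. Embora a abordagem manual exija mais código, ela oferece um controle refinado sobre o comportamento. Versões futuras automatizarão esses padrões, mantendo o mesmo nível de realismo.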

### 1. Sempre Adicione Atrasos Aleatórios

```python
import asyncio
import random
from pydoll.browser.chromium import Chrome

# Ruim: Tempo previsível
await element1.click()
await element2.click()
await element3.click()

# Bom: Tempo variável (atualmente necessário)
await element1.click()
await asyncio.sleep(random.uniform(0.5, 1.5))
await element2.click()
await asyncio.sleep(random.uniform(0.8, 2.0))
await element3.click()
```

### 2. Varie as Posições dos Cliques

```python
import asyncio
import random
from pydoll.browser.chromium import Chrome

# Ruim: Sempre clica no centro
for button in buttons:
    await button.click()

# Bom: Posições variadas (atualmente manual)
for button in buttons:
    await button.click(
        x_offset=random.randint(-10, 10),
        y_offset=random.randint(-10, 10)
    )
```

### 3. Simule Comportamento Natural do Usuário

```python
import asyncio
import random
from pydoll.browser.chromium import Chrome
from pydoll.constants import ScrollPosition

async def natural_user_simulation(tab):
    # Usuário chega na página
    await tab.go_to('https://example.com')
    
    # Usuário lê o conteúdo da página (1-3 segundos)
    await asyncio.sleep(random.uniform(1.0, 3.0))
    
    # Usuário rola para baixo para ver mais
    await tab.scroll.by(ScrollPosition.DOWN, 300, smooth=True)
    await asyncio.sleep(random.uniform(0.5, 1.5))
    
    # Usuário encontra e clica no botão
    button = await tab.find(class_name="cta-button")
    await button.click(
        x_offset=random.randint(-5, 5),
        y_offset=random.randint(-5, 5)
    )
    
    # Usuário espera o conteúdo carregar
    await asyncio.sleep(random.uniform(0.8, 1.5))
```

### 4. Combine Múltiplas Técnicas

```python
import asyncio
import random
from pydoll.browser.chromium import Chrome
from pydoll.constants import ScrollPosition

async def advanced_stealth_automation():
    """Combinar múltiplas técnicas para máxima furtividade."""
    async with Chrome() as browser:
        tab = await browser.start()
        
        # Usar espera de carregamento de página semelhante à humana
        await tab.go_to('https://example.com/sensitive-page')
        await asyncio.sleep(random.uniform(2.0, 4.0))
        
        # Rolar realisticamente com a API dedicada
        for _ in range(random.randint(2, 4)):
            scroll_amount = random.randint(200, 500)
            await tab.scroll.by(ScrollPosition.DOWN, scroll_amount, smooth=True)
            await asyncio.sleep(random.uniform(0.8, 2.0))
        
        # Encontrar elemento com timeout (simulando busca do usuário)
        target = await tab.find(
            class_name="target-element",
            timeout=random.randint(3, 7)
        )
        
        # Clicar com todos os parâmetros realistas
        await target.click(
            x_offset=random.randint(-12, 12),
            y_offset=random.randint(-8, 8),
            hold_time=random.uniform(0.09, 0.18)
        )
        
        # Tempo de reação humano
        await asyncio.sleep(random.uniform(0.5, 1.2))

asyncio.run(advanced_stealth_automation())
```

## Trocas entre Desempenho e Realismo

Às vezes, você precisa equilibrar velocidade com realismo:

```python
import asyncio
import random
from pydoll.browser.chromium import Chrome

async def balanced_automation():
    """Escolher o nível de realismo apropriado com base no contexto."""
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com/scraping-target')
        
        # Fase 1: Interação inicial (alto realismo)
        # É quando os sistemas de detecção estão mais ativos
        login_button = await tab.find(text="Login")
        await asyncio.sleep(random.uniform(1.0, 2.0))
        await login_button.click(
            x_offset=random.randint(-5, 5),
            y_offset=random.randint(-5, 5)
        )
        
        await asyncio.sleep(random.uniform(0.5, 1.0))
        
        username = await tab.find(id="username")
        await username.type_text("user@example.com", interval=0.12)
        
        await asyncio.sleep(random.uniform(0.3, 0.7))
        
        password = await tab.find(id="password")
        await password.type_text("password123", interval=0.10)
        
        submit = await tab.find(type="submit")
        await asyncio.sleep(random.uniform(0.8, 1.5))
        await submit.click()
        
        # Fase 2: Extração de dados autenticada (menos realismo, mais velocidade)
        # Menos escrutínio após autenticação bem-sucedida
        await asyncio.sleep(2)
        
        # Navegação rápida pelas páginas
        items = await tab.find(class_name="data-item", find_all=True)
        
        for item in items:
            # Clique rápido sem deslocamentos
            await item.click_using_js()
            await asyncio.sleep(0.3)  # Atraso mínimo
            
            # Extrair dados
            title = await tab.find(class_name="title")
            data = await title.text
            
            # Navegação rápida
            await tab.execute_script("window.history.back()")
            await asyncio.sleep(0.5)

asyncio.run(balanced_automation())
```

## Monitorando e Ajustando

Teste o realismo da sua automação:

```python
import asyncio
import random
import time
from pydoll.browser.chromium import Chrome

async def test_interaction_timing():
    """Registrar tempos para garantir padrões realistas."""
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com/test-page')
        
        # Medir e registrar o tempo de interação
        elements = await tab.find(class_name="clickable", find_all=True)
        
        timings = []
        last_time = time.time()
        
        for i, element in enumerate(elements):
            await element.click(
                x_offset=random.randint(-8, 8),
                y_offset=random.randint(-8, 8)
            )
            
            current_time = time.time()
            elapsed = current_time - last_time
            timings.append(elapsed)
            
            print(f"Clique {i+1}: {elapsed:.3f}s desde a última ação")
            last_time = current_time
            
            await asyncio.sleep(random.uniform(0.5, 2.0))
        
        # Analisar distribuição de tempo
        avg_time = sum(timings) / len(timings)
        print(f"\nTempo médio entre ações: {avg_time:.3f}s")
        print(f"Min: {min(timings):.3f}s, Max: {max(timings):.3f}s")
        
        # Bom: Tempo variável com média realista (1-2 segundos)
        # Ruim: Tempo constante ou irrealisticamente rápido (<0.1s)

asyncio.run(test_interaction_timing())
```

## Aprenda Mais

Para mais informações sobre métodos de interação com elementos:

- **[Localização de Elementos](../element-finding.md)**: Localize elementos para interagir
- **[Domínio WebElement](../../deep-dive/webelement-domain.md)**: Análise profunda das capacidades do WebElement
- **[Operações com Arquivos](file-operations.md)**: Faça upload de arquivos e lide com downloads

Domine as interações semelhantes a humanas, e sua automação será mais confiável, mais difícil de detectar e espelhará mais de perto o comportamento real do usuário.

================================================
FILE: docs/pt/features/automation/iframes.md
================================================
# Trabalhando com IFrames

Páginas modernas usam `<iframe>` para embutir outros documentos. Nas versões antigas do Pydoll era necessário transformar o iframe em uma `Tab` com `tab.get_frame()` e cuidar de alvos CDP manualmente. **Isso acabou.**  
Agora um iframe se comporta como qualquer outro `WebElement`: você pode chamar `find()`, `query()`, `execute_script()`, `inner_html`, `text` e todos os utilitários diretamente — o Pydoll encaminha a operação para o contexto correto em qualquer domínio.

!!! info "Modelo mental simples"
    Pense no iframe como mais uma `div`. Localize o elemento, guarde a referência e continue a navegação a partir dele. O Pydoll se encarrega de criar o mundo isolado, configurar o contexto JavaScript e lidar com iframes aninhados automaticamente.

## Guia rápido

### Interagir com o primeiro iframe da página

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def interagir_iframe():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com/page-with-iframe')

        iframe = await tab.find(tag_name='iframe', id='content-frame')

        # As chamadas abaixo já executam dentro do iframe
        title = await iframe.find(tag_name='h1')
        await title.click()

        form = await iframe.find(id='login-form')
        username = await form.find(name='username')
        await username.type_text('john_doe')

asyncio.run(interagir_iframe())
```

### Iframes aninhados

Basta encadear as buscas:

```python
outer = await tab.find(id='outer-frame')
inner = await outer.find(tag_name='iframe')  # procura dentro do primeiro iframe

submit_button = await inner.find(id='submit')
await submit_button.click()
```

O fluxo é sempre o mesmo:

1. Localize o iframe desejado.
2. Use esse `WebElement` como escopo das próximas buscas.
3. Repita para níveis mais profundos, se necessário.

### Executar JavaScript dentro do iframe

```python
iframe = await tab.find(tag_name='iframe')
result = await iframe.execute_script('return document.title', return_by_value=True)
print(result['result']['result']['value'])
```

O Pydoll garante que o script rode no contexto isolado do iframe, inclusive em frames cross-origin.

## Por que ficou melhor?

- **Intuitivo:** você programa exatamente o que vê na árvore DOM.
- **Sem dor de cabeça com CDP:** mundos isolados e targets são configurados automaticamente.
- **Suporte nativo a aninhamento:** cada busca é relativa ao elemento atual; hierarquias profundas continuam legíveis.
- **Uma única API:** não é preciso alternar entre métodos de `Tab` e de `WebElement`.

!!! warning "Aviso de descontinuação"
    `Tab.get_frame()` agora emite `DeprecationWarning` e será removido em uma versão futura. Atualize seus scripts para usar o iframe diretamente, como mostrado acima.

## Padrões comuns

### Capturar imagem de conteúdo dentro do iframe

```python
iframe = await tab.find(tag_name='iframe')
chart = await iframe.find(id='sales-chart')
await chart.take_screenshot('chart.png')
```

### Iterar sobre vários iframes

```python
iframes = await tab.find(tag_name='iframe', find_all=True)
for frame in iframes:
    heading = await frame.find(tag_name='h2')
    print(await heading.text)
```

### Aguardar até que um iframe esteja pronto

```python
iframe = await tab.find(tag_name='iframe')
await iframe.wait_until(is_visible=True, timeout=10)
banner = await iframe.find(id='promo-banner')
```

## Seletores que Cruzam IFrames

Em vez de localizar manualmente cada iframe e depois buscar dentro dele, você pode escrever um **único seletor** que cruza as fronteiras do iframe. O Pydoll detecta automaticamente os passos `iframe` no seu XPath ou CSS, divide em segmentos e percorre a cadeia de iframes por você.

### Seletores CSS

Use qualquer combinador padrão (`>`, espaço) após um seletor composto `iframe`:

```python
# Cruzamento de um único iframe
button = await tab.query('iframe > .submit-btn')

# Com seletores de atributo no iframe
button = await tab.query('iframe[src*="checkout"] > #pay-button')

# Iframes aninhados
element = await tab.query('iframe.outer > iframe.inner > div.content')

# Múltiplos passos após o iframe
link = await tab.query('iframe > nav > a.home-link')

# Iframe dentro de outro elemento (não na raiz)
button = await tab.query('div > iframe > button.submit')
content = await tab.query('.wrapper iframe > div.content')
```

### Expressões XPath

Use `/` ou `//` após um passo `iframe` — o Pydoll divide a expressão no nó do iframe:

```python
# Cruzamento de um único iframe
button = await tab.query('//iframe/body/button[@id="submit"]')

# Iframe dentro de outro elemento (não na raiz)
div = await tab.query('//div/iframe/div')
item = await tab.query('//div[@class="wrapper"]/iframe/body/div')

# Com predicados no iframe
heading = await tab.query('//iframe[contains(@src, "cloudflare")]//h1')

# Iframes aninhados
element = await tab.query('//iframe[@id="outer"]//iframe[@id="inner"]//div')
```

### Como funciona

Quando o Pydoll encontra um seletor como `iframe[src*="checkout"] > form > button`:

1. **Analisa** o seletor em segmentos: `iframe[src*="checkout"]` e `form > button`
2. **Encontra** o elemento iframe usando o primeiro segmento
3. **Busca dentro** do iframe usando o segundo segmento
4. Para iframes aninhados, repete o processo em cada fronteira

Isso equivale à abordagem manual, mas em uma única chamada:

```python
# Manual (continua funcionando)
iframe = await tab.find(tag_name='iframe', src='*checkout*')
button = await iframe.query('form > button')

# Automático (mesmo resultado, uma linha)
button = await tab.query('iframe[src*="checkout"] > form > button')
```

### Quando a divisão NÃO acontece

Seletores só são divididos quando `iframe` aparece como **nome de tag**. Estes seletores passam inalterados:

- `.iframe > body` — seletor de classe, não de tag
- `#iframe > body` — seletor de ID
- `div.iframe > body` — tag é `div`, não `iframe`
- `[data-type="iframe"] > body` — seletor de atributo
- `iframe` ou `//iframe` — sem conteúdo após o iframe (nada para buscar dentro)

### Suporte a find_all

O último segmento respeita `find_all=True`, retornando todos os elementos correspondentes dentro do iframe final:

```python
# Obter todos os links dentro de um iframe
links = await tab.query('iframe > a', find_all=True)
```

## Boas práticas

- **Use o iframe como escopo:** prefira chamar `find`, `query` e derivados diretamente nele.
- **Evite `tab.find` para elementos internos:** ele só enxerga o documento principal.
- **Guarde referências úteis:** o contexto é cacheado pelo Pydoll.
- **Continue aplicando os mesmos fluxos:** rolagem, screenshots, waits, scripts, atributos e texto funcionam igual a qualquer outro elemento.

## Leituras recomendadas

- **[Busca de Elementos](../element-finding.md)** – explica buscas encadeadas e escopos.
- **[Capturas e PDFs](screenshots-and-pdfs.md)** – detalhes sobre captura de tela.
- **[Sistema de Eventos](../advanced/event-system.md)** – monitore eventos de forma reativa (inclusive de iframes).

Com o novo fluxo, iframes deixam de ser um caso especial: são apenas mais um nó na árvore DOM. Concentre-se na lógica da automação; o Pydoll cuida da parte difícil para você.


================================================
FILE: docs/pt/features/automation/keyboard-control.md
================================================
# Controle de Teclado

A API de Teclado fornece controle completo sobre a entrada de teclado no nível da página, permitindo que você simule digitação realista, execute atalhos e controle sequências complexas de teclas. Diferente dos métodos de teclado em nível de elemento, a API de Teclado opera globalmente na página, dando a você a flexibilidade de interagir com qualquer elemento focado ou acionar ações de teclado em nível de página.

!!! info "Interface de Teclado Centralizada"
    Todas as operações de teclado são acessíveis via `tab.keyboard`, fornecendo uma API limpa e unificada para todas as interações de teclado.

!!! warning "Limitação Importante do CDP: Atalhos de UI do Navegador Não Funcionam"
    **Problema Conhecido**: Eventos injetados via Chrome DevTools Protocol são marcados como "não confiáveis" e **não** acionam ações da UI do navegador ou criam gestos de usuário.
    
    **O que NÃO funciona:**

    - Atalhos do navegador (Ctrl+T, Ctrl+W, Ctrl+N)
    - Atalhos de DevTools (F12, Ctrl+Shift+I)
    - Navegação do navegador (Ctrl+Shift+T para reabrir abas)
    - Qualquer atalho que modifica a UI ou janelas do navegador
    
    **O que funciona perfeitamente:**

    - Atalhos em nível de página (Ctrl+A, Ctrl+C, Ctrl+V, Ctrl+F)
    - Seleção e manipulação de texto
    - Navegação em formulários (Tab, Enter, teclas de seta)
    - Interações com campos de entrada
    - Atalhos personalizados de aplicações (em web apps)
    
    **Razão técnica**: Eventos CDP não criam os "gestos de usuário" exigidos pela segurança do navegador. Veja [chromium issue #615341](https://bugs.chromium.org/p/chromium/issues/detail?id=615341) e [documentação CDP](https://chromedevtools.github.io/devtools-protocol/tot/Input/#method-dispatchKeyEvent).
    
    Para automação em nível de navegador, use comandos CDP do navegador diretamente (como `tab.close()`, `browser.new_tab()`) em vez de atalhos de teclado.

## Início Rápido

A API de Teclado fornece três métodos principais:

```python
from pydoll.browser import Chrome
from pydoll.constants import Key

async with Chrome() as browser:
    tab = await browser.start()
    await tab.go_to('https://example.com')
    
    # Pressionar e soltar uma tecla
    await tab.keyboard.press(Key.ENTER)
    
    # Executar uma combinação de atalho
    await tab.keyboard.hotkey(Key.CONTROL, Key.S)  # Ctrl+S
    
    # Controle manual
    await tab.keyboard.down(Key.SHIFT)
    await tab.keyboard.press(Key.ARROWRIGHT)
    await tab.keyboard.up(Key.SHIFT)
```

## Métodos Principais

### Press: Ação Completa de Tecla

O método `press()` executa um ciclo completo de pressionamento de tecla (pressionar → aguardar → soltar):

```python
from pydoll.constants import Key

# Pressionamento básico de tecla
await tab.keyboard.press(Key.ENTER)
await tab.keyboard.press(Key.TAB)
await tab.keyboard.press(Key.ESCAPE)

# Pressionar com modificadores
await tab.keyboard.press(Key.S, modifiers=2)  # Ctrl+S (modificador manual)

# Duração personalizada de manutenção
await tab.keyboard.press(Key.SPACE, interval=0.5)  # Manter por 500ms
```

**Parâmetros:**

- `key`: Tecla a ser pressionada (do enum `Key`)
- `modifiers` (opcional): Flags de modificadores (Alt=1, Ctrl=2, Meta=4, Shift=8)
- `interval` (opcional): Duração para manter a tecla em segundos (padrão: 0.1)

### Down: Pressionar Tecla Sem Soltar

O método `down()` pressiona uma tecla sem soltá-la, útil para manter modificadores ou criar sequências de teclas:

```python
from pydoll.constants import Key

# Manter Shift enquanto pressiona outras teclas
await tab.keyboard.down(Key.SHIFT)
await tab.keyboard.press(Key.ARROWRIGHT)  # Selecionar texto
await tab.keyboard.press(Key.ARROWRIGHT)  # Continuar selecionando
await tab.keyboard.up(Key.SHIFT)

# Pressionar com flags de modificador
await tab.keyboard.down(Key.A, modifiers=2)  # Ctrl+A (selecionar tudo)
```

**Parâmetros:**

- `key`: Tecla a ser pressionada
- `modifiers` (opcional): Flags de modificadores a aplicar

### Up: Soltar uma Tecla

O método `up()` solta uma tecla previamente pressionada:

```python
from pydoll.constants import Key

# Sequência manual de teclas
await tab.keyboard.down(Key.CONTROL)
await tab.keyboard.down(Key.SHIFT)
await tab.keyboard.press(Key.T)  # Ctrl+Shift+T
await tab.keyboard.up(Key.SHIFT)
await tab.keyboard.up(Key.CONTROL)
```

**Parâmetros:**

- `key`: Tecla a ser solta

!!! tip "Quando Usar Cada Método"

    - **`press()`**: Ações de tecla única (Enter, Tab, letras)
    - **`hotkey()`**: Atalhos de teclado (Ctrl+C, Ctrl+Shift+T)
    - **`down()`/`up()`**: Sequências complexas, manter modificadores, temporização personalizada

## Hotkeys: Atalhos de Teclado Simplificados

O método `hotkey()` detecta automaticamente teclas modificadoras e executa atalhos corretamente:

### Hotkeys Básicos

```python
from pydoll.constants import Key

# Atalhos comuns
await tab.keyboard.hotkey(Key.CONTROL, Key.C)  # Copiar
await tab.keyboard.hotkey(Key.CONTROL, Key.V)  # Colar
await tab.keyboard.hotkey(Key.CONTROL, Key.X)  # Recortar
await tab.keyboard.hotkey(Key.CONTROL, Key.Z)  # Desfazer
await tab.keyboard.hotkey(Key.CONTROL, Key.Y)  # Refazer
await tab.keyboard.hotkey(Key.CONTROL, Key.A)  # Selecionar tudo
await tab.keyboard.hotkey(Key.CONTROL, Key.S)  # Salvar

```

### Combinações de Três Teclas

```python
from pydoll.constants import Key

# Atalhos de edição de texto (estes funcionam!)
await tab.keyboard.hotkey(Key.CONTROL, Key.SHIFT, Key.ARROWLEFT)  # Selecionar palavra à esquerda
await tab.keyboard.hotkey(Key.CONTROL, Key.SHIFT, Key.ARROWRIGHT)  # Selecionar palavra à direita
await tab.keyboard.hotkey(Key.CONTROL, Key.SHIFT, Key.HOME)  # Selecionar até o início do documento
await tab.keyboard.hotkey(Key.CONTROL, Key.SHIFT, Key.END)  # Selecionar até o fim do documento

# Atalhos específicos de aplicação (se suportados pelo web app)
await tab.keyboard.hotkey(Key.CONTROL, Key.SHIFT, Key.Z)  # Refazer em muitos apps
await tab.keyboard.hotkey(Key.CONTROL, Key.SHIFT, Key.S)  # Salvar Como (se o app suportar)
```

### Atalhos Específicos de Plataforma

```python
import sys
from pydoll.constants import Key

# Usar Meta (Command) no macOS, Control no Windows/Linux
modifier = Key.META if sys.platform == 'darwin' else Key.CONTROL

await tab.keyboard.hotkey(modifier, Key.C)  # Copiar (consciente da plataforma)
await tab.keyboard.hotkey(modifier, Key.V)  # Colar (consciente da plataforma)
```

### Como Funcionam os Hotkeys

O método `hotkey()` lida inteligentemente com teclas modificadoras:

1. **Detecta modificadores**: Identifica automaticamente Ctrl, Shift, Alt, Meta
2. **Calcula flags**: Combina modificadores usando OR bit a bit (Ctrl=2, Shift=8 → 10)
3. **Aplica corretamente**: Pressiona teclas não-modificadoras com flags de modificador aplicadas
4. **Liberação limpa**: Solta teclas em ordem reversa

```python
from pydoll.constants import Key

# Nos bastidores para hotkey(Key.CONTROL, Key.SHIFT, Key.T):
# 1. Detecta: modifiers=[CONTROL, SHIFT], keys=[T]
# 2. Calcula: modifier_value = 2 | 8 = 10
# 3. Executa: pressiona T com modifiers=10
# 4. Libera: solta T
```

!!! tip "Valores de Modificador"
    Ao usar o parâmetro `modifiers` manualmente:

    - Alt = 1
    - Ctrl = 2
    - Meta/Command = 4
    - Shift = 8
    
    Combine-os: Ctrl+Shift = 2 + 8 = 10

## Teclas Disponíveis

O enum `Key` fornece cobertura abrangente do teclado:

### Teclas de Letras (A-Z)

```python
from pydoll.constants import Key

# Todas as letras A a Z
await tab.keyboard.press(Key.A)
await tab.keyboard.press(Key.Z)
```

### Teclas Numéricas

```python
from pydoll.constants import Key

# Números da linha superior (0-9)
await tab.keyboard.press(Key.DIGIT0)
await tab.keyboard.press(Key.DIGIT9)

# Números do teclado numérico
await tab.keyboard.press(Key.NUMPAD0)
await tab.keyboard.press(Key.NUMPAD9)
```

### Teclas de Função

```python
from pydoll.constants import Key

# F1 até F12
await tab.keyboard.press(Key.F1)
await tab.keyboard.press(Key.F12)
```

### Teclas de Navegação

```python
from pydoll.constants import Key

await tab.keyboard.press(Key.ARROWUP)
await tab.keyboard.press(Key.ARROWDOWN)
await tab.keyboard.press(Key.ARROWLEFT)
await tab.keyboard.press(Key.ARROWRIGHT)
await tab.keyboard.press(Key.HOME)
await tab.keyboard.press(Key.END)
await tab.keyboard.press(Key.PAGEUP)
await tab.keyboard.press(Key.PAGEDOWN)
```

### Teclas Modificadoras

```python
from pydoll.constants import Key

await tab.keyboard.press(Key.CONTROL)
await tab.keyboard.press(Key.SHIFT)
await tab.keyboard.press(Key.ALT)
await tab.keyboard.press(Key.META)  # Command no macOS, tecla Windows no Windows
```

### Teclas Especiais

```python
from pydoll.constants import Key

await tab.keyboard.press(Key.ENTER)
await tab.keyboard.press(Key.TAB)
await tab.keyboard.press(Key.SPACE)
await tab.keyboard.press(Key.BACKSPACE)
await tab.keyboard.press(Key.DELETE)
await tab.keyboard.press(Key.ESCAPE)
await tab.keyboard.press(Key.INSERT)
```

## Exemplos Práticos

### Navegação em Formulários

```python
from pydoll.browser import Chrome
from pydoll.constants import Key

async def fill_form_with_keyboard():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com/form')
        
        # Focar no primeiro campo e digitar
        first_field = await tab.find(id='name')
        await first_field.click()
        await first_field.insert_text('João Silva')
        
        # Navegar para o próximo campo com Tab
        await tab.keyboard.press(Key.TAB)
        await tab.keyboard.press(Key.TAB)  # Pular um campo
        
        # Digitar no campo atualmente focado
        second_field = await tab.find(id='email')
        await second_field.insert_text('joao@example.com')
        
        # Enviar com Enter
        await tab.keyboard.press(Key.ENTER)
```

### Seleção e Manipulação de Texto

```python
from pydoll.constants import Key

async def select_and_replace_text():
    # Selecionar todo o texto
    await tab.keyboard.hotkey(Key.CONTROL, Key.A)
    
    # Copiar seleção
    await tab.keyboard.hotkey(Key.CONTROL, Key.C)
    
    # Mover para o fim
    await tab.keyboard.press(Key.END)
    
    # Selecionar palavra por palavra
    await tab.keyboard.down(Key.CONTROL)
    await tab.keyboard.down(Key.SHIFT)
    await tab.keyboard.press(Key.ARROWLEFT)
    await tab.keyboard.press(Key.ARROWLEFT)
    await tab.keyboard.up(Key.SHIFT)
    await tab.keyboard.up(Key.CONTROL)
    
    # Deletar seleção
    await tab.keyboard.press(Key.DELETE)
```

### Navegação em Dropdown e Select

```python
from pydoll.constants import Key

async def navigate_dropdown():
    # Abrir dropdown
    select = await tab.find(tag_name='select')
    await select.click()
    
    # Navegar opções com teclas de seta
    await tab.keyboard.press(Key.ARROWDOWN)
    await tab.keyboard.press(Key.ARROWDOWN)
    
    # Selecionar com Enter
    await tab.keyboard.press(Key.ENTER)
    
    # Ou cancelar com Escape
    await tab.keyboard.press(Key.ESCAPE)
```

### Sequências Complexas de Teclas

```python
from pydoll.constants import Key
import asyncio

async def complex_editing():
    # Selecionar linha
    await tab.keyboard.press(Key.HOME)  # Ir para o início
    await tab.keyboard.down(Key.SHIFT)
    await tab.keyboard.press(Key.END)  # Selecionar até o fim
    await tab.keyboard.up(Key.SHIFT)
    
    # Recortar
    await tab.keyboard.hotkey(Key.CONTROL, Key.X)
    
    # Mover para baixo e colar
    await tab.keyboard.press(Key.ARROWDOWN)
    await tab.keyboard.hotkey(Key.CONTROL, Key.V)
    
    # Desfazer se necessário
    await tab.keyboard.hotkey(Key.CONTROL, Key.Z)
```

## Melhores Práticas

### 1. Adicione Atrasos para Confiabilidade

```python
from pydoll.constants import Key
import asyncio

# Bom: Aguardar atualização da UI
await tab.keyboard.hotkey(Key.CONTROL, Key.F)  # Abrir busca
await asyncio.sleep(0.2)  # Aguardar diálogo
await tab.keyboard.press(Key.ESCAPE)  # Fechá-lo

# Ruim: Sem atraso, pode não funcionar
await tab.keyboard.hotkey(Key.CONTROL, Key.F)
await tab.keyboard.press(Key.ESCAPE)  # Pode ser rápido demais
```

### 2. Focar Elementos Antes de Digitar

```python
from pydoll.constants import Key

# Bom: Garantir que o elemento está focado
input_field = await tab.find(id='search')
await input_field.click()  # Focá-lo
await input_field.insert_text('consulta')

# Ruim: Entrada de teclado vai para elemento errado
await tab.keyboard.press(Key.A)  # Para onde isso vai?
```

### 3. Use Atalhos Conscientes da Plataforma

```python
import sys
from pydoll.constants import Key

# Bom: Consciente da plataforma
cmd_key = Key.META if sys.platform == 'darwin' else Key.CONTROL
await tab.keyboard.hotkey(cmd_key, Key.C)

# Ruim: Hardcoded (não funcionará no macOS)
await tab.keyboard.hotkey(Key.CONTROL, Key.C)
```

### 4. Limpe Sequências Longas

```python
from pydoll.constants import Key

# Bom: Garantir que modificadores sejam liberados
try:
    await tab.keyboard.down(Key.SHIFT)
    await tab.keyboard.press(Key.ARROWRIGHT)
    # ... mais operações
finally:
    await tab.keyboard.up(Key.SHIFT)  # Sempre liberar

# Ruim: Modificador fica pressionado em erro
await tab.keyboard.down(Key.SHIFT)
await tab.keyboard.press(Key.ARROWRIGHT)
# Erro aqui deixa Shift pressionado!
```

## Tabelas de Referência de Teclas

### Atalhos Comuns em Nível de Página (Estes Funcionam!)

| Ação | Windows/Linux | macOS | Notas |
|------|--------------|-------|-------|
| Copiar | Ctrl+C | Cmd+C | Funciona |
| Colar | Ctrl+V | Cmd+V | Funciona |
| Recortar | Ctrl+X | Cmd+X | Funciona |
| Desfazer | Ctrl+Z | Cmd+Z | Funciona |
| Refazer | Ctrl+Y | Cmd+Y | Funciona |
| Selecionar Tudo | Ctrl+A | Cmd+A | Funciona |
| Localizar | Ctrl+F | Cmd+F | Apenas se o web app implementar |
| Salvar | Ctrl+S | Cmd+S | Apenas se o web app implementar |
| Atualizar | F5 ou Ctrl+R | Cmd+R | Use `await tab.refresh()` |

### Atalhos do Navegador (Estes NÃO Funcionam via CDP)

| Ação | Atalho | Use Ao Invés |
|------|--------|--------------|
| Nova Aba | Ctrl+T | `await browser.new_tab()` |
| Fechar Aba | Ctrl+W | `await tab.close()` |
| Reabrir Aba | Ctrl+Shift+T | Rastreie abas manualmente |
| DevTools | F12, Ctrl+Shift+I | Já disponível via CDP! |
| Barra de Endereço | Ctrl+L | `await tab.go_to(url)` |

### Todas as Teclas Disponíveis

| Categoria | Teclas |
|-----------|--------|
| **Letras** | `Key.A` até `Key.Z` (26 teclas) |
| **Números** | `Key.DIGIT0` até `Key.DIGIT9` (10 teclas) |
| **Teclado Numérico** | `Key.NUMPAD0` até `Key.NUMPAD9`, `NUMPADMULTIPLY`, `NUMPADADD`, `NUMPADSUBTRACT`, `NUMPADDECIMAL`, `NUMPADDIVIDE` |
| **Função** | `Key.F1` até `Key.F12` (12 teclas) |
| **Navegação** | `ARROWUP`, `ARROWDOWN`, `ARROWLEFT`, `ARROWRIGHT`, `HOME`, `END`, `PAGEUP`, `PAGEDOWN` |
| **Modificadores** | `CONTROL`, `SHIFT`, `ALT`, `META` |
| **Especiais** | `ENTER`, `TAB`, `SPACE`, `BACKSPACE`, `DELETE`, `ESCAPE`, `INSERT` |
| **Bloqueios** | `CAPSLOCK`, `NUMLOCK`, `SCROLLLOCK` |
| **Símbolos** | `SEMICOLON`, `EQUALSIGN`, `COMMA`, `MINUS`, `PERIOD`, `SLASH`, `GRAVEACCENT`, `BRACKETLEFT`, `BACKSLASH`, `BRACKETRIGHT`, `QUOTE` |

### Valores de Flag de Modificador

| Modificador | Valor | Binário | Uso |
|-------------|-------|---------|-----|
| Alt | 1 | 0001 | `modifiers=1` |
| Ctrl | 2 | 0010 | `modifiers=2` |
| Meta | 4 | 0100 | `modifiers=4` |
| Shift | 8 | 1000 | `modifiers=8` |
| Ctrl+Shift | 10 | 1010 | `modifiers=10` |
| Ctrl+Alt | 3 | 0011 | `modifiers=3` |
| Ctrl+Shift+Alt | 11 | 1011 | `modifiers=11` |

## Migração dos Métodos WebElement

Os métodos de teclado anteriores em `WebElement` estão obsoletos (deprecated). Veja como migrar:

### Antigo vs Novo

```python
from pydoll.constants import Key

# Antigo (depreciado)
element = await tab.find(id='input')
await element.key_down(Key.A, modifiers=2)
await element.key_up(Key.A)
await element.press_keyboard_key(Key.ENTER)

# Novo (recomendado)
await tab.keyboard.down(Key.A, modifiers=2)
await tab.keyboard.up(Key.A)
await tab.keyboard.press(Key.ENTER)
```

!!! warning "Aviso de Descontinuação"
    Os seguintes métodos de `WebElement` estão obsoletos (deprecated):

    - `key_down()` → Use `tab.keyboard.down()`
    - `key_up()` → Use `tab.keyboard.up()`
    - `press_keyboard_key()` → Use `tab.keyboard.press()`
    
    Esses métodos ainda funcionam para compatibilidade retroativa, mas emitirão avisos de descontinuação (`DeprecationWarning`).

### Por Que Migrar?

- **Centralizado**: Todas as operações de teclado em um só lugar
- **API mais limpa**: Interface consistente para todas as ações de teclado
- **Mais poderoso**: Suporte a hotkey, detecção inteligente de modificadores
- **Melhor tipagem**: Suporte completo a autocompletar da IDE

## Saiba Mais

Para capacidades adicionais de automação:

- **[Interações Humanas](human-interactions.md)**: Cliques, rolagem e movimento de mouse realistas
- **[Manipulação de Formulários](form-handling.md)**: Fluxos completos de automação de formulários
- **[Operações com Arquivos](file-operations.md)**: Automação de upload de arquivos

A API de Teclado elimina a complexidade da automação de teclado, fornecendo métodos limpos e confiáveis para tudo, desde pressionamentos simples de teclas até atalhos complexos e sequências.


================================================
FILE: docs/pt/features/automation/mouse-control.md
================================================
# Controle do Mouse

A API de Mouse fornece controle completo sobre a entrada do mouse no nível da página, permitindo simular movimentos realistas do cursor, cliques, cliques duplos e operações de arrastar. Quando `humanize=True` é passado, as operações do mouse usam simulação humanizada: as trajetórias seguem curvas de Bezier naturais com temporização pela Lei de Fitts, perfis de velocidade minimum-jerk, tremor fisiológico e correção de overshoot, tornando a automação virtualmente indistinguível do comportamento humano.

!!! info "Interface Centralizada de Mouse"
    Todas as operações do mouse são acessíveis via `tab.mouse`, fornecendo uma API limpa e unificada para todas as interações com o mouse.

## Início Rápido

```python
from pydoll.browser.chromium import Chrome
from pydoll.protocol.input.types import MouseButton

async with Chrome() as browser:
    tab = await browser.start()
    await tab.go_to('https://example.com')

    # Mover cursor para posição
    await tab.mouse.move(500, 300)

    # Clicar na posição
    await tab.mouse.click(500, 300)

    # Clique direito
    await tab.mouse.click(500, 300, button=MouseButton.RIGHT)

    # Clique duplo
    await tab.mouse.double_click(500, 300)

    # Arrastar de uma posição para outra
    await tab.mouse.drag(100, 200, 500, 400)
```

## Métodos Principais

### move: Mover Cursor

Move o cursor do mouse para uma posição específica na página:

```python
# Movimento padrão (único evento CDP, sem simulação)
await tab.mouse.move(500, 300)

# Movimento humanizado (trajetória curva com temporização natural)
await tab.mouse.move(500, 300, humanize=True)
```

**Parâmetros:**

- `x`: Coordenada X de destino (pixels CSS)
- `y`: Coordenada Y de destino (pixels CSS)
- `humanize` (keyword-only): Simular movimento curvo semelhante ao humano (padrão: `False`)

### click: Clicar na Posição

Move para a posição e realiza um clique do mouse:

```python
from pydoll.protocol.input.types import MouseButton

# Clique esquerdo (padrão, instantâneo)
await tab.mouse.click(500, 300)

# Clique direito
await tab.mouse.click(500, 300, button=MouseButton.RIGHT)

# Clique duplo via click_count
await tab.mouse.click(500, 300, click_count=2)

# Clique humanizado com movimento natural
await tab.mouse.click(500, 300, humanize=True)
```

**Parâmetros:**

- `x`: Coordenada X de destino
- `y`: Coordenada Y de destino
- `button` (keyword-only): Botão do mouse, sendo `LEFT`, `RIGHT` ou `MIDDLE` (padrão: `LEFT`)
- `click_count` (keyword-only): Número de cliques (padrão: `1`)
- `humanize` (keyword-only): Simular comportamento semelhante ao humano (padrão: `False`)

### double_click: Clique Duplo na Posição

Método de conveniência equivalente a `click(x, y, click_count=2)`:

```python
await tab.mouse.double_click(500, 300)
await tab.mouse.double_click(500, 300, humanize=True)
```

### down / up: Controle de Botão de Baixo Nível

Pressionar ou soltar botões do mouse independentemente:

```python
# Pressionar botão esquerdo na posição atual
await tab.mouse.down()

# Soltar botão esquerdo
await tab.mouse.up()

# Botão direito
await tab.mouse.down(button=MouseButton.RIGHT)
await tab.mouse.up(button=MouseButton.RIGHT)
```

Esses são primitivos que operam na posição atual do cursor e não possuem parâmetro `humanize`.

### drag: Arrastar e Soltar

Move do ponto inicial ao final mantendo o botão do mouse pressionado:

```python
# Arrastar padrão (instantâneo)
await tab.mouse.drag(100, 200, 500, 400)

# Arrastar humanizado com movimento natural
await tab.mouse.drag(100, 200, 500, 400, humanize=True)
```

**Parâmetros:**

- `start_x`, `start_y`: Coordenadas iniciais
- `end_x`, `end_y`: Coordenadas finais
- `humanize` (keyword-only): Simular arrasto semelhante ao humano (padrão: `False`)

## Habilitando a Humanização

Todos os métodos do mouse usam `humanize=False` por padrão. Para habilitar simulação humanizada com trajetórias naturais em curvas de Bezier e temporização realista, passe `humanize=True`:

```python
# Movimento humanizado, trajetória curva natural com temporização pela Lei de Fitts
await tab.mouse.move(500, 300, humanize=True)

# Clique humanizado: movimento curvo + pausa pré-clique + press + release
await tab.mouse.click(500, 300, humanize=True)

# Arrasto humanizado, curvas e pausas naturais
await tab.mouse.drag(100, 200, 500, 400, humanize=True)
```

Isso é recomendado quando a evasão de detecção é importante, por exemplo ao interagir com sites que empregam detecção de bots.

## Modo Humanizado

Quando `humanize=True` é passado, o módulo de mouse aplica múltiplas camadas de realismo:

### Trajetórias com Curvas de Bezier

O mouse segue uma trajetória curva natural em vez de uma linha reta. Os pontos de controle são deslocados aleatoriamente perpendiculares à linha início→fim, com posicionamento assimétrico (mais curvatura no início do movimento, como um alcance balístico real).

### Temporização pela Lei de Fitts

A duração do movimento segue a Lei de Fitts: `MT = a + b × log₂(D/W + 1)`. Distâncias maiores levam proporcionalmente mais tempo, correspondendo ao comportamento de controle motor humano.

### Perfil de Velocidade Minimum-Jerk

O cursor segue um perfil de velocidade em forma de sino, iniciando lento, acelerando até a velocidade máxima no meio e depois desacelerando no final. Isso corresponde à trajetória de movimento humano mais suave possível.

### Tremor Fisiológico

Ruído gaussiano pequeno (σ ≈ 1px) é adicionado a cada quadro, simulando tremor da mão. A amplitude do tremor escala inversamente com a velocidade, com mais tremor quando o cursor está lento ou parado e menos durante movimentos balísticos rápidos.

### Overshoot e Correção

Para movimentos rápidos de longa distância (~70% de probabilidade), o cursor ultrapassa o alvo em 3–12% da distância, depois faz um pequeno sub-movimento corretivo de volta ao alvo. Isso corresponde a dados reais de controle motor humano.

### Pausa Pré-Clique

Cliques humanizados incluem uma pausa pré-clique (50–200ms) que simula o tempo natural de estabilização antes de pressionar o botão.

## Cliques Humanizados Automáticos em Elementos

Quando você usa `element.click(humanize=True)`, a API do Mouse é utilizada para produzir um movimento realista com curva de Bezier da posição atual do cursor até o centro do elemento antes de clicar, tornando cliques em elementos indistinguíveis do comportamento humano.

```python
# Clique padrão: press/release CDP bruto
button = await tab.find(id='submit')
await button.click()

# Com deslocamento do centro
await button.click(x_offset=10, y_offset=5)

# Clique humanizado: movimento com curva de Bezier + clique
await button.click(humanize=True)
```

O rastreamento de posição é mantido entre cliques em elementos. Clicar no elemento A, depois no elemento B, produz um caminho curvo natural de A até B.

## Configuração Personalizada de Temporização

Todos os parâmetros de humanização são configuráveis via `MouseTimingConfig`:

```python
from pydoll.interactions.mouse import MouseTimingConfig

config = MouseTimingConfig(
    fitts_a=0.070,              # Intercepto da Lei de Fitts (segundos)
    fitts_b=0.150,              # Inclinação da Lei de Fitts (segundos/bit)
    frame_interval=0.012,       # Intervalo base entre eventos mouseMoved
    curvature_min=0.10,         # Curvatura mínima como fração da distância
    curvature_max=0.30,         # Curvatura máxima
    tremor_amplitude=1.0,       # Sigma do tremor em pixels
    overshoot_probability=0.70, # Chance de overshoot em movimentos rápidos
    min_duration=0.08,          # Duração mínima do movimento
    max_duration=2.5,           # Duração máxima do movimento
)

# Aplicar à instância de mouse do tab
tab.mouse.timing = config
```

Veja o dataclass `MouseTimingConfig` para todos os parâmetros disponíveis.

## Rastreamento de Posição

A API de Mouse rastreia a posição do cursor entre operações:

```python
# Posição inicial é (0, 0)
await tab.mouse.move(100, 200)
# Posição agora é (100, 200)

await tab.mouse.click(300, 400)
# Posição agora é (300, 400)

# Métodos de baixo nível usam a posição rastreada
await tab.mouse.down()   # Pressiona em (300, 400)
await tab.mouse.up()     # Solta em (300, 400)
```

!!! note "Estado da Posição"
    A posição do mouse é rastreada internamente. `WebElement.click()` utiliza automaticamente `tab.mouse` quando disponível, então o rastreamento de posição é mantido entre cliques em elementos.

## Modo Debug

Ative o modo debug para visualizar o movimento do mouse na página. Quando ativo, pontos coloridos são desenhados em um canvas de sobreposição transparente:

- **Pontos azuis**: trajetória do cursor durante o movimento
- **Pontos vermelhos**: posições de clique

```python
# Ativar em tempo de execução via propriedade
tab.mouse.debug = True

# Agora todos os movimentos desenham pontos coloridos
await tab.mouse.click(500, 300)

# Desativar quando terminar
tab.mouse.debug = False
```

Isso é útil para ajustar parâmetros de temporização e verificar que as trajetórias parecem naturais.

## Exemplos Práticos

### Clicar em um Botão com Movimento Realista

```python
async def click_button_naturally(tab):
    # element.click() usa automaticamente tab.mouse para movimento humanizado
    button = await tab.find(id='submit')
    await button.click()
```

### Arrastar um Slider

```python
async def drag_slider(tab):
    slider = await tab.find(css_selector='.slider-handle')
    bounds = await slider.get_bounds_using_js()

    start_x = bounds['x'] + bounds['width'] / 2
    start_y = bounds['y'] + bounds['height'] / 2
    end_x = start_x + 200  # Arrastar 200px para a direita

    await tab.mouse.drag(start_x, start_y, end_x, start_y)
```

### Passar o Mouse Sobre Elementos

```python
async def hover_menu(tab):
    menu = await tab.find(css_selector='.dropdown-trigger')
    bounds = await menu.get_bounds_using_js()

    await tab.mouse.move(
        bounds['x'] + bounds['width'] / 2,
        bounds['y'] + bounds['height'] / 2,
    )
    # O menu agora deve estar visível via CSS :hover
```

## Aprenda Mais

- **[Interações Humanas](human-interactions.md)**: Visão geral de todas as interações humanizadas
- **[Controle de Teclado](keyboard-control.md)**: Simulação realista de teclado


================================================
FILE: docs/pt/features/automation/screenshots-and-pdfs.md
================================================
# Capturas de Tela (Screenshots) e PDFs

O Pydoll oferece poderosas capacidades de captura de tela e geração de PDF através de comandos diretos do Chrome DevTools Protocol. Capture páginas inteiras, elementos específicos ou gere PDFs com controle refinado.

## Capturas de Tela

### Captura de Tela Básica da Página

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def take_page_screenshot():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com')
        
        # Salvar captura de tela em arquivo
        await tab.take_screenshot('page.png', quality=100)

asyncio.run(take_page_screenshot())
```

### Formatos Suportados

O Pydoll suporta três formatos de imagem com base na extensão do arquivo:

```python
# Formato PNG (sem perdas, tamanho de arquivo maior)
await tab.take_screenshot('screenshot.png', quality=100)

# Formato JPEG (com perdas, tamanho de arquivo menor)
await tab.take_screenshot('screenshot.jpeg', quality=85)

# Formato WebP (moderno, eficiente)
await tab.take_screenshot('screenshot.webp', quality=90)
```

!!! info "Detecção de Formato"
    O formato da imagem é determinado automaticamente pela extensão do arquivo. Usar uma extensão não suportada lança `InvalidFileExtension`.
    
    Tanto `.jpg` quanto `.jpeg` são suportados para o formato JPEG (`.jpg` é normalizado automaticamente para `.jpeg` internamente para corresponder aos requisitos do CDP).

### Parâmetros de Captura de Tela

| Parâmetro | Tipo | Padrão | Descrição |
|---|---|---|---|
| `path` | `Optional[str]` | `None` | Caminho do arquivo para salvar a captura de tela. Obrigatório se `as_base64=False`. |
| `quality` | `int` | `100` | Qualidade da imagem (0-100). Valores mais altos significam melhor qualidade e arquivos maiores. |
| `beyond_viewport` | `bool` | `False` | Captura a página inteira rolável, não apenas a área visível. |
| `as_base64` | `bool` | `False` | Retorna a string codificada em base64 em vez de salvar em arquivo. |

### Captura de Tela de Página Inteira

Capture conteúdo além da área visível (viewport):

```python
async def full_page_screenshot():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com/long-page')
        
        # Captura a página inteira, incluindo conteúdo abaixo da dobra
        await tab.take_screenshot(
            'full-page.png',
            beyond_viewport=True,
            quality=90
        )
```

!!! warning "Nota de Desempenho"
    Usar `beyond_viewport=True` em páginas muito longas pode consumir memória significativa e levar mais tempo para processar.

### Captura de Tela em Base64

Obtenha a captura de tela como string base64 para incorporar ou enviar via API:

```python
async def base64_screenshot():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com')
        
        # Obter captura de tela como string base64
        screenshot_base64 = await tab.take_screenshot(
            as_base64=True
        )
        
        # Usar em tag img HTML
        html = f'<img src="data:image/png;base64,{screenshot_base64}" />'
        
        # Ou enviar via API
        import aiohttp
        async with aiohttp.ClientSession() as session:
            await session.post(
                'https://api.example.com/upload',
                json={'image': screenshot_base64}
            )
```

### Captura de Tela de Elemento

Capture elementos específicos em vez da página inteira:

```python
async def element_screenshot():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com')
        
        # Capturar um elemento específico (PNG)
        header = await tab.find(tag_name='header')
        await header.take_screenshot('header.png', quality=100)
        
        # Capturar um formulário (JPEG)
        form = await tab.find(id='login-form')
        await form.take_screenshot('login-form.jpeg', quality=85)
        
        # Capturar um gráfico (WebP)
        chart = await tab.find(class_name='data-visualization')
        await chart.take_screenshot('chart.webp', quality=90)
```

!!! info "Detecção de Formato"
    O formato da imagem é detectado automaticamente a partir da extensão do arquivo (`.png`, `.jpeg`/`.jpg`, ou `.webp`). Usar uma extensão não suportada lança `InvalidFileExtension`.

!!! tip "Rolagem Automática"
    Ao capturar screenshots de elementos, o Pydoll rola automaticamente a página até que o elemento esteja visível antes de fazer a captura.

### Capturas de Tela de Elemento vs Página

| Característica | `tab.take_screenshot()` | `element.take_screenshot()` |
|---|---|---|
| **Escopo** | Viewport inteira ou página | Apenas elemento específico |
| **Suporte a Formato** | PNG, JPEG, WebP | PNG, JPEG, WebP |
| **Além da Viewport** | Suportado | Não aplicável |
| **Saída Base64** | Suportado | Suportado |
| **Auto-Scroll** | Não aplicável | Sim |
| **Caso de Uso** | Capturas de página inteira | Isolamento de componente, testes |


## Geração de PDF

### Exportação Básica de PDF

Converta páginas para PDF com qualidade de impressão:

```python
import asyncio
from pathlib import Path
from pydoll.browser.chromium import Chrome

async def generate_pdf():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com/document')
        
        # Gerar PDF com Path
        await tab.print_to_pdf(Path('document.pdf'))
        
        # Ou com string
        await tab.print_to_pdf('document.pdf')

asyncio.run(generate_pdf())
```

### Parâmetros de PDF

| Parâmetro | Tipo | Padrão | Descrição |
|---|---|---|---|
| `path` | `Optional[str \| Path]` | `None` | Caminho do arquivo para salvar o PDF. Obrigatório se `as_base64=False`. |
| `landscape` | `bool` | `False` | Usar orientação paisagem (vs retrato). |
| `display_header_footer` | `bool` | `False` | Incluir cabeçalho/rodapé gerado pelo navegador com título, URL, números de página. |
| `print_background` | `bool` | `True` | Incluir gráficos e cores de fundo. |
| `scale` | `float` | `1.0` | Fator de escala da página (0.1-2.0). Útil para efeitos de zoom/redução. |
| `as_base64` | `bool` | `False` | Retorna string codificada em base64 em vez de salvar em arquivo. |

!!! tip "Path vs String"
    Embora objetos `Path` do `pathlib` sejam a prática recomendada, por facilitarem a manipulação de caminhos e a compatibilidade entre plataformas, você também pode usar strings simples, se preferir.

### Opções Avançadas de PDF

```python
import asyncio
from pathlib import Path
from pydoll.browser.chromium import Chrome

async def advanced_pdf():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com/report')
        
        # PDF paisagem com cabeçalhos/rodapés
        await tab.print_to_pdf(
            Path('report-landscape.pdf'),
            landscape=True,
            display_header_footer=True,
            print_background=True,
            scale=0.9
        )
        
        # PDF retrato sem fundos (amigável à tinta)
        await tab.print_to_pdf(
            Path('report-ink-friendly.pdf'),
            landscape=False,
            print_background=False,
            scale=1.0
        )

asyncio.run(advanced_pdf())
```

### Fator de Escala do PDF

Controle o nível de zoom da saída em PDF:

```python
import asyncio
from pathlib import Path
from pydoll.browser.chromium import Chrome

async def scaled_pdfs():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com/content')
        
        # Encolher conteúdo para caber mais em cada página
        await tab.print_to_pdf(Path('compact.pdf'), scale=0.7)
        
        # Escala normal
        await tab.print_to_pdf(Path('normal.pdf'), scale=1.0)
        
        # Ampliar conteúdo (menos conteúdo por página, mais páginas)
        await tab.print_to_pdf(Path('large.pdf'), scale=1.5)

asyncio.run(scaled_pdfs())
```

!!! warning "Limites de Escala"
    O parâmetro `scale` aceita valores entre `0.1` e `2.0`. Valores fora dessa faixa podem produzir resultados inesperados.

### PDF em Base64

Gere PDF como string base64 para transmissão via API:

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def base64_pdf():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com/invoice')
        
        # Obter PDF como base64 (não precisa de caminho)
        pdf_base64 = await tab.print_to_pdf(as_base64=True)
        
        # Enviar via API
        import aiohttp
        async with aiohttp.ClientSession() as session:
            await session.post(
                'https://api.example.com/invoices',
                json={'pdf': pdf_base64}
            )

asyncio.run(base64_pdf())
```


!!! info "Referência do CDP"
    Para documentação completa do CDP sobre esses comandos, veja:
    
    - [Page.captureScreenshot](https://chromedevtools.github.io/devtools-protocol/tot/Page/#method-captureScreenshot)
    - [Page.printToPDF](https://chromedevtools.github.io/devtools-protocol/tot/Page/#method-printToPDF)

### Tratamento de Erros

```python
from pydoll.exceptions import (
    InvalidFileExtension,
    MissingScreenshotPath,
    TopLevelTargetRequired
)

async def safe_screenshot():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com')
        
        try:
            # Caminho faltando e as_base64=False
            await tab.take_screenshot()
        except MissingScreenshotPath:
            print("Erro: Deve fornecer o caminho ou definir as_base64=True")
        
        try:
            # Extensão inválida
            await tab.take_screenshot('image.bmp')
        except InvalidFileExtension as e:
            print(f"Erro: {e}")
        
        # Limitação de screenshot de IFrame
        iframe_element = await tab.find(tag_name='iframe')

        # Isso ainda não funciona: screenshots de nível superior ignoram iframes
        # await tab.take_screenshot('frame.png')

        # Capture um elemento dentro do próprio iframe
        content = await iframe_element.find(id='content')
        await content.take_screenshot('iframe-content.png')
```

## Exportação de Bundle da Página

Salve uma página inteira com todos os seus assets (CSS, JS, imagens, fontes) como um arquivo `.zip` para visualização offline.

### Uso Básico

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def save_page():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com')

        # Salvar página com assets como arquivos separados
        await tab.save_bundle('page.zip')

asyncio.run(save_page())
```

O zip resultante contém um `index.html` com todas as URLs reescritas para referenciar arquivos locais no diretório `assets/`.

### Modo Inline

Incorpore tudo diretamente em um único `index.html` usando data URIs, `<style>` e `<script>`:

```python
# Um único arquivo HTML autocontido dentro do zip
await tab.save_bundle('page-inline.zip', inline_assets=True)
```

### Parâmetros

| Parâmetro | Tipo | Padrão | Descrição |
|-----------|------|--------|-----------|
| `path` | `str \| Path` | *(obrigatório)* | Caminho de destino. Deve terminar com `.zip`. |
| `inline_assets` | `bool` | `False` | Incorporar todos os assets inline em vez de salvá-los como arquivos separados. |

!!! info "O Que é Incluído no Bundle"
    O bundle inclui recursos dos tipos: Document, Stylesheet, Script, Image, Font e Media. Recursos que falharam ao carregar, foram cancelados ou usam URIs `data:` são automaticamente ignorados.

## Aprenda Mais

Para contexto adicional sobre como screenshots e PDFs se integram com a arquitetura do Pydoll:

- **[Análise Profunda: CDP](../../deep-dive/cdp.md)**: Entendendo os comandos do Chrome DevTools Protocol
- **[Referência da API: Tab](../../api/browser/tab.md#take_screenshot)**: Assinaturas de método e parâmetros completos
- **[Referência da API: WebElement](../../api/elements/web_element.md#take_screenshot)**: Capacidades de screenshot específicas de elementos

Screenshots e PDFs são ferramentas essenciais para automação, testes e documentação. A integração direta do Pydoll com o CDP fornece saída de nível profissional com controle refinado.

================================================
FILE: docs/pt/features/browser-management/contexts.md
================================================
# Contextos de Navegador (Browser Contexts)

Contextos de Navegador são a solução do Pydoll para criar ambientes de navegação completamente isolados dentro de um único processo de navegador. Pense neles como "janelas anônimas" separadas, mas com controle programático total. Cada contexto mantém seus próprios cookies, armazenamento, cache e estado de autenticação.

## Guia Rápido

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def basic_context_example():
    async with Chrome() as browser:
        # Inicia o navegador com a aba inicial no contexto padrão
        initial_tab = await browser.start()
        await initial_tab.go_to('https://example.com')
        
        # Cria um contexto isolado
        context_id = await browser.create_browser_context()
        
        # Nova aba no contexto isolado
        isolated_tab = await browser.new_tab('https://example.com', browser_context_id=context_id)
        
        # Ambas as abas estão completamente isoladas - cookies, armazenamento, etc. diferentes
        await initial_tab.execute_script("localStorage.setItem('user', 'Alice')")
        await isolated_tab.execute_script("localStorage.setItem('user', 'Bob')")
        
        # Verifica o isolamento
        user_default = await initial_tab.execute_script("return localStorage.getItem('user')")
        user_isolated = await isolated_tab.execute_script("return localStorage.getItem('user')")
        
        print(f"Contexto padrão: {user_default}")  # Alice
        print(f"Contexto isolado: {user_isolated}")  # Bob

asyncio.run(basic_context_example())
```

## O que são Contextos de Navegador?

Um contexto de navegador é um ambiente de navegação isolado dentro de um único processo de navegador. Cada contexto mantém separadamente:

| Componente | Descrição | Nível de Isolamento |
|---|---|---|
| **Cookies** | Cookies HTTP e dados de sessão | ✓ Totalmente isolado |
| **Local Storage** | `localStorage` e `sessionStorage` | ✓ Totalmente isolado |
| **IndexedDB** | Banco de dados do lado do cliente | ✓ Totalmente isolado |
| **Cache** | Cache HTTP e recursos | ✓ Totalmente isolado |
| **Permissões** | Geolocalização, notificações, câmera, etc. | ✓ Totalmente isolado |
| **Autenticação** | Sessões de login e tokens de autenticação | ✓ Totalmente isolado |
| **Service Workers** | Scripts em segundo plano | ✓ Totalmente isolado |

```mermaid
graph LR
    Browser[Processo do Navegador] --> Default[Contexto Padrao]
    Browser --> Context1[Contexto 1]
    Browser --> Context2[Contexto 2]
    
    Default --> T1[Aba A]
    Default --> T2[Aba B]
    Context1 --> T3[Aba C]
    Context2 --> T4[Aba D]
```

## Por que Usar Contextos de Navegador?

### 1. Teste de Múltiplas Contas

Teste diferentes contas de usuário simultaneamente sem interferência:

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def perform_login(tab, email, password):
    """
    Função auxiliar para navegar até a página de login
    e enviar as credenciais da conta.
    """
    print(f"Tentando login com: {email}...")
    await tab.go_to('https://app.example.com/login')

    # Encontrar elementos
    email_field = await tab.find(id='email')
    password_field = await tab.find(id='password')
    login_btn = await tab.find(id='login-btn')

    # Preencher credenciais e clicar
    await email_field.type_text(email)
    await password_field.type_text(password)
    await login_btn.click()

    # Esperar o login processar
    await asyncio.sleep(2)
    print(f"Login bem-sucedido para {email}.")


async def multi_account_test():
    """
    Script principal para testar logins simultâneos
    usando contextos de navegador isolados.
    """
    accounts = [
        {"email": "user1@example.com", "password": "pass1"},
        {"email": "user2@example.com", "password": "pass2"},
        {"email": "admin@example.com", "password": "admin_pass"}
    ]

    # Esta lista armazenará informações de cada sessão de usuário ativa.
    user_sessions = []

    async with Chrome() as browser:
        first_account = accounts[0]
        initial_tab = await browser.start()
        await perform_login(initial_tab, first_account['email'], first_account['password'])
        user_sessions.append({
            "email": first_account['email'],
            "tab": initial_tab,
            "context_id": None  # 'None' representa o contexto padrão do navegador
        })

        # Iterar sobre o restante das contas
        for account in accounts[1:]:
            context_id = await browser.create_browser_context()
            new_tab = await browser.new_tab(browser_context_id=context_id)
            await perform_login(new_tab, account['email'], account['password'])

            # Adicionar esta nova informação de sessão à lista
            user_sessions.append({
                "email": account['email'],
                "tab": new_tab,
                "context_id": context_id
            })

        print("\n--- Verificando todas as sessões ativas ---")
        for session in user_sessions:
            tab = session["tab"]
            email = session["email"]
            await tab.go_to('https://app.example.com/dashboard')
            username = await tab.find(class_name='username')
            username_text = await username.text
            print(f"[Conta: {email}] -> Logado como: {username_text}")
            await asyncio.sleep(0.5)

        print("\n--- Limpando contextos ---")
        for session in user_sessions:
            # Fechar apenas os contextos que criamos (diferentes de None)
            if session["context_id"] is not None:
                print(f"Fechando contexto para: {session['email']}")
                await session["tab"].close()
                await browser.delete_browser_context(session["context_id"])
        
        # O contexto padrão (None) é fechado automaticamente
        # pelo 'async with Chrome() as browser'

asyncio.run(multi_account_test())
```

### 2. Teste de Geo-Localização com Proxies Específicos do Contexto

Cada contexto pode ter sua própria configuração de proxy:

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def geo_location_testing():
    async with Chrome() as browser:
        # Inicia o navegador e usa a aba inicial para o primeiro teste (contexto padrão, sem proxy)
        initial_tab = await browser.start()
        await initial_tab.go_to('https://api.ipify.org')
        await asyncio.sleep(2)
        default_ip = await initial_tab.execute_script('return document.body.textContent')
        print(f"IP Padrão (sem proxy): {default_ip}")
        
        # Contexto dos EUA com proxy dos EUA
        us_context = await browser.create_browser_context(
            proxy_server='http://us-proxy.example.com:8080'
        )
        us_tab = await browser.new_tab('https://api.ipify.org', browser_context_id=us_context)
        await asyncio.sleep(2)
        us_ip = await us_tab.execute_script('return document.body.textContent')
        print(f"IP dos EUA: {us_ip}")
        
        # Contexto da UE com proxy da UE
        eu_context = await browser.create_browser_context(
            proxy_server='http://eu-proxy.example.com:8080'
        )
        eu_tab = await browser.new_tab('https://api.ipify.org', browser_context_id=eu_context)
        await asyncio.sleep(2)
        eu_ip = await eu_tab.execute_script('return document.body.textContent')
        print(f"IP da UE: {eu_ip}")
        
        # Limpeza (pular aba inicial)
        await us_tab.close()
        await eu_tab.close()
        await browser.delete_browser_context(us_context)
        await browser.delete_browser_context(eu_context)

asyncio.run(geo_location_testing())
```

!!! tip "Autenticação de Proxy"
    O Pydoll lida automaticamente com a autenticação de proxy para contextos. Apenas inclua as credenciais na URL:
    ```python
    context_id = await browser.create_browser_context(
        proxy_server='http://username:password@proxy.example.com:8080'
    )
    ```
    As credenciais são removidas dos comandos CDP e usadas apenas quando o navegador solicita autenticação.

### 3. Teste A/B

Compare diferentes experiências de usuário em paralelo:

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def ab_testing():
    async with Chrome() as browser:
        # Inicia o navegador com a aba inicial (Grupo de Controle no contexto padrão)
        initial_tab = await browser.start()
        await initial_tab.go_to('https://example.com')
        await initial_tab.execute_script("localStorage.setItem('experiment', 'control')")
        
        # Grupo de Tratamento em contexto isolado
        context_b = await browser.create_browser_context()
        tab_b = await browser.new_tab('https://example.com', browser_context_id=context_b)
        await tab_b.execute_script("localStorage.setItem('experiment', 'treatment')")
        
        # Navega ambos para a página da funcionalidade
        await initial_tab.go_to('https://example.com/feature')
        await tab_b.go_to('https://example.com/feature')
        
        # Compara os resultados
        result_a = await initial_tab.find(class_name='experiment-result')
        result_b = await tab_b.find(class_name='experiment-result')
        
        print(f"Resultado do grupo de controle: {await result_a.text}")
        print(f"Resultado do grupo de tratamento: {await result_b.text}")
        
        # Limpeza
        await tab_b.close()
        await browser.delete_browser_context(context_b)

asyncio.run(ab_testing())
```

### 4. Raspagem Web Paralela

Raspe múltiplos sites com diferentes configurações:

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def parallel_scraping():
    websites = [
        {'url': 'https://news.ycombinator.com', 'selector': '.storylink'},
        {'url': 'https://reddit.com/r/python', 'selector': '.title'},
        {'url': 'https://github.com/trending', 'selector': '.h3'},
    ]
    
    async with Chrome() as browser:
        # Inicia o navegador e obtém a aba inicial
        initial_tab = await browser.start()
        
        # Cria contextos para os sites restantes (o primeiro usa o contexto padrão)
        contexts = [None] + [await browser.create_browser_context() for _ in websites[1:]]
        
        # Cria abas (reutilizando a aba inicial para o primeiro site)
        tabs = [initial_tab] + [
            await browser.new_tab(browser_context_id=ctx) for ctx in contexts[1:]
        ]
        
        async def scrape_site(tab, site, context_id):
            """Raspa um único site dentro da aba e contexto fornecidos."""
            try:
                await tab.go_to(site['url'])
                await asyncio.sleep(3)
                
                # Extrai títulos usando seletor CSS
                elements = await tab.query(site['selector'], find_all=True)
                titles = [await elem.text for elem in elements[:5]]
                
                return {'url': site['url'], 'titles': titles}
            finally:
                # Limpa o contexto (pula o contexto padrão da aba inicial)
                if context_id is not None:
                    await tab.close()
                    await browser.delete_browser_context(context_id)
        
        # Raspa todos os sites concorrentemente
        results = await asyncio.gather(*[
            scrape_site(tab, site, ctx) for tab, site, ctx in zip(tabs, websites, contexts)
        ])
        
        # Exibe os resultados
        for result in results:
            print(f"\n{result['url']}:")
            for i, title in enumerate(result['titles'], 1):
                print(f"  {i}. {title}")

asyncio.run(parallel_scraping())
```

## Entendendo o Desempenho do Contexto

### Contextos São Leves

!!! info "Características de Desempenho"
    Criar um contexto de navegador é **significativamente mais rápido e leve** do que lançar um novo processo de navegador:
    
    - **Criação de contexto**: ~50-100ms, sobrecarga mínima de memória
    - **Novo processo de navegador**: ~2-5 segundos, 50-150 MB de memória base
    
    Para 10 ambientes isolados:

    - **10 contextos em 1 navegador**: ~500ms de inicialização, ~500 MB no total
    - **10 navegadores separados**: ~30 segundos de inicialização, ~1-1.5 GB no total

```python
import asyncio
import time
from pydoll.browser.chromium import Chrome

async def benchmark_contexts_vs_browsers():
    # Benchmark de contextos
    start = time.time()
    async with Chrome() as browser:
        # Inicia o navegador (aba inicial não usada neste exemplo)
        await browser.start()
        
        contexts = []
        for i in range(10):
            context_id = await browser.create_browser_context()
            contexts.append(context_id)
        
        print(f"10 contextos criados em: {time.time() - start:.2f}s")
        
        # Limpeza
        for context_id in contexts:
            await browser.delete_browser_context(context_id)

asyncio.run(benchmark_contexts_vs_browsers())
```

### Headless vs Headed: O Comportamento da Janela

!!! warning "Importante: Janelas de Contexto no Modo Headed"
    Ao rodar em **modo headed** (com UI do navegador visível), há um comportamento importante a entender:
    
    **A primeira aba criada em um novo contexto abrirá uma nova janela do sistema operacional.**
    
    - Isso acontece porque o contexto precisa de uma "janela hospedeira" para renderizar sua primeira página
    - Abas subsequentes nesse contexto podem abrir como abas dentro dessa janela
    - Esta é uma limitação do CDP/Chromium, não uma escolha de design do Pydoll
    
    **No modo headless**, isso não importa — nenhuma janela é criada, tudo roda em segundo plano.

```python
import asyncio
from pydoll.browser.chromium import Chrome
from pydoll.browser.options import ChromiumOptions

async def demonstrate_window_behavior():
    # Modo headed - verá janelas
    options_headed = ChromiumOptions()
    options_headed.headless = False
    
    async with Chrome(options=options_headed) as browser:
        # Inicia o navegador com a aba inicial (abre a primeira janela no contexto padrão)
        initial_tab = await browser.start()
        await initial_tab.go_to('https://example.com')
        
        # Cria novo contexto - a primeira aba abrirá uma NOVA janela
        context = await browser.create_browser_context()
        tab2 = await browser.new_tab('https://github.com', browser_context_id=context)
        
        # Segunda aba no mesmo contexto - abre como aba na janela existente
        tab3 = await browser.new_tab('https://google.com', browser_context_id=context)
        
        await asyncio.sleep(10)  # Observe as janelas
        
        await tab2.close()
        await tab3.close()
        await browser.delete_browser_context(context)

# Modo headless - sem janelas, contextos são invisíveis mas ainda isolados
async def headless_contexts():
    options = ChromiumOptions()
    options.headless = True  # Sem janelas visíveis
    
    async with Chrome(options=options) as browser:
        # Inicia o navegador com a aba inicial no contexto padrão
        initial_tab = await browser.start()
        await initial_tab.go_to('https://example.com/page0')
        
        # Cria mais 4 contextos - nenhuma janela aberta, tudo em segundo plano
        contexts = []
        for i in range(1, 5):
            context_id = await browser.create_browser_context()
            tab = await browser.new_tab(f'https://example.com/page{i}', browser_context_id=context_id)
            contexts.append((context_id, tab))
        
        print(f"Criados {len(contexts) + 1} contextos isolados (1 padrão + {len(contexts)} personalizados, invisíveis)")
        
        # Limpeza
        for context_id, tab in contexts:
            await tab.close()
            await browser.delete_browser_context(context_id)

asyncio.run(headless_contexts())
```

!!! tip "Melhor Prática: Use Headless para Contextos"
    Para máxima eficiência com múltiplos contextos:
    
    - **Desenvolvimento/Depuração**: Use o modo headed para ver o que está acontecendo
    - **Produção/CI/CD**: Use o modo headless para execução mais rápida e leve
    - **Múltiplos contextos**: Prefira fortemente o headless para evitar a complexidade do gerenciamento de janelas

## Gerenciamento de Contexto

### Criando Contextos

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def create_context_example():
    async with Chrome() as browser:
        await browser.start()
        
        # Criar contexto básico
        context_id = await browser.create_browser_context()
        print(f"Contexto criado: {context_id}")
        
        # Criar contexto com proxy
        proxied_context = await browser.create_browser_context(
            proxy_server='http://proxy.example.com:8080',
            proxy_bypass_list='localhost,127.0.0.1'
        )
        print(f"Contexto com proxy criado: {proxied_context}")
        
        # Criar contexto com proxy autenticado
        auth_context = await browser.create_browser_context(
            proxy_server='http://user:pass@proxy.example.com:8080'
        )
        print(f"Contexto com autenticação criado: {auth_context}")

asyncio.run(create_context_example())
```

### Listando Contextos

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def list_contexts():
    async with Chrome() as browser:
        await browser.start()
        
        # Obter todos os contextos (inclui o padrão)
        contexts = await browser.get_browser_contexts()
        print(f"Contextos iniciais: {len(contexts)}")  # Geralmente 1 (padrão)
        
        # Criar contextos adicionais
        context1 = await browser.create_browser_context()
        context2 = await browser.create_browser_context()
        
        # Listar novamente
        contexts = await browser.get_browser_contexts()
        print(f"Após criar 2 novos contextos: {len(contexts)}")  # 3 no total
        
        for i, context_id in enumerate(contexts):
            print(f"  Contexto {i+1}: {context_id}")
        
        # Limpeza
        await browser.delete_browser_context(context1)
        await browser.delete_browser_context(context2)

asyncio.run(list_contexts())
```

### Deletando Contextos

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def delete_context_example():
    async with Chrome() as browser:
        await browser.start()
        
        # Criar contexto com abas
        context_id = await browser.create_browser_context()
        tab1 = await browser.new_tab('https://example.com', browser_context_id=context_id)
        tab2 = await browser.new_tab('https://github.com', browser_context_id=context_id)
        
        print(f"Contexto {context_id} criado com 2 abas")
        
        # Deletar o contexto fecha todas as suas abas automaticamente
        await browser.delete_browser_context(context_id)
        print("Contexto deletado (todas as abas fechadas automaticamente)")

asyncio.run(delete_context_example())
```

!!! warning "Deletar Contextos Fecha Todas as Abas"
    Quando você deleta um contexto de navegador, **todas as abas pertencentes a esse contexto são fechadas automaticamente**. Esta é uma maneira eficiente de limpar múltiplas abas de uma vez, mas certifique-se de ter salvo quaisquer dados importantes primeiro.

## Contexto Padrão

Todo navegador inicia com um **contexto padrão** que contém a aba inicial:

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def default_context_example():
    async with Chrome() as browser:
        # Aba inicial está no contexto padrão
        initial_tab = await browser.start()
        
        # Criar aba sem especificar contexto - usa o padrão
        default_tab = await browser.new_tab('https://example.com')
        
        # Criar contexto personalizado
        custom_context = await browser.create_browser_context()
        custom_tab = await browser.new_tab('https://github.com', browser_context_id=custom_context)
        
        # Contextos padrão e personalizado são isolados
        await default_tab.execute_script("localStorage.setItem('type', 'default')")
        await custom_tab.execute_script("localStorage.setItem('type', 'custom')")
        
        # Verificar isolamento
        default_type = await default_tab.execute_script("return localStorage.getItem('type')")
        custom_type = await custom_tab.execute_script("return localStorage.getItem('type')")
        
        print(f"Contexto padrão: {default_type}")  # 'default'
        print(f"Contexto personalizado: {custom_type}")    # 'custom'
        
        # Limpar contexto personalizado
        await browser.delete_browser_context(custom_context)

asyncio.run(default_context_example())
```

!!! info "Você Não Pode Deletar o Contexto Padrão"
    O contexto padrão do navegador é permanente e não pode ser deletado. Ele existe por toda a sessão do navegador. Apenas contextos personalizados criados com `create_browser_context()` podem ser deletados.

## Padrões Avançados

### Pool de Contextos para Isolamento Reutilizável

```python
import asyncio
from pydoll.browser.chromium import Chrome

class ContextPool:
    def __init__(self, browser, size=5):
        self.browser = browser
        self.size = size
        self.contexts = []
        self.in_use = set()
    
    async def initialize(self):
        """Criar pool de contextos"""
        for _ in range(self.size):
            context_id = await self.browser.create_browser_context()
            self.contexts.append(context_id)
        print(f"Pool de contextos inicializado com {self.size} contextos")
    
    async def acquire(self):
        """Obter contexto disponível do pool"""
        for context_id in self.contexts:
            if context_id not in self.in_use:
                self.in_use.add(context_id)
                return context_id
        raise Exception("Nenhum contexto disponível no pool")
    
    def release(self, context_id):
        """Devolver contexto ao pool"""
        self.in_use.discard(context_id)
    
    async def cleanup(self):
        """Deletar todos os contextos no pool"""
        for context_id in self.contexts:
            await self.browser.delete_browser_context(context_id)

async def use_context_pool():
    async with Chrome() as browser:
        await browser.start()
        
        # Criar pool
        pool = ContextPool(browser, size=3)
        await pool.initialize()
        
        # Usar contextos do pool
        async def scrape_with_pool(url):
            context_id = await pool.acquire()
            try:
                tab = await browser.new_tab(url, browser_context_id=context_id)
                await asyncio.sleep(2)
                title = await tab.execute_script('return document.title')
                await tab.close()
                return title
            finally:
                pool.release(context_id)
        
        # Raspar múltiplas URLs usando o pool
        urls = [f'https://example.com/page{i}' for i in range(10)]
        results = await asyncio.gather(*[scrape_with_pool(url) for url in urls])
        
        for i, title in enumerate(results):
            print(f"{urls[i]}: {title}")
        
        # Limpeza
        await pool.cleanup()

asyncio.run(use_context_pool())
```

### Gerenciador de Configuração por Contexto

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def context_config_manager():
    async with Chrome() as browser:
        await browser.start()
        
        # Definir configurações para diferentes cenários
        configs = {
            'us_user': {
                'proxy': 'http://us-proxy.example.com:8080',
                'user_agent': 'Mozilla/5.0 (Windows NT 10.0; Win64; x64)'
            },
            'eu_user': {
                'proxy': 'http://eu-proxy.example.com:8080',
                'user_agent': 'Mozilla/5.0 (X11; Linux x86_64)'
            },
            'mobile_user': {
                'proxy': None,
                'user_agent': 'Mozilla/5.0 (iPhone; CPU iPhone OS 14_0 like Mac OS X)'
            }
        }
        
        contexts = {}
        
        # Criar contexto para cada configuração
        for name, config in configs.items():
            if config['proxy']:
                context_id = await browser.create_browser_context(
                    proxy_server=config['proxy']
                )
            else:
                context_id = await browser.create_browser_context()
            
            # Criar aba e definir user agent
            tab = await browser.new_tab(browser_context_id=context_id)
            # Nota: User agent seria definido via CDP ou opções, simplificado aqui
            
            contexts[name] = {'context_id': context_id, 'tab': tab}
        
        # Usar diferentes contextos para diferentes cenários
        for name, data in contexts.items():
            tab = data['tab']
            await tab.go_to('https://httpbin.org/headers')
            await asyncio.sleep(2)
            print(f"\nConfiguração {name} ativa")
        
        # Limpeza
        for data in contexts.values():
            await data['tab'].close()
            await browser.delete_browser_context(data['context_id'])

asyncio.run(context_config_manager())
```

## Melhores Práticas

1.  **Use o modo headless para múltiplos contextos** para evitar a complexidade do gerenciamento de janelas
2.  **Sempre delete os contextos quando terminar** para evitar vazamentos de memória
3.  **Agrupe operações relacionadas no mesmo contexto** para melhor organização
4.  **Prefira contextos a múltiplos processos de navegador** para melhor desempenho
5.  **Use pools de contextos** para cenários que exigem muitos ambientes isolados de curta duração
6.  **Feche as abas antes de deletar os contextos** para uma limpeza mais organizada (embora não seja estritamente necessário)

## Veja Também

- **[Gerenciamento de Múltiplas Abas](tabs.md)** - Gerenciando múltiplas abas dentro de contextos
- **[Análise Profunda: Domínio do Navegador](../../deep-dive/browser-domain.md)** - Detalhes arquitetônicos sobre contextos
- **[Rede: Requisições HTTP](../network/http-requests.md)** - Requisições no contexto do navegador herdam o estado do contexto
- **[Conceitos Principais](../core-concepts.md)** - Entendendo a arquitetura do Pydoll

Contextos de Navegador são uma das funcionalidades mais poderosas do Pydoll para criar fluxos de trabalho de automação sofisticados. Ao entender como eles funcionam — especialmente o comportamento da janela no modo headed e sua natureza leve — você pode construir automações eficientes e escaláveis, que lidam com facilidade com cenários complexos de múltiplos ambientes.

================================================
FILE: docs/pt/features/browser-management/cookies-sessions.md
================================================
# Cookies e Sessões

Gerenciar cookies e sessões de forma eficaz é crucial para uma automação de navegador realista. Os sites usam cookies para rastrear autenticação, preferências e comportamento do usuário, e esperam que os navegadores se comportem de acordo.

## Por que os Cookies Importam para a Automação

Cookies são mais do que apenas dados armazenados; eles funcionam como uma impressão digital (fingerprint) da atividade do navegador:

- **Autenticação**: Cookies de sessão mantêm o estado de login entre as requisições
- **Prevenção de Rastreamento**: Sistemas anti-bot analisam padrões de cookies
- **Comportamento Realista**: Um navegador sem cookies parece suspeito
- **Persistência de Sessão**: Reutilizar cookies pode economizar tempo em logins repetidos

!!! warning "O Paradoxo dos Cookies"
    - **Limpo demais**: Um navegador sem cookies ou histórico parece ser um bot
    - **Antigo demais**: Usar a mesma sessão por semanas aciona alertas de segurança
    - **Ponto ideal**: Cookies novos com rotação ocasional e padrões de atividade realistas

## Guia Rápido

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def basic_cookie_management():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com')
        
        # Definir um cookie (usando um dict simples)
        cookies = [
            {
                'name': 'session_id',
                'value': 'abc123xyz',
                'domain': 'example.com',
                'path': '/',
                'secure': True,
                'httpOnly': True
            }
        ]
        await tab.set_cookies(cookies)
        
        # Obter todos os cookies
        all_cookies = await browser.get_cookies()
        print(f"Total de cookies: {len(all_cookies)}")
        
        # Deletar todos os cookies
        await tab.delete_all_cookies()

asyncio.run(basic_cookie_management())
```

## Entendendo os Tipos de Cookie

!!! info "TypedDict: Use Dicionários Regulares na Prática"
    Ao longo desta documentação, você verá referências a `CookieParam` e `Cookie`. Estes são tipos **TypedDict**: dicionários Python comuns, com dicas de tipo para o autocompletar da IDE e a verificação de tipos.
    
    **Na prática, você usa dicionários regulares:**
    ```python
    # Isso é o que você realmente escreve:
    cookie = {'name': 'session', 'value': 'abc123', 'domain': 'example.com'}
    
    # A anotação de tipo é apenas para sua IDE:
    from pydoll.protocol.network.types import CookieParam
    cookie: CookieParam = {'name': 'session', 'value': 'abc123'}
    ```
    
    Todos os exemplos abaixo usam dicionários simples por simplicidade.

### Estrutura do Cookie

O tipo `Cookie` (recuperado do navegador) contém informações completas do cookie:

```python
{
    "name": str,           # Nome do cookie
    "value": str,          # Valor do cookie
    "domain": str,         # Domínio onde o cookie é válido
    "path": str,           # Caminho onde o cookie é válido
    "expires": float,      # Timestamp Unix (0 = cookie de sessão)
    "size": int,           # Tamanho em bytes
    "httpOnly": bool,      # Acessível apenas via HTTP (não JavaScript)
    "secure": bool,        # Enviado apenas por HTTPS
    "session": bool,       # True se expira quando o navegador fecha
    "sameSite": str,       # "Strict", "Lax", ou "None"
    "priority": str,       # "Low", "Medium", ou "High"
    "sourceScheme": str,   # "Unset", "NonSecure", ou "Secure"
    "sourcePort": int,     # Porta onde o cookie foi definido
}
```

### Estrutura do CookieParam

Ao **definir** cookies, use um dict (apenas `name` e `value` são obrigatórios):

```python
# Cookie simples com apenas campos obrigatórios
cookie = {
    'name': 'user_token',
    'value': 'token_value'
}

# Cookie completo com todos os campos opcionais
cookie = {
    'name': 'user_token',       # Obrigatório
    'value': 'token_value',     # Obrigatório
    'domain': 'example.com',    # Opcional: padrão é o domínio da página atual
    'path': '/',                # Opcional: padrão é /
    'secure': True,             # Opcional: Apenas HTTPS
    'httpOnly': True,           # Opcional: sem acesso JS
    'sameSite': 'Lax',          # Opcional: 'Strict', 'Lax', ou 'None'
    'expires': 1735689600,      # Opcional: timestamp Unix
    'priority': 'High',         # Opcional: 'Low', 'Medium', ou 'High'
}
```

!!! info "Comportamento Padrão de Campos Opcionais"
    Quando você omite campos opcionais:
    
    - `domain`: Usa o domínio da página atual
    - `path`: Padrão é `/`
    - `secure`: Padrão é `False`
    - `httpOnly`: Padrão é `False`
    - `sameSite`: Padrão do navegador (geralmente `Lax`)
    - `expires`: Cookie de sessão (deletado quando o navegador fecha)

## Operações de Gerenciamento de Cookies

### Definindo Cookies

#### Definir Múltiplos Cookies de Uma Vez

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def set_multiple_cookies():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com')
        
        cookies = [
            {
                'name': 'session_id',
                'value': 'xyz789',
                'domain': 'example.com',
                'secure': True,
                'httpOnly': True,
                'sameSite': 'Strict'
            },
            {
                'name': 'preferences',
                'value': 'dark_mode=true',
                'domain': 'example.com',
                'path': '/settings'
            },
            {
                'name': 'analytics',
                'value': 'tracking_id_12345',
                'domain': 'example.com',
                'expires': 1735689600  # Expira em data específica
            }
        ]
        
        await tab.set_cookies(cookies)
        print(f"Definidos {len(cookies)} cookies")

asyncio.run(set_multiple_cookies())
```

#### Definir Cookies em Contexto Específico

```python
# Definir cookies em um contexto de navegador específico
context_id = await browser.create_browser_context()
await browser.set_cookies(cookies, browser_context_id=context_id)
```

!!! tip "Métodos de Aba vs Navegador para Definir Cookies"
    - `tab.set_cookies(cookies)`: Define cookies no contexto de navegador da aba (atalho conveniente)
    - `browser.set_cookies(cookies, browser_context_id=...)`: Define cookies com controle explícito de contexto
    
    Ambos os métodos adicionam cookies ao **contexto inteiro**, não apenas à página atual. Os cookies estarão disponíveis para todas as abas naquele contexto.

### Recuperando Cookies

#### Obter Todos os Cookies (Nível do Contexto)

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def get_cookies_example():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://github.com')
        
        # Esperar a página definir cookies
        await asyncio.sleep(2)
        
        # Opção 1: Obter cookies via aba (atalho para o contexto atual)
        cookies = await tab.get_cookies()
        
        # Opção 2: Obter cookies via navegador (controle explícito de contexto)
        # cookies = await browser.get_cookies()  # Mesmo que tab.get_cookies() para o contexto padrão
        
        print(f"Encontrados {len(cookies)} cookies:")
        for cookie in cookies:
            print(f"  - {cookie['name']}: {cookie['value'][:20]}...")
            print(f"    Domínio: {cookie['domain']}, Secure: {cookie['secure']}")

asyncio.run(get_cookies_example())
```

!!! tip "Métodos de Aba vs Navegador"
    - `tab.get_cookies()`: Retorna cookies do contexto de navegador da aba (atalho conveniente)
    - `browser.get_cookies()`: Retorna cookies do contexto padrão (ou especifique `browser_context_id`)
    
    Ambos os métodos retornam **todos os cookies** do contexto, não apenas os cookies para o domínio da página atual.

!!! warning "Limitação do Modo Incógnito"
    `browser.get_cookies()` **não funciona** com o modo incógnito nativo (flag `--incognito`). Esta é uma limitação do Chrome DevTools Protocol onde `Storage.getCookies` não consegue acessar cookies no modo incógnito nativo.
    
    **Solução:** Use `tab.get_cookies()` em vez disso, que usa `Network.getCookies` e funciona corretamente no modo incógnito.

#### Obter Cookies de Contexto Específico

```python
# Obter cookies de um contexto de navegador específico
context_id = await browser.create_browser_context()
cookies = await browser.get_cookies(browser_context_id=context_id)
```

### Deletando Cookies

#### Deletar Todos os Cookies

```python
# Deletar todos os cookies do contexto da aba atual
await tab.delete_all_cookies()

# Deletar todos os cookies de um contexto específico
await browser.delete_all_cookies(browser_context_id=context_id)
```

!!! warning "Cookies São Deletados Imediatamente"
    Quando você deleta cookies, eles são removidos do navegador imediatamente. O site pode não detectar isso até a próxima requisição ou recarregamento da página.

## Casos de Uso Práticos

### 1. Sessões de Login Persistentes

Reutilize cookies de autenticação entre execuções do script:

```python
import asyncio
import json
from pathlib import Path
from pydoll.browser.chromium import Chrome

COOKIE_FILE = Path('cookies.json')

async def save_cookies_after_login():
    """Fazer login e salvar cookies para uso futuro."""
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com/login')
        
        # Realizar login (simplificado)
        email = await tab.find(id='email')
        password = await tab.find(id='password')
        await email.type_text('user@example.com')
        await password.type_text('secret')
        
        login_btn = await tab.find(id='login')
        await login_btn.click()
        await asyncio.sleep(3)
        
        # Salvar cookies
        cookies = await browser.get_cookies()
        COOKIE_FILE.write_text(json.dumps(cookies, indent=2))
        print(f"Salvos {len(cookies)} cookies em {COOKIE_FILE}")

async def reuse_saved_cookies():
    """Carregar cookies salvos para pular o login."""
    if not COOKIE_FILE.exists():
        print("Nenhum cookie salvo encontrado. Execute save_cookies_after_login() primeiro.")
        return
    
    # Carregar cookies do arquivo
    saved_cookies = json.loads(COOKIE_FILE.read_text())
    
    # Converter para o formato CookieParam (apenas campos configuráveis)
    # Nota: get_cookies() retorna objetos Cookie detalhados com campos somente leitura
    # (size, session, sourceScheme, etc.). set_cookies() espera o formato CookieParam
    # apenas com os campos configuráveis.
    cookies_to_set = [
        {
            'name': c['name'],
            'value': c['value'],
            'domain': c['domain'],
            'path': c.get('path', '/'),
            'secure': c.get('secure', False),
            'httpOnly': c.get('httpOnly', False)
        }
        for c in saved_cookies
    ]
    
    async with Chrome() as browser:
        tab = await browser.start()
        
        # Definir cookies antes de navegar
        await tab.set_cookies(cookies_to_set)
        print(f"Carregados {len(cookies_to_set)} cookies do arquivo")
        
        # Navegar - já deve estar logado
        await tab.go_to('https://example.com/dashboard')
        await asyncio.sleep(2)
        
        # Verificar login
        try:
            username = await tab.find(class_name='username')
            print(f"Logado como: {await username.text}")
        except Exception:
            print("Login falhou - os cookies podem ter expirado")

# Primeira execução: fazer login e salvar cookies
# asyncio.run(save_cookies_after_login())

# Execuções subsequentes: reutilizar cookies
asyncio.run(reuse_saved_cookies())
```

!!! note "Reformatação de Cookies Necessária"
    `get_cookies()` retorna **objetos `Cookie` detalhados** com atributos somente leitura como `size`, `session`, `sourceScheme` e `sourcePort`. Ao usar `set_cookies()`, você deve fornecer o **formato `CookieParam`** contendo apenas os campos configuráveis (`name`, `value`, `domain`, `path`, `secure`, `httpOnly`, `sameSite`, `expires`, `priority`).
    
    A etapa de reformatação no exemplo acima é **essencial**. Passar objetos `Cookie` brutos para `set_cookies()` pode causar erros ou comportamento inesperado.

!!! tip "Expiração de Cookies"
    Sempre verifique se os cookies salvos expiraram. Cookies de sessão (`session=True`) expiram quando o navegador fecha, enquanto cookies persistentes têm um timestamp `expires` que você pode validar.

### 2. Teste de Múltiplas Contas com Cookies Isolados

Cada contexto de navegador mantém cookies separados:

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def test_multiple_accounts():
    accounts = [
        {'email': 'user1@example.com', 'cookie_value': 'session_user1'},
        {'email': 'user2@example.com', 'cookie_value': 'session_user2'},
    ]
    
    async with Chrome() as browser:
        initial_tab = await browser.start()
        
        # Primeira conta no contexto padrão
        cookies_user1 = [{
            'name': 'session',
            'value': accounts[0]['cookie_value'],
            'domain': 'example.com',
            'secure': True,
            'httpOnly': True
        }]
        await initial_tab.set_cookies(cookies_user1)
        await initial_tab.go_to('https://example.com/dashboard')
        
        # Segunda conta em contexto isolado
        context2 = await browser.create_browser_context()
        tab2 = await browser.new_tab(browser_context_id=context2)
        
        cookies_user2 = [{
            'name': 'session',
            'value': accounts[1]['cookie_value'],
            'domain': 'example.com',
            'secure': True,
            'httpOnly': True
        }]
        await browser.set_cookies(cookies_user2, browser_context_id=context2)
        await tab2.go_to('https://example.com/dashboard')
        
        # Ambos os usuários estão logados simultaneamente com sessões diferentes
        print("Usuário 1 e Usuário 2 logados com cookies isolados")
        
        await asyncio.sleep(5)
        
        # Limpeza
        await tab2.close()
        await browser.delete_browser_context(context2)

asyncio.run(test_multiple_accounts())
```

### 3. Rotação de Cookies para Scripts de Longa Duração

Atualize os cookies periodicamente para evitar detecção:

```python
import asyncio
import time
from pydoll.browser.chromium import Chrome

async def scrape_with_cookie_rotation():
    urls = [f'https://example.com/page{i}' for i in range(100)]
    
    async with Chrome() as browser:
        tab = await browser.start()
        
        # Fazer login inicialmente
        await tab.go_to('https://example.com/login')
        # ... realizar login ...
        await asyncio.sleep(2)
        
        last_rotation = time.time()
        rotation_interval = 600  # Rotacionar a cada 10 minutos
        
        for url in urls:
            # Verificar se é hora de rotacionar os cookies
            if time.time() - last_rotation > rotation_interval:
                print("Rotacionando sessão...")
                
                # Deletar cookies antigos
                await tab.delete_all_cookies()
                
                # Fazer login novamente ou carregar cookies novos
                await tab.go_to('https://example.com/login')
                # ... realizar login novamente ...
                
                last_rotation = time.time()
            
            # Raspar página
            await tab.go_to(url)
            await asyncio.sleep(2)
            # ... extrair dados ...

asyncio.run(scrape_with_cookie_rotation())
```

!!! tip "Frequência de Rotação"
    A frequência ideal de rotação depende do seu caso de uso:
    
    - **Sites de alta segurança**: Rotacione a cada 5-15 minutos
    - **Sites normais**: Rotacione a cada 30-60 minutos
    - **Raspagem de baixo risco**: Rotacione a cada poucas horas


## Referência de Atributos de Cookie

| Atributo | Tipo | Descrição | Padrão |
|---|---|---|---|
| `name` | `str` | Nome do cookie | *Obrigatório* |
| `value` | `str` | Valor do cookie | *Obrigatório* |
| `domain` | `str` | Domínio onde o cookie é válido | Domínio da página atual |
| `path` | `str` | Caminho onde o cookie é válido | `/` |
| `secure` | `bool` | Enviar apenas por HTTPS | `False` |
| `httpOnly` | `bool` | Não acessível via JavaScript | `False` |
| `sameSite` | `CookieSameSite` | Proteção CSRF: `Strict`, `Lax`, `None` | Padrão do navegador (`Lax`) |
| `expires` | `float` | Timestamp Unix (0 = cookie de sessão) | `0` (sessão) |
| `priority` | `CookiePriority` | Prioridade do cookie: `Low`, `Medium`, `High` | `Medium` |

### Valores SameSite

```python
# Use valores string diretamente no seu dict de cookie:

'sameSite': 'Strict'  # Cookie enviado apenas para requisições do mesmo site
'sameSite': 'Lax'     # Cookie enviado para navegação de nível superior (padrão)
'sameSite': 'None'    # Cookie enviado para todas as requisições (requer secure=True)

# Ou use o enum para autocompletar da IDE:
from pydoll.protocol.network.types import CookieSameSite

cookie = {
    'name': 'session',
    'value': 'xyz',
    'sameSite': CookieSameSite.STRICT  # IDE autocompletará: STRICT, LAX, NONE
}
```

### Valores de Priority

```python
# Use valores string diretamente:

'priority': 'Low'     # Baixa prioridade (deletado primeiro quando espaço é necessário)
'priority': 'Medium'  # Média prioridade (padrão)
'priority': 'High'    # Alta prioridade (deletado por último)

# Ou use o enum:
from pydoll.protocol.network.types import CookiePriority

cookie = {
    'name': 'session',
    'value': 'xyz',
    'priority': CookiePriority.HIGH  # IDE autocompletará: LOW, MEDIUM, HIGH
}
```

## Padrões Comuns

### Gerenciador de Contexto para Cookies Temporários

```python
from contextlib import asynccontextmanager

@asynccontextmanager
async def temporary_cookies(browser, tab, cookies):
    """Define cookies temporários, executa código, depois restaura os cookies originais."""
    # Salvar cookies atuais
    original_cookies = await browser.get_cookies()
    
    try:
        # Definir cookies temporários
        await tab.delete_all_cookies()
        await tab.set_cookies(cookies)
        yield tab
    finally:
        # Restaurar cookies originais
        await tab.delete_all_cookies()
        cookies_to_restore = [
            {
                'name': c['name'],
                'value': c['value'],
                'domain': c['domain'],
                'path': c.get('path', '/')
            }
            for c in original_cookies
        ]
        await tab.set_cookies(cookies_to_restore)

# Uso
async with temporary_cookies(browser, tab, test_cookies):
    await tab.go_to('https://example.com')
    # ... realizar ações com cookies temporários ...
# Cookies originais restaurados automaticamente
```

!!! tip "Usando APIs Públicas"
    Este gerenciador de contexto aceita tanto `browser` quanto `tab` como parâmetros para usar APIs públicas. Como `tab` não expõe seu `browser` pai como uma propriedade pública, passá-lo explicitamente é a abordagem recomendada para acessar métodos de nível de navegador.

### Comparação de Fingerprint de Cookies

```python
def cookie_fingerprint(cookies):
    """Gera um fingerprint simples do estado dos cookies."""
    return {
        'count': len(cookies),
        'domains': set(c['domain'] for c in cookies),
        'names': sorted(c['name'] for c in cookies),
        'secure_count': sum(1 for c in cookies if c.get('secure')),
        'httponly_count': sum(1 for c in cookies if c.get('httpOnly')),
    }

# Comparar estados de cookies
before = await browser.get_cookies()
await tab.go_to('https://example.com')
after = await browser.get_cookies()

print(f"Antes: {cookie_fingerprint(before)}")
print(f"Depois: {cookie_fingerprint(after)}")
```

## Considerações de Segurança

!!! danger "Nunca Deixe Cookies Sensíveis Fixos no Código"
    Sempre carregue cookies de autenticação de armazenamento seguro (variáveis de ambiente, arquivos criptografados, gerenciadores de segredos).
    
    ```python
    # Ruim - valor fixo no código (hardcoded)
    cookies = [{'name': 'session', 'value': 'abc123secret'}]
    
    # Bom - carregado do ambiente
    import os
    cookies = [{
        'name': 'session',
        'value': os.getenv('SESSION_COOKIE'),
        'domain': os.getenv('COOKIE_DOMAIN')
    }]
    ```

!!! warning "Proteção Contra Roubo de Cookies"
    Ao salvar cookies em disco:
    
    - Use armazenamento criptografado (ex: biblioteca `cryptography`)
    - Defina permissões restritivas de arquivo
    - Nunca envie arquivos de cookies para o controle de versão
    - Rotacione os cookies regularmente

## Resumo das Melhores Práticas

1.  **Comece com cookies realistas** - Não execute automação com um navegador completamente limpo
2.  **Rotacione sessões periodicamente** - Evite usar os mesmos cookies por longos períodos
3.  **Respeite os atributos de segurança dos cookies** - Use `secure`, `httpOnly`, `sameSite` apropriadamente
4.  **Salve e reutilize cookies de autenticação** - Pule logins repetitivos quando apropriado
5.  **Isole contextos para testes de múltiplas contas** - Cada contexto tem cookies independentes
6.  **Monitore a evolução dos cookies** - A navegação real acumula cookies naturalmente
7.  **Limpe cookies expirados** - Remova cookies inválidos antes de reutilizar
8.  **Use armazenamento seguro** - Criptografe cookies salvos, nunca deixe segredos fixos no código

## Veja Também

- **[Contextos de Navegador](contexts.md)** - Ambientes de cookies isolados
- **[Requisições HTTP](../network/http-requests.md)** - Requisições no contexto do navegador herdam cookies automaticamente
- **[Interações Semelhantes a Humanas](../automation/human-interactions.md)** - Combine cookies com comportamento realista
- **[Referência da API: Comandos de Armazenamento](../../api/commands/storage.md)** - Métodos completos de cookies do CDP

O gerenciamento eficaz de cookies é a base para uma automação de navegador realista. Ao equilibrar o frescor com a persistência e respeitar os atributos de segurança, você pode construir uma automação que se comporta como um usuário real, mantendo-se eficiente e sustentável.

================================================
FILE: docs/pt/features/browser-management/tabs.md
================================================
# Gerenciamento de Múltiplas Abas

O Pydoll oferece capacidades sofisticadas de múltiplas abas que permitem fluxos de trabalho de automação complexos, abrangendo várias abas do navegador simultaneamente. Entender como as abas funcionam no Pydoll é essencial para construir uma automação robusta e escalável.

## Entendendo as Abas no Pydoll

No Pydoll, uma instância de `Tab` representa uma única aba (ou janela) do navegador e fornece a interface principal para todas as operações de automação de página. Cada aba mantém seus próprios:

- **Contexto de execução independente**: JavaScript, DOM e estado da página
- **Manipuladores de eventos isolados**: Callbacks registrados em uma aba não afetam outras
- **Monitoramento de rede separado**: Cada aba pode rastrear sua própria atividade de rede
- **Conexão CDP única**: Comunicação WebSocket direta com o navegador

```mermaid
graph LR
    Browser[Instância do Navegador] --> Tab1[Aba 1]
    Browser --> Tab2[Aba 2]
    Browser --> Tab3[...]
    
    Tab1 --> Features1[Contexto<br/>Independente]
    Tab2 --> Features2[Contexto<br/>Independente]
```

| Componente da Aba | Descrição | Independência |
|---|---|---|
| **Contexto de Execução** | Runtime JavaScript, DOM, estado da página | ✓ Cada aba tem o seu |
| **Manipuladores de Eventos** | Callbacks registrados para eventos CDP | ✓ Isolados por aba |
| **Monitoramento de Rede** | Requisições HTTP, respostas, tempos | ✓ Rastreia separadamente |
| **Conexão CDP** | Canal de comunicação WebSocket | ✓ Conexão direta |

### O que é uma Aba de Navegador?

Uma aba de navegador é tecnicamente um **alvo (target) CDP** - um contexto de navegação isolado com seu próprio:

- Document Object Model (DOM)
- Ambiente de execução JavaScript
- Pool de conexões de rede
- Armazenamento de cookies (compartilhado com outras abas no mesmo contexto)
- Loop de eventos e motor de renderização

Cada aba tem um `target_id` único atribuído pelo navegador, que o Pydoll usa para rotear comandos e eventos corretamente.

## Gerenciamento de Instâncias de Aba

A classe `Browser` do Pydoll mantém um registro de instâncias de `Tab` com base no `target_id` de cada aba. Isso garante que múltiplas referências à mesma aba do navegador sempre retornem o mesmo objeto Tab. O Browser armazena essas instâncias em um dicionário interno `_tabs_opened`.

| Benefício | Descrição |
|---|---|
| **Eficiência de Recursos** | Uma instância de Tab por aba do navegador, sem duplicatas |
| **Estado Consistente** | Todas as referências compartilham os mesmos manipuladores de eventos e estado |
| **Segurança de Memória** | Evita múltiplas conexões WebSocket para o mesmo alvo |
| **Comportamento Previsível** | Mudanças em uma referência afetam todas as referências |

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def tab_registry_demonstration():
    async with Chrome() as browser:
        # Inicia o navegador com a aba inicial
        tab1 = await browser.start()

        # Obtém a mesma aba através de métodos diferentes
        # Nota: get_opened_tabs() retorna as abas em ordem inversa (mais nova primeiro)
        # Então a aba inicial (mais antiga) está no final
        opened_tabs = await browser.get_opened_tabs()
        tab2 = opened_tabs[-1]  # A aba inicial é a mais antiga, então é a última

        # Ambas as referências apontam para o mesmo objeto
        # porque o Browser retorna a mesma instância de seu registro
        print(f"Mesma instância? {tab1 is tab2}")  # True
        print(f"Mesmo target ID? {tab1._target_id == tab2._target_id}")  # True

        # Registrar evento em uma referência afeta a outra
        await tab1.enable_network_events()
        print(f"Eventos de rede na aba 2? {tab2.network_events_enabled}")  # True

        # O Browser mantém o registro internamente
        print(f"Aba registrada no navegador? {tab1._target_id in browser._tabs_opened}")  # True

asyncio.run(tab_registry_demonstration())
```

!!! info "Registro controlado pelo Browser"
    A classe Browser gerencia um dicionário `_tabs_opened` indexado por `target_id`. Quando você solicita uma aba (via `new_tab()` ou `get_opened_tabs()`), o Browser verifica este registro primeiro. Se uma instância de Tab já existe para aquele `target_id`, ele retorna a instância existente; caso contrário, cria uma nova e a armazena no registro. (Iframes não geram mais abas separadas — interaja com eles como elementos normais.)

## Criando e Gerenciando Abas

### Iniciando o Navegador

Quando você inicia o navegador, o Pydoll automaticamente cria e retorna uma instância de Tab para a aba inicial do navegador:

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def start_browser():
    async with Chrome() as browser:
        # Aba inicial é criada automaticamente
        tab = await browser.start()
        
        print(f"Aba criada com target ID: {tab._target_id}")
        await tab.go_to('https://example.com')
        
        title = await tab.execute_script('return document.title')
        print(f"Título da página: {title}")

asyncio.run(start_browser())
```

### Criando Abas Adicionais Programaticamente

Use `browser.new_tab()` para criar abas adicionais com controle total:

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def create_multiple_tabs():
    async with Chrome() as browser:
        # Começar com a aba inicial
        main_tab = await browser.start()
        
        # Criar abas adicionais com URLs específicas
        search_tab = await browser.new_tab('https://google.com')
        docs_tab = await browser.new_tab('https://docs.python.org')
        news_tab = await browser.new_tab('https://news.ycombinator.com')
        
        # Cada aba pode ser controlada independentemente
        await search_tab.find(name='q')  # Caixa de busca do Google
        await docs_tab.find(id='search-field')  # Busca da doc do Python
        await news_tab.find(class_name='storylink', find_all=True)  # Matérias do HN
        
        # Obter todas as abas abertas
        all_tabs = await browser.get_opened_tabs()
        print(f"Total de abas: {len(all_tabs)}")  # 4 (inicial + 3 novas)
        
        # Fechar abas específicas quando terminar
        await search_tab.close()
        await docs_tab.close()
        await news_tab.close()

asyncio.run(create_multiple_tabs())
```

!!! tip "Parâmetro de URL Opcional"
    Você pode criar abas sem especificar uma URL: `await browser.new_tab()`. A aba abrirá com uma página em branco (`about:blank`), pronta para navegação.

### Lidando com Abas Abertas pelo Usuário

Quando usuários clicam em links com `target="_blank"` ou usam "Abrir em nova aba", o Pydoll pode detectar e gerenciar essas abas:

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def handle_user_tabs():
    async with Chrome() as browser:
        main_tab = await browser.start()
        await main_tab.go_to('https://example.com')
        
        # Registrar contagem inicial de abas
        initial_tabs = await browser.get_opened_tabs()
        print(f"Abas iniciais: {len(initial_tabs)}")
        
        # Clicar em um link que abre uma nova aba (target="_blank")
        external_link = await main_tab.find(text='Open in New Tab')
        await external_link.click()
        
        # Esperar a nova aba abrir
        await asyncio.sleep(2)
        
        # Detectar novas abas
        current_tabs = await browser.get_opened_tabs()
        print(f"Abas atuais: {len(current_tabs)}")
        
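        # Encontrar a aba recém-aberta comparando os target IDs
        # (não depende da ordem retornada por get_opened_tabs())
        known_ids = {t._target_id for t in initial_tabs}
        new_tabs = [t for t in current_tabs if t._target_id not in known_ids]
        if new_tabs:
            new_tab = new_tabs[0]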
            
            # Trabalhar com a nova aba
            url = await new_tab.current_url
            print(f"URL da nova aba: {url}")
            
            await new_tab.go_to('https://different-site.com')
            title = await new_tab.execute_script('return document.title')
            print(f"Título da nova aba: {title}")
            
            # Fechá-la quando terminar
            await new_tab.close()

asyncio.run(handle_user_tabs())
```

### Listando Todas as Abas Abertas

Use `browser.get_opened_tabs()` para recuperar todas as abas atualmente abertas:

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def list_tabs():
    async with Chrome() as browser:
        # Usar a aba inicial retornada pelo start()
        initial_tab = await browser.start()
        await initial_tab.go_to('https://example.com')
        
        # Abrir várias outras abas
        await browser.new_tab('https://github.com')
        await browser.new_tab('https://stackoverflow.com')
        await browser.new_tab('https://reddit.com')
        
        # Obter todas as abas
        all_tabs = await browser.get_opened_tabs()
        
        # Inspecionar cada aba
        for i, tab in enumerate(all_tabs, 1):
            url = await tab.current_url
            title = await tab.execute_script('return document.title')
            print(f"Aba {i}: {title} - {url}")

asyncio.run(list_tabs())
```

## Operações Concorrentes de Abas

A arquitetura assíncrona do Pydoll permite fluxos de trabalho concorrentes poderosos em múltiplas abas:

### Coleta de Dados Paralela

Processe múltiplas páginas simultaneamente para máxima eficiência:

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def scrape_page(tab, url):
    """Raspar uma única página dentro de uma aba específica."""
    await tab.go_to(url)
    title = await tab.execute_script('return document.title')
    articles = await tab.find(class_name='article', find_all=True)
    content = [await article.text for article in articles[:5]]

    return {
        'url': url,
        'title': title,
        'articles_count': len(articles),
        'sample_content': content
    }

async def concurrent_scraping():
    urls = [
        'https://example.com/page1',
        'https://example.com/page2',
        'https://example.com/page3',
        'https://example.com/page4',
    ]

    async with Chrome() as browser:
        # Iniciar o navegador e abrir a primeira aba
        initial_tab = await browser.start()
        # Criar uma aba por URL
        tabs = [initial_tab] + [await browser.new_tab() for _ in urls[1:]]

        # Executar todos os scrapers concorrentemente
        results = await asyncio.gather(*[
            scrape_page(tab, url) for tab, url in zip(tabs, urls)
        ])

        # Exibir resultados
        for result in results:
            print(f"\n{result['title']}")
            print(f"  URL: {result['url']}")
            print(f"  Artigos: {result['articles_count']}")
            if result['sample_content']:
                print(f"  Amostra: {result['sample_content'][0][:100]}...")

asyncio.run(concurrent_scraping())
```

!!! tip "Ganho de Desempenho"
    A raspagem concorrente pode reduzir o tempo total de execução em 5 a 10 vezes em comparação com o processamento sequencial, especialmente para tarefas limitadas por I/O (entrada/saída) como carregamento de página.

### Fluxos de Trabalho Coordenados de Múltiplas Abas

Orquestre fluxos de trabalho complexos que exigem a interação de múltiplas abas:

```python
import asyncio
from pydoll.browser.chromium import Chrome
from pydoll.protocol.network.events import NetworkEvent, RequestWillBeSentEvent

async def multi_tab_workflow():
    async with Chrome() as browser:
        # Usar a aba inicial para login
        login_tab = await browser.start()
        await login_tab.go_to('https://app.example.com/login')
        await asyncio.sleep(2)
        
        username = await login_tab.find(id='username')
        password = await login_tab.find(id='password')
        
        await username.type_text('admin@example.com')
        await password.type_text('secure_password')
        
        login_btn = await login_tab.find(id='login')
        await login_btn.click()
        await asyncio.sleep(3)
        
        # Aba 2: Navegar para a página de exportação de dados
        export_tab = await browser.new_tab('https://app.example.com/export')
        await asyncio.sleep(2)
        
        export_btn = await export_tab.find(text='Export Data')
        await export_btn.click()
        
        # Aba 3: Monitorar chamadas de API em um dashboard
        monitor_tab = await browser.new_tab('https://app.example.com/dashboard')
        await monitor_tab.enable_network_events()
        
        # Rastrear chamadas de API
        api_calls = []
        async def track_api(event: RequestWillBeSentEvent):
            url = event['params']['request']['url']
            if '/api/' in url:
                api_calls.append(url)
        
        await monitor_tab.on(NetworkEvent.REQUEST_WILL_BE_SENT, track_api)
        await asyncio.sleep(5)
        
        print(f"Rastreadas {len(api_calls)} chamadas de API:")
        for call in api_calls[:10]:
            print(f"  - {call}")
        
        # Limpeza
        await login_tab.close()
        await export_tab.close()
        await monitor_tab.close()

asyncio.run(multi_tab_workflow())
```

## Ciclo de Vida e Limpeza da Aba

### Fechamento Explícito de Aba

Sempre feche as abas quando terminar de usá-las para liberar recursos do navegador:

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def explicit_cleanup():
    async with Chrome() as browser:
        initial_tab = await browser.start()
        
        # Criar abas para diferentes tarefas
        tab1 = await browser.new_tab('https://example.com')
        tab2 = await browser.new_tab('https://example.org')
        
        # Trabalhar com as abas
        await tab1.go_to('https://different-site.com')
        await tab2.take_screenshot('/tmp/screenshot.png')
        
        # Fechar abas explicitamente
        await tab1.close()
        await tab2.close()
        
        # Verificar se as abas estão fechadas
        remaining = await browser.get_opened_tabs()
        print(f"Abas restantes: {len(remaining)}")  # Deve ser 1 (inicial)

asyncio.run(explicit_cleanup())
```

!!! warning "Vazamentos de Memória"
    Deixar de fechar abas em automações de longa duração pode levar ao esgotamento da memória. Cada aba consome recursos do navegador (memória, handles de arquivo, conexões de rede).

### Usando Gerenciadores de Contexto para Limpeza Automática

Embora o Pydoll não forneça um gerenciador de contexto de aba nativo, você pode criar o seu:

```python
import asyncio
from contextlib import asynccontextmanager
from pydoll.browser.chromium import Chrome

@asynccontextmanager
async def managed_tab(browser, url=None):
    """Gerenciador de contexto para limpeza automática de abas."""
    tab = await browser.new_tab(url)
    try:
        yield tab
    finally:
        await tab.close()

async def auto_cleanup_example():
    async with Chrome() as browser:
        initial_tab = await browser.start()
        
        # Aba fecha automaticamente ao sair do contexto
        async with managed_tab(browser, 'https://example.com') as tab:
            title = await tab.execute_script('return document.title')
            print(f"Título: {title}")
            
            await tab.take_screenshot('/tmp/page.png')
        # Aba é fechada automaticamente aqui
        
        tabs = await browser.get_opened_tabs()
        print(f"Abas após sair do contexto: {len(tabs)}")  # 1 (apenas initial_tab)

asyncio.run(auto_cleanup_example())
```

### Limpeza do Navegador

Quando o navegador fecha, todas as abas são fechadas automaticamente:

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def browser_cleanup():
    # Usando gerenciador de contexto - limpeza automática
    async with Chrome() as browser:
        initial_tab = await browser.start()
        
        # Criar múltiplas abas
        await browser.new_tab('https://example.com')
        await browser.new_tab('https://github.com')
        await browser.new_tab('https://stackoverflow.com')
        
        tabs = await browser.get_opened_tabs()
        print(f"Abas abertas: {len(tabs)}")  # 4 (inicial + 3 novas)
    
    # Todas as abas são fechadas automaticamente quando o navegador sai
    print("Navegador fechado, todas as abas limpas")

asyncio.run(browser_cleanup())
```

## Gerenciamento de Estado da Aba

### Verificando o Estado da Aba

Consulte vários aspectos do estado atual de uma aba:

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def check_tab_state():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com')
        
        # Verificar URL atual
        url = await tab.current_url
        print(f"URL Atual: {url}")
        
        # Verificar código-fonte da página
        source = await tab.page_source
        print(f"Tamanho do código-fonte: {len(source)} caracteres")
        
        # Verificar domínios de eventos habilitados
        print(f"Eventos de página habilitados: {tab.page_events_enabled}")
        print(f"Eventos de rede habilitados: {tab.network_events_enabled}")
        print(f"Eventos DOM habilitados: {tab.dom_events_enabled}")
        
        # Habilitar eventos e verificar novamente
        await tab.enable_network_events()
        print(f"Eventos de rede habilitados: {tab.network_events_enabled}")  # True

asyncio.run(check_tab_state())
```

### Identificação da Aba

Cada aba possui identificadores únicos:

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def tab_identification():
    async with Chrome() as browser:
        tab1 = await browser.start()
        tab2 = await browser.new_tab()
        
        # Target ID - identificador único atribuído pelo navegador
        print(f"Target ID da Aba 1: {tab1._target_id}")
        print(f"Target ID da Aba 2: {tab2._target_id}")
        
        # Detalhes da conexão
        print(f"Porta de conexão da Aba 1: {tab1._connection_port}")
        print(f"Porta de conexão da Aba 2: {tab2._connection_port}")
        
        # ID do contexto do navegador (geralmente None para o contexto padrão)
        print(f"ID do contexto da Aba 1: {tab1._browser_context_id}")
        print(f"ID do contexto da Aba 2: {tab2._browser_context_id}")

asyncio.run(tab_identification())
```

## Funcionalidades Avançadas de Aba

### Trazendo Abas para a Frente

Torne uma aba específica visível (trazer para o primeiro plano):

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def bring_to_front():
    async with Chrome() as browser:
        tab1 = await browser.start()
        tab2 = await browser.new_tab('https://github.com')
        tab3 = await browser.new_tab('https://stackoverflow.com')
        
        # tab3 está atualmente na frente (última criada)
        await asyncio.sleep(2)
        
        # Trazer tab1 para a frente
        await tab1.bring_to_front()
        print("Aba 1 trazida para a frente")
        
        await asyncio.sleep(2)
        
        # Trazer tab2 para a frente
        await tab2.bring_to_front()
        print("Aba 2 trazida para a frente")

asyncio.run(bring_to_front())
```

### Monitoramento de Rede Específico da Aba

Cada aba pode monitorar independentemente sua própria atividade de rede:

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def tab_network_monitoring():
    async with Chrome() as browser:
        # Usar aba inicial para navegação monitorada
        tab1 = await browser.start()
        await tab1.go_to('https://example.com')
        
        # Criar segunda aba sem monitoramento
        tab2 = await browser.new_tab('https://github.com')
        
        # Habilitar monitoramento de rede apenas na aba 1
        await tab1.enable_network_events()
        
        # Navegar em ambas as abas
        await tab1.go_to('https://example.com/page1')
        await tab2.go_to('https://github.com/explore')
        
        await asyncio.sleep(3)
        
        # Obter logs de rede apenas da aba 1
        tab1_logs = await tab1.get_network_logs()
        print(f"Requisições de rede da Aba 1: {len(tab1_logs)}")
        
        # tab2 não tem monitoramento de rede
        print(f"Eventos de rede da Aba 2 habilitados: {tab2.network_events_enabled}")  # False

asyncio.run(tab_network_monitoring())
```

### Manipuladores de Eventos Específicos da Aba

Registre diferentes manipuladores de eventos em diferentes abas:

```python
import asyncio
from pydoll.browser.chromium import Chrome
from pydoll.protocol.page.events import PageEvent

async def tab_specific_events():
    async with Chrome() as browser:
        # Usar aba inicial como primeira aba
        tab1 = await browser.start()
        tab2 = await browser.new_tab()
        
        # Habilitar eventos de página em ambas
        await tab1.enable_page_events()
        await tab2.enable_page_events()
        
        # Manipuladores diferentes para cada aba
        async def tab1_handler(event):
            print("Aba 1 carregada!")
        
        async def tab2_handler(event):
            print("Aba 2 carregada!")
        
        await tab1.on(PageEvent.LOAD_EVENT_FIRED, tab1_handler)
        await tab2.on(PageEvent.LOAD_EVENT_FIRED, tab2_handler)
        
        # Navegar em ambas as abas
        await tab1.go_to('https://example.com')
        await tab2.go_to('https://github.com')
        
        await asyncio.sleep(2)

asyncio.run(tab_specific_events())
```

## Considerações de Desempenho

| Cenário | Impacto nos Recursos | Recomendação |
|---|---|---|
| **1-5 abas** | Baixo | Gerenciamento direto, sem tratamento especial |
| **5-20 abas** | Moderado | Usar semáforos para limitar concorrência |
| **20-50 abas** | Alto | Processamento em lote, fechar abas agressivamente |
| **50+ abas** | Muito Alto | Considerar processamento sequencial ou múltiplos navegadores |

### Uso de Memória

Cada aba consome aproximadamente:

- **Memória base**: 50-100 MB
- **Com eventos de rede**: +10-20 MB
- **Com eventos DOM**: +20-50 MB
- **Página complexa (SPA)**: +100-300 MB

Para 20 abas com monitoramento de rede (20 × 60-120 MB): ~1,2-2,4 GB de memória.

## Padrões Comuns

### Processamento Sequencial com Aba Única

```python
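import asyncio
from pydoll.browser.chromium import Chrome

urls = ['https://example.com/page1', 'https://example.com/page2']

async def sequential_pattern():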
    async with Chrome() as browser:
        tab = await browser.start()
        
        for url in urls:
            await tab.go_to(url)
            # Extrair dados
            await tab.clear_callbacks()  # Limpar eventos

asyncio.run(sequential_pattern())
```

### Processamento Paralelo com Múltiplas Abas

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def parallel_pattern():
    urls = [
        'https://example.com/page1',
        'https://example.com/page2',
        'https://example.com/page3',
        'https://example.com/page4',
    ]

    async with Chrome() as browser:
        # Iniciar navegador e obter aba inicial
        initial_tab = await browser.start()
        # Criar uma aba por URL (reutilizando a inicial para a primeira)
        tabs = [initial_tab] + [await browser.new_tab() for _ in urls[1:]]

        async def process_page(tab, url):
            """Processar uma única página dentro da aba fornecida."""
            try:
                await tab.go_to(url)
                await asyncio.sleep(2)
                title = await tab.execute_script('return document.title')
                print(f"[{url}] {title}")
            finally:
                if tab is not initial_tab:
                    await tab.close()

        # Executar todas as abas concorrentemente
        await asyncio.gather(*[
            process_page(tab, url) for tab, url in zip(tabs, urls)
        ])

asyncio.run(parallel_pattern())
```

### Padrão de Pool de Workers

```python
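import asyncio
from pydoll.browser.chromium import Chrome

urls = ['https://example.com/page1', 'https://example.com/page2']

async def worker_pool_pattern():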
    async with Chrome() as browser:
        # Usar aba inicial como primeiro worker
        initial_tab = await browser.start()
        
        # Criar abas worker adicionais (5 workers no total: 1 inicial + 4 novas)
        workers = [initial_tab] + [await browser.new_tab() for _ in range(4)]
        
        # Distribuir trabalho entre todos os workers
        for i, url in enumerate(urls):
            worker = workers[i % len(workers)]
            await worker.go_to(url)
            # Processar...
        
        # Limpar todos os workers (incluindo aba inicial)
        for worker in workers:
            await worker.close()

asyncio.run(worker_pool_pattern())
```

!!! tip "Reutilizando a Aba Inicial"
    Sempre use a aba retornada por `browser.start()` em vez de deixá-la ociosa. Isso economiza recursos do navegador e melhora o desempenho. Nos exemplos acima, a aba inicial é reutilizada como o primeiro worker ou para a primeira URL do lote.

## Veja Também

- **[Contextos de Navegador](contexts.md)** - Sessões de navegador isoladas
- **[Cookies e Sessões](cookies-sessions.md)** - Gerenciando cookies entre abas
- **[Sistema de Eventos](../advanced/event-system.md)** - Manipulação de eventos específica da aba
- **[Raspagem Concorrente](../../features.md#concurrent-scraping)** - Exemplos do mundo real

O gerenciamento de múltiplas abas no Pydoll fornece a base para construir automação de navegador escalável e eficiente. Ao entender o ciclo de vida da aba, o padrão singleton e as melhores práticas, você pode criar fluxos de trabalho de automação robustos que lidam com cenários complexos de múltiplas páginas com facilidade.

================================================
FILE: docs/pt/features/configuration/browser-options.md
================================================
# Opções do Navegador (ChromiumOptions)

`ChromiumOptions` é seu hub central de configuração para personalizar o comportamento do navegador. Ele controla tudo, desde argumentos de linha de comando e localização do binário até estados de carregamento de página e preferências de conteúdo.

!!! info "Documentação Relacionada"
    - **[Preferências do Navegador](browser-preferences.md)** - Análise profunda do sistema interno de preferências do Chromium
    - **[Gerenciamento do Navegador](../browser-management/tabs.md)** - Trabalhando com instâncias e abas do navegador
    - **[Contextos](../browser-management/contexts.md)** - Contextos de navegação isolados

## Guia Rápido

```python
import asyncio
from pydoll.browser.chromium import Chrome
from pydoll.browser.options import ChromiumOptions
from pydoll.constants import PageLoadState

async def main():
    # Criar e configurar opções
    options = ChromiumOptions()
    
    # Configuração básica
    options.headless = True
    options.start_timeout = 15
    options.page_load_state = PageLoadState.INTERACTIVE
    
    # Adicionar argumentos de linha de comando
    options.add_argument('--disable-gpu')
    options.add_argument('--window-size=1920,1080')
    
    # Métodos auxiliares para configurações comuns
    options.block_notifications = True
    options.block_popups = True
    options.set_default_download_directory('/tmp/downloads')
    
    # Usar as opções configuradas
    async with Chrome(options=options) as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com')

asyncio.run(main())
```

## Propriedades Principais

### Argumentos de Linha de Comando

O Chromium suporta centenas de "switches" (opções) de linha de comando que controlam o comportamento do navegador no nível mais profundo. Use `add_argument()` para passar flags diretamente para o processo do navegador.

```python
options = ChromiumOptions()

# Adicionar argumento único
options.add_argument('--disable-blink-features=AutomationControlled')

# Adicionar argumento com valor
options.add_argument('--window-size=1920,1080')
options.add_argument('--user-agent=Mozilla/5.0 ...')

# Remover argumento se necessário
options.remove_argument('--window-size=1920,1080')

# Obter todos os argumentos
all_args = options.arguments
```

!!! tip "Formato dos Argumentos"
    - Argumentos começando com `--` são flags: `--headless`, `--disable-gpu`
    - Argumentos com `=` têm valores: `--window-size=1920,1080`
    - Alguns aceitam múltiplos valores: `--disable-features=Feature1,Feature2`

**Veja a [Referência de Argumentos de Linha de Comando](#referência-de-argumentos-de-linha-de-comando) abaixo para listas abrangentes.**

### Localização do Binário

Especifique um executável de navegador personalizado em vez de usar o padrão do sistema:

```python
options = ChromiumOptions()

# Linux
options.binary_location = '/opt/google/chrome-beta/chrome'

# macOS
options.binary_location = '/Applications/Google Chrome Canary.app/Contents/MacOS/Google Chrome Canary'

# Windows
options.binary_location = r'C:\Program Files\Google\Chrome Beta\Application\chrome.exe'
```

!!! info "Quando Definir a Localização do Binário"
    - Testar diferentes versões do Chrome (Estável, Beta, Canary)
    - Usar o Chromium em vez do Chrome
    - Usar instalações portáteis do navegador
    - Executar compilações específicas para depuração

### Timeout de Inicialização

Controle quanto tempo o Pydoll espera para o navegador iniciar e responder:

```python
options = ChromiumOptions()
options.start_timeout = 20  # segundos (padrão: 10)
```

!!! warning "Considerações sobre Timeout"
    - **Muito baixo**: O navegador pode não inicializar completamente, causando falhas na inicialização
    - **Muito alto**: Travamentos bloquearão sua automação por mais tempo
    - **Recomendado**: 10-15s para a maioria dos casos, 20-30s para sistemas lentos ou perfis de navegador pesados

### Modo Headless (Sem Interface Gráfica)

Execute o navegador sem uma interface de usuário visível:

```python
options = ChromiumOptions()
options.headless = True  # Adiciona automaticamente o argumento --headless

# Ou manualmente (as linhas abaixo são alternativas; use apenas uma delas)
options.add_argument('--headless')
options.add_argument('--headless=new')  # Novo modo headless (Chrome 109+)
```

| Modo | Argumento | Descrição |
|---|---|---|
| **Headful** (Com UI) | (nenhum) | Janela do navegador visível (padrão) |
| **Headless Clássico** | `--headless` | Modo headless legado |
| **Novo Headless** | `--headless=new` | Modo headless moderno (Chrome 109+, melhor compatibilidade) |

!!! tip "Novo Modo Headless"
    O modo `--headless=new` (Chrome 109+) oferece melhor compatibilidade com recursos web modernos e é mais difícil de detectar. Use-o para automação em produção.

### Estado de Carregamento da Página

Controle quando o `tab.go_to()` considera uma página "carregada":

```python
from pydoll.constants import PageLoadState

options = ChromiumOptions()
options.page_load_state = PageLoadState.INTERACTIVE  # ou PageLoadState.COMPLETE
```

| Estado | Quando a Navegação Completa | Caso de Uso |
|---|---|---|
| `COMPLETE` (padrão) | Evento `load` disparado, todos os recursos carregados | Esperar por imagens, fontes, scripts |
| `INTERACTIVE` | `DOMContentLoaded` disparado, DOM pronto | Navegação mais rápida, interagir com o DOM imediatamente |

```python
import asyncio
import time
from pydoll.browser.chromium import Chrome
from pydoll.browser.options import ChromiumOptions
from pydoll.constants import PageLoadState

async def compare_load_states():
    # Modo Complete - espera por tudo
    options_complete = ChromiumOptions()
    options_complete.page_load_state = PageLoadState.COMPLETE

    async with Chrome(options=options_complete) as browser:
        tab = await browser.start()

        start = time.time()
        await tab.go_to('https://example.com')
        complete_time = time.time() - start
        print(f"Modo COMPLETE: {complete_time:.2f}s")
    
    # Modo Interactive - DOM pronto é suficiente
    options_interactive = ChromiumOptions()
    options_interactive.page_load_state = PageLoadState.INTERACTIVE
    
    async with Chrome(options=options_interactive) as browser:
        tab = await browser.start()
        
        start = time.time()
        await tab.go_to('https://example.com')
        interactive_time = time.time() - start
        print(f"Modo INTERACTIVE: {interactive_time:.2f}s")

asyncio.run(compare_load_states())
```

!!! tip "Quando Usar INTERACTIVE"
    Use `INTERACTIVE` quando:
    
    - Você só precisa de acesso ao DOM, não de imagens/fontes
    - Você está raspando conteúdo de texto e estrutura
    - A velocidade é crítica
    - A página tem muitos recursos de carregamento lento
    
    Mantenha `COMPLETE` (padrão) quando:
    
    - Você vai tirar screenshots (precisa de imagens carregadas)
    - Você precisa esperar aplicações pesadas em JavaScript inicializarem completamente
    - Você está testando o desempenho de carregamento da página

## Referência de Argumentos de Linha de Comando

O Chromium suporta centenas de "switches" de linha de comando. Abaixo estão os mais úteis para automação, organizados por categoria.

!!! info "Referência Completa"
    Lista completa de todos os switches do Chromium: [Switches de Linha de Comando do Chromium por Peter Beverloo](https://peter.sh/experiments/chromium-command-line-switches/)

### Desempenho e Gerenciamento de Recursos

Otimize o desempenho do navegador para uma automação mais rápida:

```python
options = ChromiumOptions()

# Desabilitar aceleração de GPU (headless, Docker, CI/CD)
options.add_argument('--disable-gpu')
options.add_argument('--disable-software-rasterizer')

# Reduzir uso de memória
options.add_argument('--disable-dev-shm-usage')  # Docker: supera o limite de tamanho do /dev/shm
options.add_argument('--disable-extensions')
options.add_argument('--disable-background-networking')

# Desabilitar recursos desnecessários
options.add_argument('--disable-sync')  # Sincronização de conta Google
options.add_argument('--disable-translate')
options.add_argument('--disable-background-timer-throttling')
options.add_argument('--disable-backgrounding-occluded-windows')
options.add_argument('--disable-renderer-backgrounding')

# Otimizações de rede
options.add_argument('--disable-features=NetworkPrediction')
options.add_argument('--dns-prefetch-disable')

# Janela e renderização
options.add_argument('--window-size=1920,1080')
options.add_argument('--window-position=0,0')
options.add_argument('--force-device-scale-factor=1')
```

| Argumento | Efeito | Quando Usar |
|---|---|---|
| `--disable-gpu` | Sem aceleração por GPU | Headless, Docker, servidores sem GPU |
| `--disable-dev-shm-usage` | Usar `/tmp` em vez de `/dev/shm` | Contêineres Docker com memória compartilhada pequena |
| `--disable-extensions` | Não carregar nenhuma extensão | Navegador limpo e rápido para automação |
| `--window-size=W,H` | Definir dimensões iniciais da janela | Screenshots, viewport consistente |
| `--force-device-scale-factor=1` | Desabilitar escalonamento high-DPI | Renderização consistente entre sistemas |

### Furtividade (Stealth) e Fingerprinting

Torne sua automação mais difícil de detectar com estes argumentos de linha de comando:

| Argumento | Propósito | Exemplo |
|---|---|---|
| `--disable-blink-features=AutomationControlled` | Remove a flag `navigator.webdriver` | Essencial para furtividade |
| `--user-agent=...` | Define um user agent realista e comum | Corresponder à região/dispositivo alvo |
| `--use-gl=swiftshader` | Renderizador WebGL por software | Evitar fingerprints de GPU únicos |
| `--force-webrtc-ip-handling-policy=...` | Prevenir vazamentos de IP via WebRTC | Usar `disable_non_proxied_udp` |
| `--lang=en-US` | Definir idioma do navegador | Corresponder ao locale alvo |
| `--accept-lang=en-US,en;q=0.9` | Cabeçalho Accept-Language | Preferências de idioma realistas |
| `--tz=America/New_York` | Definir fuso horário | Corresponder à região alvo |
| `--no-first-run` | Pular assistentes de primeira execução | Automação mais limpa |
| `--no-default-browser-check` | Pular aviso de navegador padrão | Evitar interrupções na UI |
| `--disable-reading-from-canvas` | Mitigação de fingerprinting de Canvas | Reduzir singularidade |
| `--disable-features=AudioServiceOutOfProcess` | Mitigação de fingerprinting de Áudio | Reduzir singularidade |

!!! warning "Corrida Armamentista da Detecção"
    Nenhuma técnica isolada garante a indetectabilidade. Combine múltiplas estratégias:
    
    1.  **Argumentos de linha de comando** (esta tabela)
    2.  **Preferências do navegador** - [Preferências do Navegador - Furtividade e Fingerprinting](browser-preferences.md#stealth-fingerprinting)
    3.  **Interações semelhantes a humanas** - [Interações Semelhantes a Humanas](../automation/human-interactions.md)
    4.  **Boa reputação de IP** - Use proxies residenciais com histórico limpo

### Segurança e Privacidade

Controle recursos de segurança e configurações de privacidade:

```python
options = ChromiumOptions()

# Sandbox (desabilite apenas para Docker/CI)
options.add_argument('--no-sandbox')  # RISCO DE SEGURANÇA - use apenas em ambientes controlados
options.add_argument('--disable-setuid-sandbox')

# HTTPS/SSL
options.add_argument('--ignore-certificate-errors')  # Ignorar erros SSL
options.add_argument('--ignore-ssl-errors')
options.add_argument('--allow-insecure-localhost')

# Privacidade
options.add_argument('--disable-features=Translate')
options.add_argument('--disable-sync')
options.add_argument('--incognito')  # Abrir em modo anônimo

# Concessão automática de permissões (para testes)
options.add_argument('--use-fake-ui-for-media-stream')  # Conceder automaticamente câmera/microfone
options.add_argument('--use-fake-device-for-media-stream')  # Usar dispositivos falsos
```

!!! danger "Avisos sobre o Sandbox"
    **`--no-sandbox` é um risco de segurança!** Use-o apenas quando:
    
    - Você está rodando em contêineres Docker (o sandbox conflita com o isolamento do contêiner)
    - Você está em ambientes de CI/CD com permissões restritas
    - Você confia totalmente no conteúdo sendo carregado
    
    **Nunca** use `--no-sandbox` quando:
    
    - Você está visitando sites não confiáveis
    - Você está rodando código enviado por usuários
    - Você está em ambientes de produção com entrada externa

| Argumento | Efeito | Impacto na Segurança |
|---|---|---|
| `--no-sandbox` | Desabilita o sandbox do Chrome | **ALTO RISCO** - Permite execução de código |
| `--ignore-certificate-errors` | Pula validação SSL | **RISCO MÉDIO** - Possibilita ataques MITM |
| `--incognito` | Modo de navegação privada | Mais seguro - sem estado persistente |

### Depuração e Desenvolvimento

Ferramentas para depurar automação e desenvolvimento:

```python
options = ChromiumOptions()

# DevTools
options.add_argument('--auto-open-devtools-for-tabs')

# Logging
options.add_argument('--enable-logging')
options.add_argument('--v=1')  # Nível de verbosidade (0-3)
options.add_argument('--log-level=0')  # 0=INFO, 1=WARNING, 2=ERROR

# Tratamento de falhas
options.add_argument('--disable-crash-reporter')
options.add_argument('--no-crash-upload')

# Habilitar recursos experimentais
options.add_argument('--enable-features=NetworkService,NetworkServiceInProcess')
options.add_argument('--enable-experimental-web-platform-features')

# Depuração de JavaScript
options.add_argument('--js-flags=--expose-gc')  # Expõe o coletor de lixo
```

!!! tip "Depuração Remota"
    O Pydoll gerencia automaticamente a porta de depuração remota. Para acessar o Chrome DevTools:
    
    ```python
    async with Chrome() as browser:
        tab = await browser.start()
        
        # Obter a porta de depuração
        port = browser._connection_port
        print(f"DevTools disponível em: http://localhost:{port}")
        
        # Abra esta URL no seu navegador para acessar o DevTools
    ```
    
    **Não** use o argumento `--remote-debugging-port` - ele entrará em conflito com o gerenciamento interno do Pydoll!

### Exibição e Renderização

Controle como o navegador renderiza o conteúdo:

```python
options = ChromiumOptions()

# Viewport e janela
options.add_argument('--window-size=1920,1080')
options.add_argument('--window-position=0,0')
options.add_argument('--start-maximized')
options.add_argument('--start-fullscreen')

# Telas High DPI
options.add_argument('--force-device-scale-factor=1')
options.add_argument('--high-dpi-support=1')

# Cor e renderização
options.add_argument('--force-color-profile=srgb')
options.add_argument('--disable-accelerated-2d-canvas')
options.add_argument('--disable-accelerated-video-decode')

# Renderização de fontes
options.add_argument('--font-render-hinting=none')
options.add_argument('--disable-font-subpixel-positioning')

# Animações
options.add_argument('--disable-animations')
options.add_argument('--wm-window-animations-disabled')
```

| Argumento | Efeito | Caso de Uso |
|---|---|---|
| `--window-size=W,H` | Define as dimensões da janela | Screenshots, viewport consistente |
| `--start-maximized` | Abre a janela maximizada | Testes de UI, capturas de tela cheia |
| `--force-device-scale-factor=1` | Desabilita escalonamento DPI | Renderização consistente entre sistemas |
| `--disable-animations` | Sem animações CSS/UI | Testes mais rápidos, reduz instabilidade |

### Configuração de Proxy

Configure proxies para todo o tráfego de rede:

```python
options = ChromiumOptions()

# Proxy HTTP/HTTPS
options.add_argument('--proxy-server=http://proxy.example.com:8080')

# Proxy autenticado
options.add_argument('--proxy-server=http://user:pass@proxy.example.com:8080')

# Proxy SOCKS
options.add_argument('--proxy-server=socks5://proxy.example.com:1080')

# Ignorar proxy para hosts específicos
options.add_argument('--proxy-bypass-list=localhost,127.0.0.1,*.local')

# Arquivo de auto-configuração de proxy (PAC)
options.add_argument('--proxy-pac-url=http://proxy.example.com/proxy.pac')
```

!!! info "Autenticação de Proxy"
    Para proxies que exigem autenticação, o Pydoll lida automaticamente com os desafios de autenticação ao usar o argumento `--proxy-server` com credenciais.
    
    Veja **[Interceptação de Requisições](../network/interception.md)** para detalhes sobre a interação do domínio Fetch com proxies.

## Métodos Auxiliares

`ChromiumOptions` fornece métodos convenientes para tarefas comuns de configuração:

### Gerenciamento de Downloads

```python
options = ChromiumOptions()

# Definir diretório de download
options.set_default_download_directory('/home/user/downloads')

# Perguntar pelo local de download
options.prompt_for_download = True  # Perguntar ao usuário onde salvar
options.prompt_for_download = False  # Baixar silenciosamente (padrão)

# Permitir múltiplos downloads automáticos
options.allow_automatic_downloads = True  # Permitir sem perguntar
options.allow_automatic_downloads = False  # Bloquear ou perguntar (padrão)
```

### Bloqueio de Conteúdo

```python
options = ChromiumOptions()

# Bloquear pop-ups
options.block_popups = True  # Bloquear (padrão na maioria dos casos)
options.block_popups = False  # Permitir

# Bloquear notificações
options.block_notifications = True  # Bloquear pedidos
options.block_notifications = False  # Permitir que sites perguntem
```

### Controles de Privacidade

```python
options = ChromiumOptions()

# Gerenciador de senhas
options.password_manager_enabled = False  # Desabilitar avisos de salvar senha
options.password_manager_enabled = True  # Habilitar (padrão)

# Proteção contra vazamento WebRTC (previne exposição do IP real via WebRTC)
options.webrtc_leak_protection = True  # Adiciona --force-webrtc-ip-handling-policy=disable_non_proxied_udp
options.webrtc_leak_protection = False  # Desabilitar (padrão)
```

!!! tip "Proteção contra Vazamento WebRTC"
    O WebRTC pode vazar seu endereço IP real mesmo quando estiver usando um proxy. Habilite `webrtc_leak_protection` para bloquear conexões UDP que não passam pelo proxy, impedindo que requisições STUN contornem seu proxy. Isso é **essencial** ao usar proxies para anonimato. Veja **[Fundamentos de Rede - WebRTC](../../deep-dive/network/network-fundamentals.md#webrtc-e-vazamento-de-ip)** para detalhes.

### Manuseio de Arquivos

```python
options = ChromiumOptions()

# Comportamento de PDF
options.open_pdf_externally = True  # Baixar PDFs em vez de visualizar
options.open_pdf_externally = False  # Visualizar no navegador (padrão)
```

### Internacionalização

```python
options = ChromiumOptions()

# Idiomas aceitos (afeta o cabeçalho Accept-Language)
options.set_accept_languages('en-US,en;q=0.9,pt-BR;q=0.8')
```

## Exemplos de Configuração Completa

### Configuração para Raspagem Rápida

Otimizado para velocidade e eficiência de recursos:

```python
import asyncio
from pydoll.browser.chromium import Chrome
from pydoll.browser.options import ChromiumOptions
from pydoll.constants import PageLoadState

def create_fast_scraping_options() -> ChromiumOptions:
    """Configuração ultrarrápida para web scraping."""
    options = ChromiumOptions()
    
    # Headless para velocidade
    options.headless = True
    
    # Carregamentos de página mais rápidos (DOM pronto é suficiente para scraping)
    options.page_load_state = PageLoadState.INTERACTIVE
    
    # Desabilitar recursos desnecessários
    options.add_argument('--disable-extensions')
    options.add_argument('--disable-gpu')
    options.add_argument('--disable-dev-shm-usage')
    options.add_argument('--disable-background-networking')
    options.add_argument('--disable-sync')
    options.add_argument('--disable-translate')
    
    # Bloquear conteúdo que retarda o carregamento
    options.block_notifications = True
    options.block_popups = True
    
    # Desabilitar imagens para carregamento ainda mais rápido (se você não precisar delas)
    options.add_argument('--blink-settings=imagesEnabled=false')
    
    # Otimizações de rede
    options.add_argument('--disable-features=NetworkPrediction')
    options.add_argument('--dns-prefetch-disable')
    
    return options

async def fast_scraping_example():
    options = create_fast_scraping_options()
    
    async with Chrome(options=options) as browser:
        tab = await browser.start()
        
        # Navegação e raspagem super rápidas
        urls = ['https://example.com', 'https://example.org', 'https://example.net']
        
        for url in urls:
            await tab.go_to(url)
            title = await tab.execute_script('return document.title')
            print(f"{url}: {title}")

asyncio.run(fast_scraping_example())
```

### Configuração Completa de Furtividade (Stealth)

Para máxima indetectabilidade, combine argumentos de linha de comando com preferências do navegador:

```python
import asyncio
from pydoll.browser.chromium import Chrome
from pydoll.browser.options import ChromiumOptions

def create_full_stealth_options() -> ChromiumOptions:
    """Configuração completa de furtividade combinando argumentos e preferências."""
    options = ChromiumOptions()
    
    # ===== Argumentos de Linha de Comando =====
    
    # Furtividade principal
    options.add_argument('--disable-blink-features=AutomationControlled')
    options.add_argument('--disable-features=IsolateOrigins,site-per-process')
    
    # User agent (use um recente e comum)
    options.add_argument('--user-agent=Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/130.0.0.0 Safari/537.36')
    
    # Idioma e locale
    options.add_argument('--lang=en-US')
    options.add_argument('--accept-lang=en-US,en;q=0.9')
    
    # WebGL (renderizador por software para evitar assinaturas de GPU únicas)
    options.add_argument('--use-gl=swiftshader')
    options.add_argument('--disable-features=WebGLDraftExtensions')
    
    # Prevenção de vazamento de IP via WebRTC
    options.webrtc_leak_protection = True

    # Permissões e primeira execução
    options.add_argument('--no-first-run')
    options.add_argument('--no-default-browser-check')
    
    # Tamanho da janela (resolução comum)
    options.add_argument('--window-size=1920,1080')
    
    # ===== Preferências do Navegador =====
    # Para configuração abrangente de preferências do navegador, veja:
    # https://pydoll.tech/docs/features/configuration/browser-preferences/#stealth-fingerprinting
    
    return options

async def stealth_automation_example():
    options = create_full_stealth_options()
    
    async with Chrome(options=options) as browser:
        tab = await browser.start()
        
        # Testar em sites de detecção de bots
        await tab.go_to('https://bot.sannysoft.com')
        await asyncio.sleep(5)
        
        # Sua automação aqui...

asyncio.run(stealth_automation_example())
```

!!! warning "Consistência do User-Agent é Crítica"
    Definir `--user-agent` altera apenas o **cabeçalho HTTP**, mas os sistemas de detecção também verificam `navigator.userAgent`, `navigator.platform`, `navigator.vendor` e outras propriedades JavaScript. **Inconsistências entre esses valores são um forte indicador de bot.**
    
    Por exemplo, se o seu User-Agent HTTP diz "Windows" mas o `navigator.platform` diz "Linux", você será sinalizado imediatamente.
    
    **Solução**: Você deve também sobrescrever as propriedades JavaScript via CDP para manter a consistência. Veja **[Fingerprinting do Navegador - Consistência do User-Agent](../../deep-dive/fingerprinting/browser-fingerprinting.md#user-agent-consistency)** para explicação detalhada e implementação usando `Page.addScriptToEvaluateOnNewDocument`.
    
    É por isso que a furtividade abrangente requer tanto argumentos de linha de comando QUANTO configuração de preferências do navegador.

!!! tip "Estratégia Completa de Furtividade"
    Argumentos de linha de comando são apenas parte da solução. Para máxima furtividade:
    
    1.  **Use os argumentos acima** (navigator.webdriver, WebGL, WebRTC)
    2.  **Configure as preferências do navegador** - Veja [Preferências do Navegador - Furtividade e Fingerprinting](browser-preferences.md#stealth-fingerprinting)
    3.  **Interações semelhantes a humanas** - Veja [Interações Semelhantes a Humanas](../automation/human-interactions.md)
    4.  **Boa reputação de IP/proxy** - Use proxies residenciais

### Configuração para Docker/CI

Para ambientes contêinerizados:

```python
import asyncio
from pydoll.browser.chromium import Chrome
from pydoll.browser.options import ChromiumOptions
from pydoll.constants import PageLoadState

def create_docker_options() -> ChromiumOptions:
    """Configuração para contêineres Docker e CI/CD."""
    options = ChromiumOptions()
    
    # Necessário para Docker
    options.headless = True
    options.add_argument('--no-sandbox')  # Sandbox conflita com isolamento do contêiner
    options.add_argument('--disable-dev-shm-usage')  # Supera o limite de tamanho do /dev/shm
    
    # Estabilidade
    options.add_argument('--disable-gpu')
    options.add_argument('--disable-software-rasterizer')
    
    # Otimização de memória
    options.add_argument('--disable-extensions')
    options.add_argument('--disable-background-networking')
    
    # Carregamentos de página mais rápidos para CI
    options.page_load_state = PageLoadState.INTERACTIVE
    
    # Aumentar timeout para runners de CI lentos
    options.start_timeout = 20
    
    # Tratamento de falhas
    options.add_argument('--disable-crash-reporter')
    
    return options

async def ci_testing_example():
    options = create_docker_options()
    
    async with Chrome(options=options) as browser:
        tab = await browser.start()
        
        # Rode seus testes...
        await tab.go_to('https://example.com')
        assert await tab.execute_script('return document.title') == 'Example Domain'

asyncio.run(ci_testing_example())
```

## Solução de Problemas

### O Navegador Não Inicia

```python
# Aumente o timeout
options.start_timeout = 30

# Verifique a localização do binário
options.binary_location = '/path/to/chrome'

# Problemas com Docker/CI
options.add_argument('--no-sandbox')
options.add_argument('--disable-dev-shm-usage')
```

### Desempenho Lento

```python
# Desabilite a GPU se não for necessária
options.add_argument('--disable-gpu')

# Desabilite imagens
options.add_argument('--blink-settings=imagesEnabled=false')

# Use o estado de carregamento INTERACTIVE
options.page_load_state = PageLoadState.INTERACTIVE

# Desabilite recursos desnecessários
options.add_argument('--disable-extensions')
options.add_argument('--disable-background-networking')
```

### Problemas de Memória no Docker

```python
# Essencial para Docker
options.add_argument('--disable-dev-shm-usage')

# Reduzir consumo de memória
options.add_argument('--disable-extensions')
options.add_argument('--disable-gpu')
options.add_argument('--single-process')  # Último recurso (pode ser instável)
```

## Leitura Adicional

- **[Preferências do Navegador](browser-preferences.md)** - Sistema interno de preferências do Chromium
- **[Automação Furtiva](../automation/human-interactions.md)** - Interações semelhantes a humanas
- **[Contextos](../browser-management/contexts.md)** - Contextos de navegação isolados
- **[Interceptação de Rede](../network/interception.md)** - Manipulação de requisições/respostas

!!! tip "Experimentação é Chave"
    A configuração do navegador é altamente dependente do seu caso de uso específico. Comece com os exemplos aqui, depois ajuste com base em suas necessidades. Use `browser._connection_port` para acessar o DevTools e inspecionar o que está acontecendo dentro do navegador.

================================================
FILE: docs/pt/features/configuration/browser-preferences.md
================================================
# Preferências Personalizadas do Navegador

Uma das funcionalidades mais poderosas do Pydoll é o acesso direto ao sistema interno de preferências do Chromium. Diferente das ferramentas tradicionais de automação de navegador que expõem apenas um conjunto limitado de opções, o Pydoll oferece o mesmo nível de controle que extensões e administradores corporativos têm, permitindo que você ajuste **qualquer** configuração de navegador disponível no código-fonte do Chromium.

## Por que as Preferências do Navegador Importam

As preferências do navegador controlam cada aspecto de como o Chromium se comporta:

- **Desempenho**: Desabilite recursos que você não precisa para carregamentos de página mais rápidos
- **Privacidade**: Controle quais dados o navegador coleta e envia
- **Automação**: Remova prompts e confirmações do usuário que quebram fluxos de trabalho
- **Furtividade (Stealth)**: Crie fingerprints de navegador realistas para evitar detecção
- **Corporativo**: Aplique políticas tipicamente disponíveis apenas através de Política de Grupo (Group Policy)

!!! info "O Poder do Acesso Direto"
    A maioria das ferramentas de automação expõe apenas 10-20 configurações comuns. O Pydoll lhe dá acesso a **centenas** de preferências, desde o comportamento de download até sugestões de busca, da predição de rede ao gerenciamento de plugins. Se o Chromium pode fazer, você pode configurar.

## Guia Rápido

```python
import asyncio
from pydoll.browser.chromium import Chrome
from pydoll.browser.options import ChromiumOptions

async def preferences_example():
    options = ChromiumOptions()
    
    # Definir preferências usando um dict
    options.browser_preferences = {
        'download': {
            'default_directory': '/tmp/downloads',
            'prompt_for_download': False
        },
        'profile': {
            'default_content_setting_values': {
                'notifications': 2  # Bloquear notificações
            }
        }
    }
    
    async with Chrome(options=options) as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com')
        
        # Downloads vão para /tmp/downloads automaticamente
        # Nenhum prompt de notificação aparecerá

asyncio.run(preferences_example())
```

## Entendendo as Preferências do Navegador

### O que são Preferências?

O Chromium armazena todas as configurações ajustáveis pelo usuário em um arquivo JSON chamado `Preferences`, localizado no diretório de dados do usuário do navegador. Este arquivo contém **tudo**, desde a URL da sua página inicial até se as imagens carregam automaticamente.

**Localização típica:**

- **Linux**: `~/.config/google-chrome/Default/Preferences`
- **macOS**: `~/Library/Application Support/Google/Chrome/Default/Preferences`
- **Windows**: `%LOCALAPPDATA%\Google\Chrome\User Data\Default\Preferences`

### Estrutura do Arquivo de Preferências

O arquivo Preferences é um objeto JSON aninhado:

```json
{
  "download": {
    "default_directory": "/home/user/Downloads",
    "prompt_for_download": true
  },
  "profile": {
    "default_content_setting_values": {
      "notifications": 1,
      "popups": 0
    },
    "password_manager_enabled": true
  },
  "search": {
    "suggest_enabled": true
  },
  "net": {
    "network_prediction_options": 1
  }
}
```

Cada nome de preferência separado por pontos no código-fonte do Chromium mapeia para um caminho JSON aninhado:

- `download.default_directory` → `{'download': {'default_directory': ...}}`
- `profile.password_manager_enabled` → `{'profile': {'password_manager_enabled': ...}}`

### Como o Chromium Usa as Preferências

Quando o Chromium inicia:

1.  **Lê** o arquivo Preferences do disco
2.  **Aplica** essas configurações para definir o comportamento do navegador
3.  **Atualiza** o arquivo quando os usuários alteram configurações via UI
4.  **Recorre aos padrões** se as preferências estiverem ausentes

O Pydoll intercepta o passo 1 pré-populando o arquivo Preferences antes do navegador iniciar, garantindo que suas configurações personalizadas sejam aplicadas desde o primeiro carregamento da página.

## Como Funciona no Pydoll

### Definindo Preferências

Use a propriedade `browser_preferences` para definir qualquer preferência:

```python
from pydoll.browser.options import ChromiumOptions

options = ChromiumOptions()

# Atribuição direta - mescla com preferências existentes
options.browser_preferences = {
    'download': {'default_directory': '/tmp'},
    'intl': {'accept_languages': 'pt-BR,en-US'}
}

# Múltiplas atribuições são mescladas, não substituídas
options.browser_preferences = {
    'profile': {'password_manager_enabled': False}
}

# Ambos os conjuntos de preferências estão agora ativos
```

!!! warning "Preferências São Mescladas, Não Substituídas"
    Quando você define `browser_preferences` múltiplas vezes, as novas preferências são **mescladas** com as existentes. Apenas as chaves específicas que você define são atualizadas; todo o resto é preservado.
    
    ```python
    options.browser_preferences = {'download': {'prompt_for_download': False}}
    options.browser_preferences = {'profile': {'password_manager_enabled': False}}
    
    # Resultado: AMBAS as preferências são definidas
    # {'download': {'prompt_for_download': False}, 'profile': {'password_manager_enabled': False}}
    ```

### Sintaxe de Caminho Aninhado

As preferências usam dicionários aninhados que espelham a notação de pontos do Chromium:

```python
# Constante do código-fonte do Chromium:
# const char kDownloadDefaultDirectory[] = "download.default_directory";

# Traduz para dict Python:
options.browser_preferences = {
    'download': {
        'default_directory': '/path/to/downloads'
    }
}
```

Quanto mais profundo o aninhamento, mais específica a preferência:

```python
# Nível superior: profile
# Segundo nível: default_content_setting_values  
# Terceiro nível: notifications

options.browser_preferences = {
    'profile': {
        'default_content_setting_values': {
            'notifications': 2,  # Bloquear
            'geolocation': 2,    # Bloquear
            'media_stream': 2    # Bloquear
        }
    }
}
```

## Casos de Uso Práticos

### 1. Otimização de Desempenho

Desabilite recursos que consomem muitos recursos para automação mais rápida:

```python
import asyncio
from pydoll.browser.chromium import Chrome
from pydoll.browser.options import ChromiumOptions

async def performance_optimized_browser():
    options = ChromiumOptions()
    options.browser_preferences = {
        # Desabilitar predição de rede e prefetching
        'net': {
            'network_prediction_options': 2  # 2 = Nunca prever
        },
        # Desabilitar carregamento de imagens
        'profile': {
            'default_content_setting_values': {
                'images': 2  # 2 = Bloquear, 1 = Permitir
            }
        },
        # Desabilitar plugins
        'webkit': {
            'webprefs': {
                'plugins_enabled': False
            }
        },
        # Desabilitar verificação ortográfica
        'browser': {
            'enable_spellchecking': False
        }
    }
    
    async with Chrome(options=options) as browser:
        tab = await browser.start()
        
        # Páginas carregam 3-5x mais rápido sem imagens e recursos desnecessários
        await tab.go_to('https://example.com')
        print("Carregamento rápido completo!")

asyncio.run(performance_optimized_browser())
```

!!! tip "Impacto no Desempenho"
    Apenas desabilitar imagens pode reduzir o tempo de carregamento da página em 50-70% para sites pesados em imagens. Combine com a desabilitação de prefetch, verificação ortográfica e plugins para velocidade máxima.

### 2. Privacidade e Anti-Rastreamento

Crie uma configuração de navegador focada em privacidade:

```python
import asyncio
from pydoll.browser.chromium import Chrome
from pydoll.browser.options import ChromiumOptions

async def privacy_focused_browser():
    options = ChromiumOptions()
    options.browser_preferences = {
        # Habilitar Do Not Track
        'enable_do_not_track': True,
        
        # Desabilitar referrers
        'enable_referrers': False,
        
        # Desabilitar Safe Browsing (envia URLs para o Google)
        'safebrowsing': {
            'enabled': False
        },
        
        # Desabilitar gerenciador de senhas e bloquear cookies de terceiros
        # (tudo em uma única chave 'profile': em um dict literal do Python,
        # chaves repetidas fazem a última sobrescrever as anteriores)
        'profile': {
            'password_manager_enabled': False,
            'block_third_party_cookies': True,
            'cookie_controls_mode': 1
        },
        
        # Desabilitar preenchimento automático
        'autofill': {
            'enabled': False,
            'profile_enabled': False
        },
        
        # Desabilitar sugestões de busca (envia consultas para o motor de busca)
        'search': {
            'suggest_enabled': False
        },
        
        # Desabilitar telemetria e métricas
        'user_experience_metrics': {
            'reporting_enabled': False
        }
    }
    
    async with Chrome(options=options) as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com')
        print("Navegador focado em privacidade pronto!")

asyncio.run(privacy_focused_browser())
```

### 3. Downloads Silenciosos

Automatize downloads de arquivos sem interação do usuário:

```python
import asyncio
from pathlib import Path
from pydoll.browser.chromium import Chrome
from pydoll.browser.options import ChromiumOptions

async def silent_download_automation():
    download_dir = Path.home() / 'automation_downloads'
    download_dir.mkdir(exist_ok=True)
    
    options = ChromiumOptions()
    options.browser_preferences = {
        'download': {
            'default_directory': str(download_dir),
            'prompt_for_download': False,
            'directory_upgrade': True
        },
        'profile': {
            'default_content_setting_values': {
                'automatic_downloads': 1  # 1 = Permitir, 2 = Bloquear
            }
        },
        # Sempre baixar PDFs em vez de abrir no visualizador
        'plugins': {
            'always_open_pdf_externally': True
        }
    }
    
    async with Chrome(options=options) as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com/downloads')
        
        # Clicar em links de download - arquivos salvam automaticamente
        download_link = await tab.find(text='Download Report')
        await download_link.click()
        
        await asyncio.sleep(3)
        print(f"Arquivo baixado para: {download_dir}")

asyncio.run(silent_download_automation())
```

### 4. Bloquear Elementos de UI Intrusivos

Remova popups, notificações e prompts que quebram a automação:

```python
import asyncio
from pydoll.browser.chromium import Chrome
from pydoll.browser.options import ChromiumOptions

async def clean_ui_browser():
    options = ChromiumOptions()
    options.browser_preferences = {
        'profile': {
            'default_content_setting_values': {
                'notifications': 2,      # Bloquear notificações
                'popups': 0,             # Bloquear popups
                'geolocation': 2,        # Bloquear requisições de localização
                'media_stream': 2,       # Bloquear acesso à câmera/microfone
                'media_stream_mic': 2,   # Bloquear microfone
                'media_stream_camera': 2 # Bloquear câmera
            }
        },
        # Desabilitar prompts de tradução
        'translate': {
            'enabled': False
        },
        # Desabilitar prompt de salvar senha
        'credentials_enable_service': False,
        
        # Manter o DevTools desacoplado (undocked) da janela da página
        # (esta preferência não remove a infobar "O Chrome está sendo controlado por automação")
        'devtools': {
            'preferences': {
                'currentDockState': '"undocked"'
            }
        }
    }
    
    async with Chrome(options=options) as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com')
        # Sem popups, sem prompts, automação limpa!

asyncio.run(clean_ui_browser())
```

### 5. Internacionalização e Localização

Configure preferências de idioma e localidade:

```python
import asyncio
from pydoll.browser.chromium import Chrome
from pydoll.browser.options import ChromiumOptions

async def localized_browser():
    options = ChromiumOptions()
    options.browser_preferences = {
        # Idiomas aceitos (ordem de prioridade)
        'intl': {
            'accept_languages': 'pt-BR,pt,en-US,en'
        },
        
        # Idiomas da verificação ortográfica
        'spellcheck': {
            'dictionaries': ['pt-BR', 'en-US']
        },
        
        # Configurações de tradução
        'translate': {
            'enabled': True
        },
        'translate_blocked_languages': ['en'],  # Não oferecer para traduzir Inglês
        
        # Codificação de caracteres padrão
        'default_charset': 'UTF-8'
    }
    
    async with Chrome(options=options) as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com')
        # Navegador configurado para Português do Brasil

asyncio.run(localized_browser())
```

## Métodos Auxiliares

Para cenários comuns, o Pydoll fornece métodos e propriedades de conveniência:

```python
from pydoll.browser.options import ChromiumOptions

options = ChromiumOptions()

# Gerenciamento de download
options.set_default_download_directory('/tmp/downloads')
options.prompt_for_download = False
options.allow_automatic_downloads = True
options.open_pdf_externally = True

# Bloqueio de conteúdo
options.block_notifications = True
options.block_popups = True

# Privacidade
options.password_manager_enabled = False

# Internacionalização
options.set_accept_languages('pt-BR,en-US,en')
```

Esses auxiliares são atalhos que definem as preferências aninhadas corretas para você:

```python
# Este auxiliar:
options.set_default_download_directory('/tmp')

# É equivalente a:
options.browser_preferences = {
    'download': {
        'default_directory': '/tmp'
    }
}
```

!!! tip "Combine Auxiliares com Preferências Diretas"
    Use auxiliares para configurações comuns e `browser_preferences` para configurações avançadas:
    
    ```python
    # Comece com auxiliares
    options.block_notifications = True
    options.prompt_for_download = False
    
    # Adicione preferências avançadas
    options.browser_preferences = {
        'net': {'network_prediction_options': 2},
        'webkit': {'webprefs': {'plugins_enabled': False}}
    }
    ```

## Encontrando Preferências no Código-Fonte do Chromium

### Referência do Código-Fonte

O Chromium define todas as constantes de preferência em `pref_names.cc`:

**Fonte oficial**: [chromium/src/+/main/chrome/common/pref_names.cc](https://chromium.googlesource.com/chromium/src/+/main/chrome/common/pref_names.cc)

### Lendo o Código-Fonte

As constantes de preferência usam notação de pontos que mapeia diretamente para dicts aninhados:

```cpp
// Do código-fonte do Chromium (pref_names.cc):
const char kDownloadDefaultDirectory[] = "download.default_directory";
const char kPromptForDownload[] = "download.prompt_for_download";
const char kSafeBrowsingEnabled[] = "safebrowsing.enabled";
const char kBlockThirdPartyCookies[] = "profile.block_third_party_cookies";
```

**Converte para Python:**

```python
options.browser_preferences = {
    'download': {
        'default_directory': '/path/to/dir',
        'prompt_for_download': False
    },
    'safebrowsing': {
        'enabled': False
    },
    'profile': {
        'block_third_party_cookies': True
    }
}
```

### Processo de Descoberta

1.  **Pesquise no código-fonte**: Vá para [pref_names.cc](https://chromium.googlesource.com/chromium/src/+/main/chrome/common/pref_names.cc)
2.  **Encontre sua preferência**: Pesquise por palavras-chave (ex: "download", "password", "notification")
3.  **Anote o nome da constante**: ex: `kDownloadDefaultDirectory[] = "download.default_directory"`
4.  **Converta para dict**: Divida pelos pontos e crie a estrutura aninhada

**Exemplo - Encontrando preferências de notificação:**

```cpp
// Pesquise por "notification" em pref_names.cc:
const char kPushMessagingAppIdentifierMap[] = 
    "gcm.push_messaging_application_id_map";
const char kDefaultNotificationsSetting[] = 
    "profile.default_content_setting_values.notifications";
```

```python
# Torna-se:
options.browser_preferences = {
    'profile': {
        'default_content_setting_values': {
            'notifications': 2  # 2 = bloquear, 1 = permitir, 0 = perguntar
        }
    }
}
```

### Padrões Comuns de Preferência

| Categoria | Exemplo de Constante | Caminho do Dict Python |
|---|---|---|
| Downloads | `download.default_directory` | `{'download': {'default_directory': ...}}` |
| Config. de Conteúdo | `profile.default_content_setting_values.X` | `{'profile': {'default_content_setting_values': {'X': ...}}}` |
| Rede | `net.network_prediction_options` | `{'net': {'network_prediction_options': ...}}` |
| Privacidade | `safebrowsing.enabled` | `{'safebrowsing': {'enabled': ...}}` |
| Sessão | `session.restore_on_startup` | `{'session': {'restore_on_startup': ...}}` |

!!! warning "Preferências Não Documentadas"
    Nem todas as preferências estão documentadas. Algumas são:
    
    - **Experimentais**: Podem mudar ou ser removidas em futuras versões do Chromium
    - **Internas**: Usadas pelos sistemas internos do Chromium
    - **Específicas da plataforma**: Funcionam apenas em certos sistemas operacionais
    
    Teste exaustivamente antes de confiar em preferências não documentadas.

## Referência de Preferências Úteis

Aqui está uma lista selecionada de preferências interessantes e úteis do `pref_names.cc` do Chromium:

### Configurações de Conteúdo e Mídia

```python
options.browser_preferences = {
    'profile': {
        'default_content_setting_values': {
            # Controle de conteúdo (0=perguntar, 1=permitir, 2=bloquear)
            'cookies': 1,                    # Permitir cookies
            'images': 1,                     # Permitir imagens (2 para bloquear)
            'javascript': 1,                 # Permitir JavaScript (2 para bloquear)
            'plugins': 2,                    # Bloquear plugins (Flash, etc.)
            'popups': 0,                     # Bloquear popups
            'geolocation': 2,                # Bloquear requisições de localização
            'notifications': 2,              # Bloquear notificações
            'media_stream': 2,               # Bloquear câmera/microfone
            'media_stream_mic': 2,           # Bloquear apenas microfone
            'media_stream_camera': 2,        # Bloquear apenas câmera
            'automatic_downloads': 1,        # Permitir downloads automáticos
            'midi_sysex': 2,                 # Bloquear acesso MIDI
            'clipboard': 1,                  # Permitir acesso à área de transferência
            'sensors': 2,                    # Bloquear sensores de movimento
            'usb_guard': 2,                  # Bloquear acesso a dispositivos USB
            'serial_guard': 2,               # Bloquear acesso à porta serial
            'bluetooth_guard': 2,            # Bloquear Bluetooth
            'file_system_write_guard': 2,    # Bloquear escrita no sistema de arquivos
        }
    }
}
```

### Rede e Desempenho

```python
options.browser_preferences = {
    'net': {
        # Predição de rede: 0=sempre, 1=apenas wifi, 2=nunca
        'network_prediction_options': 2,
        
        # Verificação rápida de alcançabilidade do servidor
        'quick_check_enabled': False
    },
    
    # Prefetching de DNS
    'dns_prefetching': {
        'enabled': False  # Desabilitar para reduzir tráfego de rede
    },
    
    # Pré-conectar a resultados de busca
    'search': {
        'suggest_enabled': False,           # Desabilitar sugestões de busca
        'instant_enabled': False            # Desabilitar resultados instantâneos
    },
    
    # Páginas de erro alternativas
    'alternate_error_pages': {
        'enabled': False  # Não sugerir alternativas para 404s
    }
}
```

### Preferências de Download

```python
options.browser_preferences = {
    'download': {
        'default_directory': '/path/to/downloads',
        'prompt_for_download': False,
        'directory_upgrade': True,
        'extensions_to_open': '',           # Tipos de arquivo para abrir automaticamente
        'open_pdf_externally': True,        # Não usar o visualizador de PDF interno
    },
    
    'download_bubble': {
        'partial_view_enabled': True        # Mostrar balão de progresso do download
    },
    
    'safebrowsing': {
        'enabled': False  # Desabilitar avisos de download do Safe Browsing
    }
}
```

### Privacidade e Segurança

```python
options.browser_preferences = {
    # Do Not Track
    'enable_do_not_track': True,
    
    # Referrers
    'enable_referrers': False,
    
    # Safe Browsing
    'safebrowsing': {
        'enabled': False,                   # Desabilitar Safe Browsing
        'enhanced': False                   # Desabilitar proteção avançada
    },
    
    # Privacy Sandbox (substituto de cookies do Google)
    'privacy_sandbox': {
        'apis_enabled': False,
        'topics_enabled': False,
        'fledge_enabled': False
    },
    
    # Cookies de terceiros
    'profile': {
        'block_third_party_cookies': True,
        'cookie_controls_mode': 1,          # 0=desativado, 1=bloquear terceiros, 2=bloquear apenas no modo anônimo
        
        # Configurações de conteúdo
        'default_content_setting_values': {
            'cookies': 1,
            'third_party_cookie_blocking_enabled': True
        }
    },
    
    # WebRTC (pode vazar IP real)
    'webrtc': {
        'ip_handling_policy': 'default_public_interface_only',
        'multiple_routes_enabled': False,
        'nonproxied_udp_enabled': False
    }
}
```

### Preenchimento Automático e Senhas

```python
options.browser_preferences = {
    'autofill': {
        'enabled': False,                   # Desabilitar preenchimento automático de formulários
        'profile_enabled': False,           # Desabilitar preenchimento automático de endereço
        'credit_card_enabled': False,       # Desabilitar preenchimento automático de cartão de crédito
        'credit_card_fido_auth_enabled': False
    },
    
    'profile': {
        'password_manager_enabled': False,
        'password_manager_leak_detection': False
    },
    
    'credentials_enable_service': False,
    'credentials_enable_autosignin': False
}
```

### Comportamento do Navegador e UI

```python
import time

options.browser_preferences = {
    # Página inicial e inicialização
    'homepage': 'https://www.google.com',
    'homepage_is_newtabpage': False,
    'newtab_page_location_override': 'https://www.google.com',
    
    'session': {
        'restore_on_startup': 1,            # 0=nova aba, 1=restaurar, 4=URLs específicas, 5=página nova aba
        'startup_urls': ['https://www.google.com'],
        'session_data_status': 3            # Status dos dados da sessão (interno)
    },
    
    # Página de boas-vindas e janela
    'browser': {
        'has_seen_welcome_page': True,      # Pular tela de boas-vindas
        'window_placement': {
            'bottom': 1032,                 # Posição inferior da janela
            'left': 2247,                   # Posição esquerda da janela
            'right': 3192,                  # Posição direita da janela
            'top': 31,                      # Posição superior da janela
            'maximized': False,             # Janela está maximizada
            'work_area_bottom': 1080,       # Área de trabalho inferior da tela
            'work_area_left': 1920,         # Área de trabalho esquerda da tela
            'work_area_right': 3840,        # Área de trabalho direita da tela
            'work_area_top': 0              # Área de trabalho superior da tela
        }
    },
    
    # Extensões
    'extensions': {
        'ui': {
            'developer_mode': False
        },
        'alerts': {
            'initialized': True
        },
        'theme': {
            'system_theme': 2               # 0=padrão, 1=claro, 2=escuro
        },
        'last_chrome_version': '130.0.6723.91'  # Deve corresponder à sua versão
    },
    
    # Tradução
    'translate': {
        'enabled': False                    # Desabilitar prompts de tradução
    },
    'translate_blocked_languages': ['en'],  # Nunca oferecer para traduzir Inglês
    'translate_site_blacklist': [],         # Legado (use blocklist_with_time)
    
    # Barra de favoritos
    'bookmark_bar': {
        'show_on_all_tabs': False
    },
    
    # Abas
    'tabs': {
        'new_tab_position': 0               # 0=à direita, 1=após atual
    },
    'pinned_tabs': [],                      # Lista de URLs de abas fixadas
    
    # Página Nova Aba (timestamps em formato Chrome)
    'NewTabPage': {
        'PrevNavigationTime': str(int(time.time() * 1000000) + 11644473600000000)  # Timestamp do Chrome
    },
    'ntp': {
        'num_personal_suggestions': 6       # Número de sugestões (0-10)
    },
    
    # Personalização da barra de ferramentas
    'toolbar': {
        'pinned_chrome_labs_migration_complete': True
    }
}
```

!!! info "Formato de Timestamp do Chrome"
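    O Chrome usa a mesma época do Windows FILETIME, mas com resolução de microssegundos: microssegundos desde 1º de janeiro de 1601 UTC. A constante `11644473600000000` é a diferença, em microssegundos, entre essa época e a época Unix (1º de janeiro de 1970).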
    
    Converter timestamp do Python:
    ```python
    import time
    chrome_time = int(time.time() * 1000000) + 11644473600000000
    ```

### Ortografia e Idioma

```python
options.browser_preferences = {
    'browser': {
        'enable_spellchecking': False       # Desabilitar verificação ortográfica
    },
    
    'spellcheck': {
        'dictionaries': ['en-US', 'pt-BR'], # Idiomas da verificação ortográfica
        'dictionary': '',                   # Preferência legada (manter vazio)
        'use_spelling_service': False       # Não enviar ao Google
    },
    
    'intl': {
        'accept_languages': 'pt-BR,pt,en-US,en',
        'selected_languages': 'pt-BR,pt,en-US,en'  # Selecionados explicitamente
    },
    
    # Comportamento e histórico de tradução
    'translate': {
        'enabled': True
    },
    'translate_accepted_count': {
        'pt-BR': 0,
        'es': 5                             # Aceitou 5 traduções de espanhol
    },
    'translate_denied_count_for_language': {
        'en': 10                            # Nunca traduzir inglês
    },
    'translate_ignored_count_for_language': {
        'en': 1
    },
    'translate_site_blocklist_with_time': {},  # Sites para nunca traduzir
    
    # Idioma das legendas de acessibilidade
    'accessibility': {
        'captions': {
            'live_caption_language': 'pt-BR'
        }
    },
    
    # Contadores do modelo de idioma (estatísticas de uso)
    'language_model_counters': {
        'en': 2,                            # Contagem de palavras em inglês
        'pt': 10                            # Contagem de palavras em português
    }
}
```

!!! info "Contadores do Modelo de Idioma"
    Esses contadores rastreiam estatísticas de uso de idioma para os modelos de aprendizado de máquina do Chrome:
    
    - Usados para prever as preferências de idioma do usuário
    - Afeta sugestões de busca e autocompletar
    - Contagens mais altas indicam uso mais frequente
    - Valores realistas: 0-1000 para uso ocasional, 1000+ para uso intenso

### Acessibilidade

```python
options.browser_preferences = {
    'accessibility': {
        'image_labels_enabled': False       # Não obter legendas de imagem do Google
    },
    
    # Configurações de fonte
    'webkit': {
        'webprefs': {
            'default_font_size': 16,
            'default_fixed_font_size': 13,
            'minimum_font_size': 0,
            'minimum_logical_font_size': 6,
            'fonts': {
                'standard': {
                    'Zyyy': 'Arial'
                },
                'serif': {
                    'Zyyy': 'Times New Roman'
                }
            }
        }
    }
}
```

### Mídia e Áudio

```python
options.browser_preferences = {
    # Áudio
    'audio': {
        'mute_enabled': False               # Iniciar com áudio ligado/desligado
    },
    
    # Autoplay
    'media': {
        'autoplay_policy': 0,               # 0=permitir, 1=gesto do usuário, 2=ativação do usuário no documento
        'video_fullscreen_orientation_lock': False
    },
    
    # WebGL
    'webkit': {
        'webprefs': {
            'webgl_enabled': True,          # Habilitar/desabilitar WebGL
            'webgl2_enabled': True
        }
    }
}
```

### Impressão

```python
options.browser_preferences = {
    'printing': {
        'print_preview_sticky_settings': {
            'appState': '{\"version\":2,\"recentDestinations\":[{\"id\":\"Save as PDF\",\"origin\":\"local\"}],\"marginsType\":3,\"customMargins\":{\"marginTop\":63,\"marginRight\":192,\"marginBottom\":240,\"marginLeft\":260}}'
        }
    },
    
    'savefile': {
        'default_directory': '/tmp'         # Local padrão para salvar PDFs
    }
}
```

!!! tip "Formato appState da Impressão"
    O `appState` é uma string codificada em JSON. Para manipulação mais fácil:
    
    ```python
    import json
    
    app_state = {
        'version': 2,
        'recentDestinations': [{
            'id': 'Save as PDF',
            'origin': 'local'
        }],
        'marginsType': 3,                   # 0=padrão, 1=sem margens, 2=mínimo, 3=personalizado
        'customMargins': {
            'marginTop': 63,
            'marginRight': 192,
            'marginBottom': 240,
            'marginLeft': 260
        },
        'isHeaderFooterEnabled': False,
        'scaling': '100',
        'scalingType': 3,                   # 0=padrão, 1=ajustar à página, 2=ajustar ao papel, 3=personalizado
        'isColorEnabled': True,
        'isDuplexEnabled': False,
        'isCssBackgroundEnabled': True,
        'dpi': {
            'horizontal_dpi': 300,
            'vertical_dpi': 300,
            'is_default': True
        },
        'mediaSize': {
            'name': 'ISO_A4',
            'width_microns': 210000,
            'height_microns': 297000,
            'custom_display_name': 'A4',
            'is_default': True
        }
    }
    
    # Converter para string para o appState
    options.browser_preferences = {
        'printing': {
            'print_preview_sticky_settings': {
                'appState': json.dumps(app_state)
            }
        }
    }
    ```

### WebRTC e Peer-to-Peer

```python
options.browser_preferences = {
    'webrtc': {
        # Política de manuseio de IP
        'ip_handling_policy': 'default_public_interface_only',
        
        # Opções de transporte UDP
        'udp_port_range': '10000-10100',    # Restringir intervalo de portas UDP
        
        # Desabilitar peer-to-peer
        'multiple_routes_enabled': False,
        'nonproxied_udp_enabled': False,
        
        # Coleta de log de texto
        'text_log_collection_allowed': False
    }
}
```

### Isolamento de Site e Segurança

```python
options.browser_preferences = {
    # Isolamento de site
    'site_isolation': {
        'isolate_origins': '',              # Origens separadas por vírgula para isolar
        'site_per_process': True            # Isolamento total de site
    },
    
    # Conteúdo misto
    'mixed_content': {
        'auto_upgrade_enabled': True        # Atualizar HTTP para HTTPS
    },
    
    # SSL/TLS
    'ssl': {
        'rev_checking': {
            'enabled': True                 # Verificar revogação de certificado
        }
    }
}
```

### Metadados de Instalação e País

```python
import uuid
from pydoll.browser.options import ChromiumOptions

options = ChromiumOptions()
options.browser_preferences = {
    # ID do país na instalação (afeta config. padrão e localidade)
    'countryid_at_install': 16978,          # Varia por país (ex: 16978 para Brasil)
    
    # Estado de instalação de aplicativos padrão
    'default_apps_install_state': 3,        # 0=não inst., 1=inst., 3=migrado
    
    # GUID do perfil corporativo (para navegadores gerenciados)
    'enterprise_profile_guid': str(uuid.uuid4()),
    
    # Provedor de busca padrão
    'default_search_provider': {
        'guid': ''                          # Vazio para padrão (Google)
    }
}
```

!!! info "Valores de ID de País"
    `countryid_at_install` é um código numérico que representa o país onde o Chrome foi instalado pela primeira vez. Ele é derivado do código ISO 3166-1 de duas letras do país: `(ord(letra1) << 8) | ord(letra2)`.
    
    - **16978**: Brasil (BR)
    - **21843**: Estados Unidos (US)
    - **18242**: Grã-Bretanha (GB)
    - **17477**: Alemanha (DE)
    - **19024**: Japão (JP)
    - E muitos outros...
    
    Isso afeta o idioma padrão, moeda e configurações regionais. Para um fingerprinting realista, combine isso com sua região alvo.

### Recursos Experimentais

```python
options.browser_preferences = {
    # Experimentos do Chrome Labs
    'browser': {
        'labs': {
            'enabled': False
        }
    },
    
    # Pré-carregamento
    'preload': {
        'enabled': False                    # Desabilitar pré-carregamento de página
    },
    
    # Rolagem suave
    'smooth_scrolling': {
        'enabled': True
    },
    
    # Aceleração de hardware
    'hardware_acceleration_mode': {
        'enabled': True                     # Defina como False para desempenho em headless
    }
}
```

### DevTools e Opções de Desenvolvedor

```python
options.browser_preferences = {
    'devtools': {
        'preferences': {
            # Aparência do DevTools
            'currentDockState': '"right"',              # "bottom", "right", "undocked"
            'uiTheme': '"dark"',                        # "dark", "light", "system"
            
            # Configurações do Console
            'consoleTimestampsEnabled': 'true',
            'preserveConsoleLog': 'true',
            
            # Painel de Rede
            'network.disableCache': 'false',
            'network.color-code-resource-types': 'true',
            'network-panel-split-view-state': '{"vertical":{"size":0}}',
            
            # Mapas de origem
            'cssSourceMapsEnabled': 'true',
            'jsSourceMapsEnabled': 'true',
            
            # Painel de Elementos
            'elements.styles.sidebar.width': '{"vertical":{"size":0,"showMode":"OnlyMain"}}',
            
            # Versionamento do Inspetor
            'inspectorVersion': '37',
            
            # Painel selecionado
            'panel-selected-tab': '"network"',          # Último painel aberto
            
            # Categorias expandidas de info de requisição
            'request-info-general-category-expanded': 'true',
            'request-info-request-headers-category-expanded': 'true',
            'request-info-response-headers-category-expanded': 'true'
        },
        'synced_preferences_sync_disabled': {
            'adorner-settings': '[{"adorner":"grid","isEnabled":true},{"adorner":"flex","isEnabled":true}]',
            'syncedInspectorVersion': '37'
        }
    },
    
    # GCM (Google Cloud Messaging)
    'gcm': {
        'product_category_for_subtypes': 'com.chrome.linux'  # com.chrome.windows, com.chrome.macos
    }
}
```

!!! tip "Formato das Preferências do DevTools"
    As preferências do DevTools usam um formato único onde valores booleanos e strings são armazenados como **strings codificadas em JSON** (ex: `'true'` em vez de `True`, `'"dark"'` em vez de `'dark'`). Isso ocorre porque as configurações do DevTools são serializadas diretamente para JSON.
    
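    Para objetos complexos, serialize o objeto como JSON compacto (uma única vez), como nos exemplos acima:
    ```python
    import json
    
    # Crie o objeto
    split_view = {'vertical': {'size': 0}}
    
    # Codifique como JSON para o DevTools
    devtools_value = json.dumps(split_view, separators=(',', ':'))
    # Resultado: '{"vertical":{"size":0}}'
    
    # Strings simples também passam por json.dumps (ganham aspas extras)
    theme_value = json.dumps('dark')
    # Resultado: '"dark"'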
    ```

### Controle de Sincronização e Login

```python
import time
from pydoll.browser.options import ChromiumOptions

options = ChromiumOptions()
options.browser_preferences = {
    'signin': {
        'allowed': True,                        # Permitir login no Google
        'cookie_clear_on_exit_migration_notice_complete': True
    },
    
    'sync': {
        'data_type_status_for_sync_to_signin': {
            'bookmarks': False,
            'history': False,
            'passwords': False,
            'preferences': False
        },
        'encryption_bootstrap_token_per_account_migration_done': True,
        'passwords_per_account_pref_migration_done': True,
        'feature_status_for_sync_to_signin': 5
    },
    
    # Serviços do Google
    'google': {
        'services': {
            'signin_scoped_device_id': '<your-device-id>'  # Gere um ID único
        }
    },
    
    # GAIA (Google Accounts Infrastructure)
    'gaia_cookie': {
        'changed_time': str(int(time.time())),
        'hash': '',
        'last_list_accounts_data': '[]'
    }
}
```

### Otimização e Rastreamento de Desempenho

```python
import time
from pydoll.browser.options import ChromiumOptions

options = ChromiumOptions()
options.browser_preferences = {
    # Guia de otimização (dicas de desempenho do Google)
    'optimization_guide': {
        'hintsfetcher': {
            'hosts_successfully_fetched': {}
        },
        'predictionmodelfetcher': {
            'last_fetch_attempt': str(int(time.time())),
            'last_fetch_success': str(int(time.time()))
        },
        'previously_registered_optimization_types': {}
    },
    
    # Clusters de histórico (agrupando navegação relacionada)
    'history_clusters': {
        'all_cache': {
            'all_keywords': {},
            'all_timestamp': str(int(time.time()))
        },
        'last_selected_tab': 0,
        'short_cache': {
            'short_keywords': {},
            'short_timestamp': '0'
        }
    },
    
    # Métricas de diversidade de domínio
    'domain_diversity': {
        'last_reporting_timestamp': str(int(time.time()))
    },
    
    # Plataforma de segmentação (análise de comportamento do usuário)
    'segmentation_platform': {
        'device_switcher_util': {
            'result': {
                'labels': ['NotSynced']
            }
        },
        'last_db_compaction_time': str(int(time.time()))
    },
    
    # Zero suggest (previsões da omnibox)
    'zerosuggest': {
        'cachedresults': '',
        'cachedresults_with_url': {}
    }
}
```

!!! info "Preferências de Rastreamento de Desempenho"
    Essas preferências são tipicamente usadas pelo Chrome para rastrear e otimizar o desempenho. Para automação, você pode deixá-las vazias ou definir valores realistas para parecer mais com um navegador normal.

### Eventos de Sessão e Tratamento de Falhas

O Chrome rastreia o histórico da sessão para recuperação e telemetria:

```python
import time
from pydoll.browser.options import ChromiumOptions

options = ChromiumOptions()
options.browser_preferences = {
    'sessions': {
        'event_log': [
            {
                'crashed': False,
                'time': str(int(time.time() * 1000000) + 11644473600000000),
                'type': 0                   # 0=início da sessão
            },
            {
                'crashed': False,
                'did_schedule_command': True,
                'first_session_service': True,
                'tab_count': 1,
                'time': str(int(time.time() * 1000000) + 11644473600000000),
                'type': 2,                  # 2=dados da sessão salvos
                'window_count': 1
            }
        ],
        'session_data_status': 3            # 0=desconhecido, 1=sem dados, 2=alguns dados, 3=dados completos
    },
    
    # Tipo de saída do perfil (importante para fingerprinting)
    'profile': {
        'exit_type': 'Crashed'              # 'Normal', 'Crashed', 'SessionEnded'
    }
}
```

!!! warning "Crashed vs Normal"
    A maioria dos navegadores reais **falha ocasionalmente**. Mostrar sempre a saída `'Normal'` é suspeito.
    
    **Estratégia realista**: Defina `'Crashed'` para ~10-20% dos perfis para simular a experiência normal do usuário. Ironicamente, ter falhas ocasionais faz sua automação parecer mais humana.

!!! tip "Tipos de Eventos de Sessão"
    - **Tipo 0**: Início da sessão
    - **Tipo 1**: Sessão terminada normalmente
    - **Tipo 2**: Dados da sessão salvos (abas, janelas)
    - **Tipo 3**: Sessão restaurada
    
    O `event_log` constrói um histórico de sessões do navegador ao longo do tempo.

## Furtividade (Stealth) e Fingerprinting

Criar um fingerprint de navegador realista é crucial para evitar sistemas de detecção de bots. Esta seção cobre técnicas básicas e avançadas.

### Configuração Rápida de Furtividade

Para a maioria dos casos de uso, esta configuração simples fornece boa anti-detecção:

```python
import asyncio
import time
from pydoll.browser.chromium import Chrome
from pydoll.browser.options import ChromiumOptions

async def quick_stealth():
    options = ChromiumOptions()
    
    # Simular um navegador com 60 dias de uso
    fake_timestamp = int(time.time()) - (60 * 24 * 60 * 60)
    
    options.browser_preferences = {
        # Histórico de uso falso
        'profile': {
            'last_engagement_time': fake_timestamp,
            'exited_cleanly': True,
            'exit_type': 'Normal'
        },
        
        # Página inicial realista
        'homepage': 'https://www.google.com',
        'session': {
            'restore_on_startup': 1,
            'startup_urls': ['https://www.google.com']
        },
        
        # Habilitar recursos que usuários reais têm
        'enable_do_not_track': False,  # A maioria dos usuários não habilita isso
        'safebrowsing': {'enabled': True},
        'autofill': {'enabled': True},
        'search': {'suggest_enabled': True},
        'dns_prefetching': {'enabled': True}
    }
    
    async with Chrome(options=options) as browser:
        tab = await browser.start()
        await tab.go_to('https://bot-detection-site.com')
        print("Modo furtivo ativado!")

asyncio.run(quick_stealth())
```

!!! tip "Princípios Chave da Furtividade"
    **Habilite, não desabilite**: Usuários reais têm Safe Browsing, preenchimento automático e sugestões de busca habilitados. Desabilitar tudo parece suspeito.
    
    **Envelheça seu perfil**: Instalações novas são um sinal de alerta. Simule um navegador que foi usado por semanas ou meses.
    
    **Combine com a maioria**: Use configurações padrão que 90% dos usuários têm, não configurações focadas em privacidade.

### Fingerprinting Avançado

Para máximo realismo, simule um histórico detalhado de uso do navegador:

```python
import time
from pydoll.browser.chromium import Chrome
from pydoll.browser.options import ChromiumOptions

def create_realistic_browser() -> ChromiumOptions:
    """Cria um navegador com resistência abrangente a fingerprinting."""
    options = ChromiumOptions()
    
    # Timestamps
    current_time = int(time.time())
    install_time = current_time - (90 * 24 * 60 * 60)  # 90 dias atrás
    last_use = current_time - (3 * 60 * 60)            # 3 horas atrás
    
    options.browser_preferences = {
        # Metadados do perfil (crítico para fingerprinting)
        'profile': {
            'created_by_version': '130.0.6723.91',      # Deve corresponder à sua versão do Chrome
            'creation_time': str(install_time),
            'last_engagement_time': str(last_use),
            'exit_type': 'Crashed',                     # 'Normal', 'Crashed', 'SessionEnded'
            'name': 'Pessoa 1',                         # Nome de perfil realista
            'avatar_index': 26,                         # 0-26 avatares disponíveis
            
            # Configurações de conteúdo realistas
            'default_content_setting_values': {
                'cookies': 1,
                'images': 1,
                'javascript': 1,
                'popups': 0,
                'notifications': 2,
                'geolocation': 0,           # Perguntar (não bloquear)
                'media_stream': 0           # Perguntar (realista)
            },
            
            'password_manager_enabled': False,
            'cookie_controls_mode': 0,
            'content_settings': {
                'pref_version': 1,
                'enable_quiet_permission_ui': {
                    'notifications': False
                },
                'enable_quiet_permission_ui_enabling_method': {
                    'notifications': 1
                }
            },
            
            # Metadados de segurança
            'family_member_role': 'not_in_family',
            'managed_user_id': '',
            'were_old_google_logins_removed': True
        },
        
        # Metadados de uso do navegador
        'browser': {
            'has_seen_welcome_page': True,
            'window_placement': {
                'work_area_bottom': 1080,
                'work_area_left': 0,
                'work_area_right': 1920,
                'work_area_top': 0
            }
        },
        
        # Metadados de instalação
        'countryid_at_install': 16978,              # Varia por país
        'default_apps_install_state': 3,
        
        # Metadados de extensões
        'extensions': {
            'last_chrome_version': '130.0.6723.91',  # Deve corresponder à sua versão
            'alerts': {'initialized': True},
            'theme': {'system_theme': 2}
        },
        
        # Atividade da sessão (mostra uso regular)
        'in_product_help': {
            'session_start_time': str(current_time),
            'session_last_active_time': str(current_time),
            'recent_session_start_times': [
                str(current_time - (24 * 60 * 60)),
                str(current_time - (48 * 60 * 60)),
                str(current_time - (72 * 60 * 60))
            ]
        },
        
        # Restauração de sessão
        'session': {
            'restore_on_startup': 1,
            'startup_urls': ['https://www.google.com']
        },
        
        # Página inicial
        'homepage': 'https://www.google.com',
        'homepage_is_newtabpage': False,
        
        # Histórico de tradução (mostra uso multilíngue)
        'translate': {'enabled': True},
        'translate_accepted_count': {'es': 2, 'fr': 1},
        'translate_denied_count_for_language': {'en': 1},
        
        # Verificação ortográfica
        'spellcheck': {
            'dictionaries': ['en-US', 'pt-BR'],
            'dictionary': ''
        },
        
        # Idiomas
        'intl': {
            'selected_languages': 'en-US,en,pt-BR'
        },
        
        # Metadados de login
        'signin': {
            'allowed': True,
            'cookie_clear_on_exit_migration_notice_complete': True
        },
        
        # Safe Browsing (a maioria dos usuários tem isso)
        'safebrowsing': {
            'enabled': True,
            'enhanced': False
        },
        
        # Preenchimento automático (comum para usuários reais)
        'autofill': {
            'enabled': True,
            'profile_enabled': True
        },
        
        # Sugestões de busca
        'search': {'suggest_enabled': True},
        
        # DNS prefetch
        'dns_prefetching': {'enabled': True},
        
        # Do Not Track (geralmente desligado)
        'enable_do_not_track': False,
        
        # WebRTC (configurações padrão)
        'webrtc': {
            'ip_handling_policy': 'default',
            'multiple_routes_enabled': True
        },
        
        # Privacy Sandbox (novo sistema de rastreamento do Google - usuários realistas têm isso)
        'privacy_sandbox': {
            'first_party_sets_data_access_allowed_initialized': True,
            'm1': {
                'ad_measurement_enabled': True,
                'fledge_enabled': True,
                'row_notice_acknowledged': True,
                'topics_enabled': True
            }
        },
        
        # Engajamento de mídia
        'media': {
            'engagement': {'schema_version': 5}
        },
        
        # Web apps
        'web_apps': {
            'did_migrate_default_chrome_apps': ['app-id'],
            'last_preinstall_synchronize_version': '130'
        }
    }
    
    return options

# Uso
async def advanced_stealth():
    options = create_realistic_browser()
    
    async with Chrome(options=options) as browser:
        tab = await browser.start()
        await tab.go_to('https://advanced-bot-detection.com')
        # O navegador aparece como uma instalação genuína de 90 dias

```

!!! warning "Consistência de Versão é Crítica"
    **Sempre combine as versões do Chrome**: Garanta que `profile.created_by_version` e `extensions.last_chrome_version` correspondam à sua versão real do Chrome. Versões incompatíveis são um sinal de alerta instantâneo.
    
    ```python
    # Obtenha sua versão do Chrome programaticamente:
    async with Chrome() as browser:
        tab = await browser.start()
        version = await browser.get_version()
        chrome_version = version['product'].split('/')[1]  # ex: '130.0.6723.91'
        print(f"Use esta versão: {chrome_version}")
    ```

!!! info "O que as Preferências de Fingerprinting Fazem"
    **Idade do perfil**: `creation_time` e `last_engagement_time` provam que o navegador não é uma instalação nova.
    
    **Histórico de uso**: `recent_session_start_times` mostra padrões regulares de navegação.
    
    **Histórico de tradução**: `translate_accepted_count` indica uma pessoa real usando múltiplos idiomas.
    
    **Posicionamento da janela**: Dimensões de tela realistas que correspondem a resoluções de monitor reais.
    
    **Privacy Sandbox**: Novo sistema de rastreamento do Google. Desabilitá-lo é incomum e suspeito.

## Impacto no Desempenho

Entender as implicações de desempenho das preferências do navegador ajuda a otimizar para seu caso de uso específico:

| Categoria de Preferência | Impacto Esperado | Caso de Uso |
|---|---|---|
| Desabilitar imagens | Carregamentos 50-70% mais rápidos | Raspagem de conteúdo de texto |
| Desabilitar prefetch | Carregamentos 10-20% mais rápidos | Reduzir uso de banda |
| Desabilitar plugins | Carregamentos 5-10% mais rápidos | Segurança e desempenho |
| Bloquear notificações | Elimina popups | Automação limpa |
| Downloads silenciosos | Elimina prompts | Downloads automatizados de arquivos |

!!! tip "Troca entre Velocidade e Furtividade"
    **Para velocidade**: Desabilite imagens, prefetch, plugins e verificação ortográfica.
    
    **Para furtividade**: Habilite Safe Browsing, preenchimento automático, sugestões de busca e DNS prefetch (mesmo que eles tornem as coisas mais lentas).
    
    **Abordagem equilibrada**: Habilite recursos de furtividade, mas desabilite imagens e plugins. Isso dá 40-50% de ganho de velocidade enquanto mantém um fingerprint realista.

## Veja Também

- **[Análise Profunda: Preferências do Navegador](../../deep-dive/browser-preferences.md)** - Detalhes arquitetônicos e internos
- **[Estado de Carregamento da Página](page-load-state.md)** - Controle quando as páginas são consideradas carregadas
- **[Configuração de Proxy](proxy.md)** - Configure proxies de rede
- **[Cookies e Sessões](../browser-management/cookies-sessions.md)** - Gerencie o estado do navegador
- **[Código-Fonte do Chromium: pref_names.cc](https://chromium.googlesource.com/chromium/src/+/main/chrome/common/pref_names.cc)** - Constantes oficiais de preferência
- **[Código-Fonte do Chromium: pref_names.h](https://github.com/chromium/chromium/blob/main/chrome/common/pref_names.h)** - Arquivo de cabeçalho com definições

As preferências personalizadas do navegador oferecem um controle sem precedentes sobre o comportamento do navegador, permitindo automação sofisticada, otimização de desempenho e configuração de privacidade que simplesmente não são possíveis com ferramentas de automação tradicionais. Este nível de acesso transforma o Pydoll de uma simples biblioteca de automação em um sistema completo de controle de navegador.

================================================
FILE: docs/pt/features/configuration/proxy.md
================================================
# Configuração de Proxy

Proxies são essenciais para a automação web profissional, permitindo contornar limites de requisições (rate limits), acessar conteúdo geo-restrito e manter o anonimato. O Pydoll oferece suporte nativo a proxies com tratamento automático de autenticação.

!!! info "Documentação Relacionada"
    - **[Opções do Navegador](browser-options.md)** - Argumentos de proxy via linha de comando
    - **[Interceptação de Requisições](../network/interception.md)** - Como a autenticação de proxy funciona internamente
    - **[Automação Furtiva](../automation/human-interactions.md)** - Combine proxies com anti-detecção
    - **[Análise Profunda da Arquitetura de Proxy](../../deep-dive/proxy-architecture.md)** - Fundamentos de rede, protocolos, segurança e construção do seu próprio proxy

## Por que Usar Proxies?

Proxies oferecem capacidades críticas para automação:

| Benefício | Descrição | Caso de Uso |
|---|---|---|
| **Rotação de IP** | Distribui requisições por múltiplos IPs | Evitar limites de requisição, raspar em escala |
| **Acesso Geográfico** | Acessa conteúdo bloqueado por região | Testar recursos geo-direcionados, contornar restrições |
| **Anonimato** | Esconde seu endereço IP real | Automação focada em privacidade, análise de concorrentes |
| **Distribuição de Carga** | Espalha o tráfego por múltiplos endpoints | Raspagem de alto volume, testes de estresse |
| **Evitar Banimento** | Previne banimentos permanentes de IP | Automação de longa duração, raspagem agressiva |

!!! tip "Quando Usar Proxies"
    **Sempre use proxies para:**
    
    - Raspagem web em produção (>100 requisições/hora)
    - Acessar conteúdo geo-restrito
    - Contornar limites de requisição ou bloqueios baseados em IP
    - Testar de diferentes regiões
    - Manter o anonimato
    
    **Você pode pular os proxies para:**
    
    - Desenvolvimento e testes locais
    - Automação interna/corporativa
    - Automação de baixo volume (<50 requisições/dia)
    - Raspagem da sua própria infraestrutura

## Tipos de Proxy

Diferentes protocolos de proxy servem a propósitos distintos:

| Tipo | Porta | Autenticação | Velocidade | Segurança | Caso de Uso |
|---|---|---|---|---|---|
| **HTTP** | 80, 8080 | Opcional | Rápida | Baixa | Raspagem web básica, dados não sensíveis |
| **HTTPS** | 443, 8443 | Opcional | Rápida | Média | Raspagem web segura, tráfego criptografado |
| **SOCKS5** | 1080, 1081 | Opcional | Média | Alta | Suporte total TCP/UDP, casos de uso avançados |

### Proxies HTTP/HTTPS

Proxies web padrão, ideais para a maioria das tarefas de automação:

```python
import asyncio
from pydoll.browser.chromium import Chrome
from pydoll.browser.options import ChromiumOptions

async def http_proxy_example():
    options = ChromiumOptions()
    
    # Proxy HTTP (não criptografado)
    options.add_argument('--proxy-server=http://proxy.example.com:8080')
    
    # Ou proxy HTTPS (criptografado)
    # options.add_argument('--proxy-server=https://proxy.example.com:8443')
    
    async with Chrome(options=options) as browser:
        tab = await browser.start()
        
        # Todo o tráfego passa pelo proxy
        await tab.go_to('https://httpbin.org/ip')
        
        # Verificar IP do proxy
        ip = await tab.execute_script('return document.body.textContent')
        print(f"IP Atual: {ip}")

asyncio.run(http_proxy_example())
```

**Prós:**

- Rápido e eficiente
- Amplo suporte em todos os serviços
- Fácil de configurar

**Contras:**

- HTTP: Sem criptografia (tráfego visível para o proxy)
- Pode ser detectado mais facilmente que o SOCKS5

### Proxies SOCKS5

Proxies avançados com suporte total a TCP/UDP:

```python
import asyncio
from pydoll.browser.chromium import Chrome
from pydoll.browser.options import ChromiumOptions

async def socks5_proxy_example():
    options = ChromiumOptions()
    
    # Proxy SOCKS5
    options.add_argument('--proxy-server=socks5://proxy.example.com:1080')
    
    async with Chrome(options=options) as browser:
        tab = await browser.start()
        await tab.go_to('https://httpbin.org/ip')

asyncio.run(socks5_proxy_example())
```

**Prós:**

- Agnóstico a protocolo (funciona com qualquer tráfego TCP/UDP)
- Melhor para casos de uso avançados (WebSockets, WebRTC)
- Mais furtivo (mais difícil de detectar)

**Contras:**

- Ligeiramente mais lento que HTTP/HTTPS
- Menos comum em serviços de proxy gratuitos/baratos

!!! info "SOCKS4 vs SOCKS5"
    **SOCKS5** é recomendado em vez do SOCKS4 porque:
    
    - Suporta autenticação (usuário/senha)
    - Lida com tráfego UDP (para WebRTC, DNS, etc.)
    - Fornece melhor tratamento de erros
    
    Use `socks5://` a menos que você precise especificamente de SOCKS4 (`socks4://`).

## Proxies Autenticados

O Pydoll lida automaticamente com a autenticação de proxy sem intervenção manual.

### Como a Autenticação Funciona

Quando você fornece credenciais na URL do proxy, o Pydoll:

1.  **Intercepta o desafio de autenticação** usando o domínio Fetch
2.  **Responde automaticamente** com as credenciais
3.  **Continua a navegação** sem interrupções

Isso acontece de forma transparente: você não precisa lidar com a autenticação manualmente!

```python
import asyncio
from pydoll.browser.chromium import Chrome
from pydoll.browser.options import ChromiumOptions

async def authenticated_proxy_example():
    options = ChromiumOptions()
    
    # Proxy com autenticação (usuario:senha)
    options.add_argument('--proxy-server=http://user:pass@proxy.example.com:8080')
    
    async with Chrome(options=options) as browser:
        tab = await browser.start()
        
        # Autenticação tratada automaticamente!
        await tab.go_to('https://example.com')
        print("Conectado através de proxy autenticado")

asyncio.run(authenticated_proxy_example())
```

!!! tip "Formato das Credenciais"
    Inclua as credenciais diretamente na URL do proxy:

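    - HTTP: `http://username:password@host:port`
    - HTTPS: `https://username:password@host:port`
    - SOCKS5: `socks5://username:password@host:port` (o Chrome ignora essas credenciais; veja o aviso sobre a limitação do SOCKS5 logo abaixo)

    O Pydoll extrai e usa automaticamente essas credenciais para proxies HTTP e HTTPS.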

!!! warning "Limitação da Autenticação SOCKS5"
    **O Chrome não suporta autenticação SOCKS5 nativamente** ([Chromium Issue #40323993](https://issues.chromium.org/issues/40323993)). Credenciais incorporadas em `socks5://user:pass@host:port` são silenciosamente ignoradas — o Chrome envia apenas uma saudação "sem autenticação" para o proxy SOCKS5.

    Isso significa que a autenticação automática de proxy do Pydoll (via `Fetch.authRequired`) **não funciona para SOCKS5**, pois o Chrome nunca emite um desafio HTTP 407 para conexões SOCKS5.

    **Solução — Proxy forwarder local:**

    Execute um proxy SOCKS5 local (sem autenticação) que encaminha para o proxy autenticado remoto. O Pydoll fornece um script pronto para uso:

    ```python
    import asyncio
    from pydoll.utils import SOCKS5Forwarder
    from pydoll.browser.chromium import Chrome
    from pydoll.browser.options import ChromiumOptions

    async def main():
        forwarder = SOCKS5Forwarder(
            remote_host='proxy.example.com',
            remote_port=1080,
            username='myuser',
            password='mypass',
            local_port=1081,
        )
        async with forwarder:
            options = ChromiumOptions()
            options.add_argument('--proxy-server=socks5://127.0.0.1:1081')

            async with Chrome(options=options) as browser:
                tab = await browser.start()
                await tab.go_to('https://httpbin.org/ip')

    asyncio.run(main())
    ```

    O forwarder realiza o handshake de usuário/senha com o proxy remoto enquanto o Chrome se conecta ao localhost sem autenticação.

    Para a explicação técnica completa de por que isso acontece, veja **[Análise Profunda da Autenticação SOCKS5](../../deep-dive/network/socks-proxies.md#autenticacao-socks5-e-chrome)**.

### Detalhes da Implementação da Autenticação

O Pydoll usa o **domínio Fetch** do Chrome no nível do navegador para interceptar e lidar com desafios de autenticação:

```python
# Isso é tratado internamente pelo Pydoll
# Você não precisa escrever este código!

async def _handle_proxy_auth(event):
    """Manipulador interno de autenticação de proxy do Pydoll."""
    if event['params']['authChallenge']['source'] == 'Proxy':
        await browser.continue_request_with_auth(
            request_id=event['params']['requestId'],
            username='user',
            password='pass'
        )
```

!!! info "Nos Bastidores"
    Para detalhes técnicos sobre como o Pydoll intercepta e lida com a autenticação de proxy, veja:
    
    - **[Interceptação de Requisições](../network/interception.md)** - Domínio Fetch e manipulação de requisições
    - **[Sistema de Eventos](../advanced/event-system.md)** - Autenticação orientada a eventos

!!! warning "Conflitos do Domínio Fetch"
    Ao usar **proxies autenticados** + **interceptação de requisições no nível da aba**, esteja ciente:
    
    - O Pydoll habilita o Fetch no **Nível do Navegador** para autenticação de proxy
    - Se você habilitar o Fetch no **Nível da Aba**, eles compartilham o mesmo domínio
    - **Solução**: Chame `tab.go_to()` uma vez antes de habilitar a interceptação no nível da aba
    
    ```python
    async with Chrome(options=options) as browser:
        tab = await browser.start()
        
        # 1. Primeira navegação dispara autenticação do proxy (Fetch Nível Navegador)
        await tab.go_to('https://example.com')
        
        # 2. Então habilite a interceptação no nível da aba com segurança
        await tab.enable_fetch_events()
        await tab.on('Fetch.requestPaused', my_interceptor)
        
        # 3. Continue com sua automação
        await tab.go_to('https://example.com/page2')
    ```
    
    Veja [Interceptação de Requisição - Proxy + Interceptação](../network/interception.md#private-proxy-request-interception-fetch) para detalhes.

## Lista de Bypass de Proxy

Exclua domínios específicos de usar o proxy:

```python
import asyncio
from pydoll.browser.chromium import Chrome
from pydoll.browser.options import ChromiumOptions

async def proxy_bypass_example():
    options = ChromiumOptions()
    
    # Usar proxy para a maior parte do tráfego
    options.add_argument('--proxy-server=http://proxy.example.com:8080')
    
    # Mas ignorar o proxy para estes domínios
    options.add_argument('--proxy-bypass-list=localhost,127.0.0.1,*.local,internal.company.com')
    
    async with Chrome(options=options) as browser:
        tab = await browser.start()
        
        # Usa proxy
        await tab.go_to('https://external-site.com')
        
        # Ignora o proxy (conexão direta)
        await tab.go_to('http://localhost:8000')
        await tab.go_to('http://internal.company.com')

asyncio.run(proxy_bypass_example())
```

**Padrões da lista de bypass:**

| Padrão | Corresponde a | Exemplo |
|---|---|---|
| `localhost` | Apenas Localhost | `http://localhost` |
| `127.0.0.1` | IP de Loopback | `http://127.0.0.1` |
| `*.local` | Todos os domínios `.local` | `http://server.local` |
| `internal.company.com` | Domínio específico | `http://internal.company.com` |
| `192.168.1.*` | Faixa de IP | `http://192.168.1.100` |

!!! tip "Quando Usar a Lista de Bypass"
    Ignore o proxy para:
    
    - **Servidores de desenvolvimento local** (`localhost`, `127.0.0.1`)
    - **Recursos internos da empresa** (VPN, intranet)
    - **Ambientes de teste** (domínios `.local`, `.test`)
    - **Recursos de alta largura de banda** (quando o proxy é lento)

## PAC (Proxy Auto-Config)

Use um arquivo PAC para regras complexas de roteamento de proxy:

```python
import asyncio
from pydoll.browser.chromium import Chrome
from pydoll.browser.options import ChromiumOptions

async def pac_proxy_example():
    options = ChromiumOptions()
    
    # Carregar arquivo PAC de uma URL
    options.add_argument('--proxy-pac-url=http://proxy.example.com/proxy.pac')
    
    # Ou usar arquivo PAC local
    # options.add_argument('--proxy-pac-url=file:///path/to/proxy.pac')
    
    async with Chrome(options=options) as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com')

asyncio.run(pac_proxy_example())
```

**Exemplo de arquivo PAC:**

```javascript
function FindProxyForURL(url, host) {
    // Conexão direta para endereços locais
    if (isInNet(host, "192.168.0.0", "255.255.0.0") ||
        isInNet(host, "127.0.0.0", "255.0.0.0")) {
        return "DIRECT";
    }
    
    // Usar proxy específico para certos domínios
    if (dnsDomainIs(host, ".example.com")) {
        return "PROXY proxy1.example.com:8080";
    }
    
    // Proxy padrão para todo o resto
    return "PROXY proxy2.example.com:8080";
}
```

!!! info "Casos de Uso de Arquivo PAC"
    Arquivos PAC são úteis para:
    
    - **Regras de roteamento complexas** (baseadas em domínio, IP)
    - **Failover de proxy** (tentar múltiplos proxies)
    - **Balanceamento de carga** (distribuir entre pool de proxies)
    - **Ambientes corporativos** (gerenciamento centralizado de proxy)

## Rotação de Proxies

Rotacione entre múltiplos proxies para melhor distribuição:

```python
import asyncio
from itertools import cycle
from pydoll.browser.chromium import Chrome
from pydoll.browser.options import ChromiumOptions

async def rotating_proxy_example():
    # Lista de proxies
    proxies = [
        'http://user:pass@proxy1.example.com:8080',
        'http://user:pass@proxy2.example.com:8080',
        'http://user:pass@proxy3.example.com:8080',
    ]
    
    # Alternar entre os proxies
    proxy_pool = cycle(proxies)
    
    # Raspar múltiplas URLs com diferentes proxies
    urls = [
        'https://example.com/page1',
        'https://example.com/page2',
        'https://example.com/page3',
    ]
    
    for url in urls:
        # Obter próximo proxy
        proxy = next(proxy_pool)
        
        # Configurar opções com este proxy
        options = ChromiumOptions()
        options.add_argument(f'--proxy-server={proxy}')
        
        # Usar proxy para esta instância do navegador
        async with Chrome(options=options) as browser:
            tab = await browser.start()
            await tab.go_to(url)
            
            title = await tab.execute_script('return document.title')
            print(f"[{proxy.split('@')[1]}] {url}: {title}")

asyncio.run(rotating_proxy_example())
```

!!! tip "Estratégias de Rotação de Proxy"
    **Rotação por navegador** (acima):

    - Cada instância do navegador usa um proxy diferente
    - Melhor para isolamento e evitar conflitos de sessão
    
    **Rotação por requisição**:

    - Mais complexo, requer interceptação de requisições
    - Veja [Interceptação de Requisições](../network/interception.md) para implementação

## Proxies Residenciais vs Datacenter

Entender os tipos de proxy ajuda a escolher o serviço certo:

| Característica | Residenciais | Datacenter |
|---|---|---|
| **Fonte do IP** | ISPs residenciais reais | Data centers |
| **Legitimidade** | Alta (usuários reais) | Baixa (faixas conhecidas) |
| **Risco de Detecção** | Muito baixo | Alto |
| **Velocidade** | Média (150-500ms) | Muito rápida (<50ms) |
| **Custo** | Caro ($5-15/GB) | Barato ($0.10-1/GB) |
| **Melhor Para** | Sites anti-bot, e-commerce | APIs, ferramentas internas |

### Proxies Residenciais

```python
import asyncio
from pydoll.browser.chromium import Chrome
from pydoll.browser.options import ChromiumOptions

async def residential_proxy_example():
    """Usar proxy residencial para sites anti-bot."""
    options = ChromiumOptions()
    
    # Proxy residencial com alta pontuação de confiança
    options.add_argument('--proxy-server=http://user:pass@residential.proxy.com:8080')
    
    # Combinar com opções de furtividade
    options.add_argument('--disable-blink-features=AutomationControlled')
    options.add_argument('--user-agent=Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/130.0.0.0 Safari/537.36')
    
    async with Chrome(options=options) as browser:
        tab = await browser.start()
        
        # Acessar site protegido
        await tab.go_to('https://protected-site.com')
        print("Acessado com sucesso através de proxy residencial")

asyncio.run(residential_proxy_example())
```

**Quando usar Residenciais:**

- Sites com forte proteção anti-bot (Cloudflare, DataDome)
- Raspagem de e-commerce (Amazon, eBay, etc.)
- Automação de mídias sociais
- Serviços financeiros
- Qualquer site que bloqueia ativamente IPs de datacenter

### Proxies Datacenter

```python
import asyncio
from pydoll.browser.chromium import Chrome
from pydoll.browser.options import ChromiumOptions

async def datacenter_proxy_example():
    """Usar proxy datacenter rápido para APIs e sites não protegidos."""
    options = ChromiumOptions()
    
    # Proxy datacenter rápido
    options.add_argument('--proxy-server=http://user:pass@datacenter.proxy.com:8080')
    
    async with Chrome(options=options) as browser:
        tab = await browser.start()
        
        # Raspagem rápida de API
        await tab.go_to('https://api.example.com/data')

asyncio.run(datacenter_proxy_example())
```

**Quando usar Datacenter:**

- APIs públicas sem limites de requisição
- Automação interna/corporativa
- Sites sem medidas anti-bot
- Raspagem de alto volume em que a velocidade é crítica
- Desenvolvimento e testes

!!! warning "A Qualidade do Proxy Importa"
    **Proxies ruins** causam mais problemas do que resolvem:
    
    - Tempos de resposta lentos (timeouts)
    - Falhas de conexão (taxas de erro)
    - IPs em lista negra (banimentos imediatos)
    - Vazamento do IP real (violação de privacidade)
    
    **Invista em proxies de qualidade** de provedores respeitáveis. Proxies gratuitos quase nunca valem a pena.

## Testando Seu Proxy

Verifique a configuração do proxy antes de rodar a automação em produção:

```python
import asyncio
from pydoll.browser.chromium import Chrome
from pydoll.browser.options import ChromiumOptions

async def test_proxy():
    """Testar conexão e configuração do proxy."""
    proxy_url = 'http://user:pass@proxy.example.com:8080'
    
    options = ChromiumOptions()
    options.add_argument(f'--proxy-server={proxy_url}')
    
    try:
        async with Chrome(options=options) as browser:
            tab = await browser.start()
            
            # Teste 1: Conexão
            print("Testando conexão do proxy...")
            await tab.go_to('https://httpbin.org/ip', timeout=10)
            
            # Teste 2: Verificação de IP
            print("Verificando IP do proxy...")
            ip_response = await tab.execute_script('return document.body.textContent')
            print(f"[OK] IP do Proxy: {ip_response}")
            
            # Teste 3: Localização geográfica (se disponível)
            await tab.go_to('https://ipapi.co/json/')
            geo_data = await tab.execute_script('return document.body.textContent')
            print(f"[OK] Dados geográficos: {geo_data}")
            
            # Teste 4: Teste de velocidade
            import time
            start = time.time()
            await tab.go_to('https://example.com')
            load_time = time.time() - start
            print(f"[OK] Tempo de carregamento: {load_time:.2f}s")
            
            if load_time > 5:
                print("[AVISO] Tempo de resposta do proxy lento")
            
            print("\n[SUCESSO] Todos os testes de proxy passaram!")
            
    except asyncio.TimeoutError:
        print("[ERRO] Timeout na conexão do proxy")
    except Exception as e:
        print(f"[ERRO] Teste de proxy falhou: {e}")

asyncio.run(test_proxy())
```

## Leitura Adicional

- **[Análise Profunda da Arquitetura de Proxy](../../deep-dive/proxy-architecture.md)** - Fundamentos de rede, TCP/UDP, HTTP/2/3, internos do SOCKS5, análise de segurança e construção do seu próprio servidor proxy
- **[Opções do Navegador](browser-options.md)** - Argumentos de linha de comando e configuração
- **[Interceptação de Requisições](../network/interception.md)** - Como a autenticação de proxy funciona
- **[Preferências do Navegador](browser-preferences.md)** - Furtividade e fingerprinting
- **[Contextos](../browser-management/contexts.md)** - Usando diferentes proxies por contexto

!!! tip "Comece Simples"
    Comece com uma configuração de proxy simples, teste exaustivamente, depois adicione complexidade (rotação, lógica de retentativa, monitoramento) conforme necessário. Proxies de qualidade são mais importantes do que estratégias complexas de rotação.
    
    Para aqueles interessados em entender proxies em um nível mais profundo, a **[Análise Profunda da Arquitetura de Proxy](../../deep-dive/proxy-architecture.md)** fornece cobertura abrangente de protocolos de rede, considerações de segurança e até um guia para a construção do seu próprio servidor proxy.

================================================
FILE: docs/pt/features/core-concepts.md
================================================
# Conceitos Principais

Entender o que torna o Pydoll diferente começa com suas decisões fundamentais de design. Estas não são apenas escolhas técnicas; elas impactam diretamente como você escreve scripts de automação, quais problemas você pode resolver e quão confiáveis serão suas soluções.

## Zero WebDrivers

Uma das vantagens mais significativas do Pydoll é a eliminação completa das dependências do WebDriver. Se você já lutou com erros do tipo "a versão do chromedriver não corresponde à versão do Chrome" ou lidou com falhas misteriosas do driver, você apreciará esta abordagem.

### Como Funciona

Ferramentas tradicionais de automação de navegador, como o Selenium, dependem de executáveis WebDriver que atuam como intermediários entre seu código e o navegador. O Pydoll segue um caminho diferente, conectando-se diretamente aos navegadores através do Chrome DevTools Protocol (CDP).

```mermaid
graph LR
    %% Fluxo Pydoll
    subgraph P["Fluxo Pydoll"]
        direction LR
        P1["💻 Seu Código"] --> P2["🪄 Pydoll"]
        P2 --> P3["🌐 Navegador (via CDP)"]
    end

    %% Fluxo Tradicional Selenium
    subgraph S["Fluxo Tradicional Selenium"]
        direction LR
        S1["💻 Seu Código"] --> S2["🔌 Cliente WebDriver"]
        S2 --> S3["⚙️ Executável WebDriver"]
        S3 --> S4["🌐 Navegador"]
    end

```

Quando você inicia um navegador com o Pydoll, é isto que acontece nos bastidores:

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def main():
    # Isso cria uma instância do Navegador
    browser = Chrome()
    
    # start() inicia o Chrome com --remote-debugging-port
    # e estabelece uma conexão WebSocket com o endpoint CDP
    tab = await browser.start()
    
    # Agora você pode controlar o navegador através de comandos CDP
    await tab.go_to('https://example.com')
    
    await browser.stop()

asyncio.run(main())
```

Nos bastidores, `browser.start()` faz o seguinte:

1.  **Inicia o processo do navegador** com a flag `--remote-debugging-port=<porta>`
2.  **Aguarda o servidor CDP** ficar disponível nessa porta
3.  **Estabelece uma conexão WebSocket** com `ws://localhost:<porta>/devtools/...`
4.  **Retorna uma instância de Tab** pronta para automação

!!! info "Quer Saber Mais?"
    Para detalhes técnicos sobre como o processo do navegador é gerenciado internamente, veja a [Análise Profunda do Domínio do Navegador](../../deep-dive/browser-domain.md#browser-process-manager).

### Benefícios que Você Notará

**Sem Dores de Cabeça com Gerenciamento de Versão**
```python
# Com Selenium, você pode ver:
# SessionNotCreatedException: Esta versão do ChromeDriver suporta apenas a versão 120 do Chrome

# Com Pydoll, você só precisa ter o Chrome instalado:
async with Chrome() as browser:
    tab = await browser.start()  # Funciona com qualquer versão do Chrome
```

**Configuração Mais Simples**
```bash
# Configuração Selenium:
$ pip install selenium
$ brew install chromedriver  # ou baixe, chmod +x, adicione ao PATH...
$ chromedriver --version     # corresponde ao seu Chrome?

# Configuração Pydoll:
$ pip install pydoll-python  # É isso!
```

**Mais Confiável**

Sem o WebDriver como camada intermediária, há menos pontos de falha. Seu código se comunica diretamente com o navegador através de um protocolo bem definido que os próprios desenvolvedores do Chromium usam e mantêm.

### CDP: O Protocolo Por Trás da Mágica

O Chrome DevTools Protocol não é apenas para o Pydoll; é o mesmo protocolo que alimenta o Chrome DevTools quando você abre o inspetor. Isso significa:

- **Confiabilidade testada em batalha**: Usado por milhões de desenvolvedores diariamente
- **Capacidades ricas**: Tudo o que o DevTools pode fazer, o Pydoll pode fazer
- **Desenvolvimento ativo**: O Google mantém e evolui o CDP continuamente

!!! tip "Análise Profunda: Entendendo o CDP"
    Para uma compreensão abrangente de como o CDP funciona e por que ele é superior ao WebDriver, veja nossa [Análise Profunda do Chrome DevTools Protocol](../../deep-dive/cdp.md).

## Arquitetura Async-First (Prioritariamente Assíncrona)

O Pydoll não é apenas compatível com async; ele foi projetado desde o início para alavancar o framework `asyncio` do Python. Isso não é uma funcionalidade superficial; é fundamental para como o Pydoll alcança alto desempenho.

!!! info "Novo na Programação Assíncrona?"
    Se você não está familiarizado com a sintaxe `async`/`await` do Python ou conceitos do asyncio, recomendamos fortemente ler nosso guia [Entendendo Async/Await](../../deep-dive/connection-layer.md#understanding-asyncawait) primeiro. Ele explica os fundamentos com exemplos práticos que o ajudarão a entender como a arquitetura assíncrona do Pydoll funciona e por que ela é tão poderosa para automação de navegador.

### Por que Async é Importante para Automação de Navegador

A automação de navegador envolve muita espera: páginas carregando, elementos aparecendo, requisições de rede completando. Ferramentas síncronas tradicionais desperdiçam tempo de CPU durante essas esperas. A arquitetura assíncrona permite que você faça trabalho útil enquanto espera.

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def scrape_page(browser, url):
    """Raspar uma única página."""
    tab = await browser.new_tab()
    await tab.go_to(url)
    title = await tab.execute_script('return document.title')
    await tab.close()
    return title

async def main():
    urls = [
        'https://example.com/page1',
        'https://example.com/page2',
        'https://example.com/page3',
    ]
    
    async with Chrome() as browser:
        await browser.start()
        
        # Processar todas as URLs concorrentemente!
        titles = await asyncio.gather(
            *(scrape_page(browser, url) for url in urls)
        )
        
        print(titles)

asyncio.run(main())
```

Neste exemplo, em vez de raspar as páginas uma após a outra (o que poderia levar 3 × 2 segundos = 6 segundos), todas as três páginas são raspadas concorrentemente, levando aproximadamente 2 segundos no total.

### Concorrência Verdadeira vs Threading

Diferente de abordagens baseadas em threading, a arquitetura assíncrona do Pydoll fornece execução concorrente verdadeira sem a complexidade do gerenciamento de threads:

```mermaid
sequenceDiagram
    participant Main as Tarefa Principal
    participant Tab1 as Aba 1
    participant Tab2 as Aba 2
    participant Tab3 as Aba 3
    
    Main->>Tab1: go_to(url1)
    Main->>Tab2: go_to(url2)
    Main->>Tab3: go_to(url3)
    
    Note over Tab1,Tab3: Todas as abas navegam concorrentemente
    
    Tab1-->>Main: Página 1 carregada
    Tab2-->>Main: Página 2 carregada
    Tab3-->>Main: Página 3 carregada
    
    Main->>Main: Processar resultados
```

### Padrões Modernos do Python

O Pydoll adota construções idiomáticas modernas do Python em toda a sua estrutura:

**Gerenciadores de Contexto**
```python
# Limpeza automática de recursos
async with Chrome() as browser:
    tab = await browser.start()
    # ... fazer trabalho ...
# O navegador é automaticamente parado ao sair do contexto
```

**Iteradores Assíncronos**
```python
# Receber eventos de rede à medida que ocorrem
await tab.enable_network_events()

async for event in tab.network_event_stream():
    if 'api' in event['params']['request']['url']:
        print(f"Chamada de API detectada: {event['params']['request']['url']}")
```

**Gerenciadores de Contexto Assíncronos para Operações**
```python
# Esperar e lidar com downloads
async with tab.expect_download(keep_file_at='/downloads') as dl:
    await (await tab.find(text='Download PDF')).click()
    pdf_data = await dl.read_bytes()
```

!!! tip "Análise Profunda"
    Quer entender como as operações assíncronas funcionam internamente? Confira a [Análise Profunda da Camada de Conexão](../../deep-dive/connection-layer.md) para detalhes de implementação.

### Implicações de Desempenho

O design "async-first" oferece melhorias mensuráveis de desempenho:

```python
import asyncio
import time
from pydoll.browser.chromium import Chrome

async def benchmark_concurrent():
    """Raspar 10 páginas concorrentemente."""
    async with Chrome() as browser:
        await browser.start()
        
        start = time.time()
        tasks = [
            browser.new_tab(f'https://example.com/page{i}')
            for i in range(10)
        ]
        await asyncio.gather(*tasks)
        elapsed = time.time() - start
        
        print(f"10 páginas carregadas em {elapsed:.2f}s")
        # Resultado típico: ~2-3 segundos vs 20+ segundos sequencialmente

asyncio.run(benchmark_concurrent())
```

## Suporte a Múltiplos Navegadores

O Pydoll fornece uma API unificada em todos os navegadores baseados em Chromium. Escreva sua automação uma vez, execute-a em qualquer lugar.

### Navegadores Suportados

**Google Chrome**: Alvo principal com suporte completo a funcionalidades.
```python
from pydoll.browser.chromium import Chrome

async with Chrome() as browser:
    tab = await browser.start()
```

**Microsoft Edge**: Suporte completo, incluindo funcionalidades específicas do Edge.
```python
from pydoll.browser.chromium import Edge

async with Edge() as browser:
    tab = await browser.start()
```

**Outros Navegadores Chromium**: Brave, Vivaldi, Opera, etc.
```python
from pydoll.browser.chromium import Chrome
from pydoll.browser.options import ChromiumOptions

options = ChromiumOptions()
options.binary_location = '/path/to/brave-browser'  # ou qualquer navegador Chromium

async with Chrome(options=options) as browser:
    tab = await browser.start()
```

O principal benefício: todos os navegadores baseados em Chromium compartilham a mesma API. Escreva sua automação uma vez, e ela funciona no Chrome, Edge, Brave ou qualquer outro navegador Chromium sem alterações de código.

### Testes Cross-Browser

Teste sua automação em múltiplos navegadores sem alterar o código:

```python
import asyncio
from pydoll.browser.chromium import Chrome, Edge

async def test_login(browser_class, browser_name):
    """Testar fluxo de login em um navegador específico."""
    async with browser_class() as browser:
        tab = await browser.start()
        await tab.go_to('https://app.example.com/login')
        
        await (await tab.find(id='username')).type_text('user@example.com')
        await (await tab.find(id='password')).type_text('password123')
        await (await tab.find(id='login-btn')).click()
        
        # Verificar sucesso do login
        success = await tab.find(id='dashboard', raise_exc=False)
        print(f"{browser_name} login: {'✓' if success else '✗'}")

async def main():
    # Testar tanto no Chrome quanto no Edge
    await test_login(Chrome, "Chrome")
    await test_login(Edge, "Edge")

asyncio.run(main())
```

## Comportamento Semelhante ao Humano

Navegadores automatizados são frequentemente detectáveis porque se comportam de forma robótica. O Pydoll inclui funcionalidades nativas para fazer as interações parecerem mais humanas.

### Digitação Natural

Usuários reais não digitam em velocidades perfeitamente consistentes. O método `type_text()` do Pydoll inclui atrasos aleatórios entre as teclas:

```python
# Digitar com tempo semelhante ao humano
username_field = await tab.find(id='username')
await username_field.type_text(
    'user@example.com',
    interval=0.1  # Média de 100ms entre teclas, com aleatoriedade
)

# Digitação mais rápida (ainda semelhante à humana)
await username_field.type_text(
    'user@example.com',
    interval=0.05  # Mais rápido, mas ainda varia
)

# Instantâneo (robótico; use apenas quando a velocidade importa mais que a furtividade)
await username_field.type_text(
    'user@example.com',
    interval=0
)
```

O parâmetro `interval` define o atraso médio, mas o Pydoll adiciona variação aleatória para tornar o tempo mais natural.

### Cliques Realistas

Cliques não são apenas "disparar e esquecer". O Pydoll automaticamente dispara todos os eventos de mouse que um usuário real dispararia:

```python
button = await tab.find(id='submit-button')

# Comportamento padrão: clica no centro do elemento
# Dispara automaticamente: mouseover, mouseenter, mousemove, mousedown, mouseup, click
await button.click()

# Clique com deslocamento (útil para evitar detecção em elementos maiores)
await button.click(offset_x=10, offset_y=5)
```

!!! info "Eventos do Mouse"
    O Pydoll dispara a sequência completa de eventos do mouse na ordem correta, simulando como navegadores reais lidam com cliques de usuários. Isso torna os cliques mais realistas em comparação com simples chamadas JavaScript `.click()`.

!!! warning "Considerações sobre Detecção"
    Embora o comportamento semelhante ao humano ajude a evitar a detecção básica de bots, sistemas anti-automação sofisticados usam muitos sinais. Combine essas funcionalidades com:
    
    - Fingerprints de navegador realistas (via preferências do navegador)
    - Configuração adequada de proxy
    - Atrasos razoáveis entre ações
    - Padrões de navegação variados

## Design Orientado a Eventos

Diferente da automação tradicional baseada em polling (verificação periódica), o Pydoll permite que você reaja a eventos do navegador assim que eles acontecem. Isso é mais eficiente e possibilita padrões de interação sofisticados.

### Monitoramento de Eventos em Tempo Real

Inscreva-se em eventos do navegador e execute callbacks quando eles dispararem:

```python
import asyncio
from functools import partial
from pydoll.browser.chromium import Chrome
from pydoll.protocol.page.events import PageEvent
from pydoll.protocol.network.events import NetworkEvent

async def main():
    async with Chrome() as browser:
        tab = await browser.start()
        
        # Reagir a eventos de carregamento de página
        async def on_page_load(event):
            print(f"Página carregada: {await tab.current_url}")
        
        await tab.enable_page_events()
        await tab.on(PageEvent.LOAD_EVENT_FIRED, on_page_load)
        
        # Monitorar requisições de rede
        async def on_request(tab, event):
            url = event['params']['request']['url']
            if '/api/' in url:
                print(f"Chamada de API: {url}")
        
        await tab.enable_network_events()
        await tab.on(NetworkEvent.REQUEST_WILL_BE_SENT, partial(on_request, tab))
        
        # Navegar e observar os eventos dispararem
        await tab.go_to('https://example.com')
        await asyncio.sleep(3)  # Deixar os eventos processarem

asyncio.run(main())
```

### Categorias de Eventos

O Pydoll expõe vários domínios de eventos CDP nos quais você pode se inscrever:

| Domínio | Eventos de Exemplo |
|---|---|
| **Eventos de Página** | Carregamento concluído, navegação, diálogos JavaScript |
| **Eventos de Rede** | Requisição enviada, resposta recebida, atividade WebSocket |
| **Eventos DOM** | Mudanças no DOM, modificações de atributos |
| **Eventos Fetch** | Requisição pausada, autenticação necessária |
| **Eventos de Runtime** | Mensagens do console, exceções |

### Padrões Práticos Orientados a Eventos

**Capturar Respostas de API**
```python
import json
from functools import partial
from pydoll.protocol.network.events import NetworkEvent

api_data = []

async def capture_api(tab, event):
    url = event['params']['response']['url']
    if '/api/data' in url:
        request_id = event['params']['requestId']
        body = await tab.get_network_response_body(request_id)
        api_data.append(json.loads(body))

await tab.enable_network_events()
await tab.on(NetworkEvent.RESPONSE_RECEIVED, partial(capture_api, tab))

# Navegar e capturar automaticamente as respostas da API
await tab.go_to('https://app.example.com')
await asyncio.sleep(2)

print(f"Capturadas {len(api_data)} respostas de API")
```

**Esperar por Condições Específicas**
```python
import asyncio
from functools import partial
from pydoll.protocol.network.events import NetworkEvent

async def wait_for_api_call(tab, endpoint):
    """Esperar por uma chamada de endpoint de API específica."""
    event_occurred = asyncio.Event()
    
    async def check_endpoint(tab, event):
        url = event['params']['request']['url']
        if endpoint in url:
            event_occurred.set()
    
    await tab.enable_network_events()
    callback_id = await tab.on(
        NetworkEvent.REQUEST_WILL_BE_SENT,
        partial(check_endpoint, tab),
        temporary=True  # Remover automaticamente após o primeiro disparo
    )

    await event_occurred.wait()
    print(f"Endpoint de API {endpoint} foi chamado!")

# Uso
await wait_for_api_call(tab, '/api/users')
```

!!! info "Análise Profunda: Detalhes do Sistema de Eventos"
    Para um guia completo sobre tratamento de eventos, padrões de callback e considerações de desempenho, veja a [Análise Profunda do Sistema de Eventos](../../deep-dive/event-system.md).

### Desempenho de Eventos

Eventos são poderosos, mas vêm com uma sobrecarga. Melhores práticas:

```python
# ✓ Bom: Habilitar apenas o que você precisa
await tab.enable_network_events()

# ✗ Evite: Habilitar todos os eventos desnecessariamente
await tab.enable_page_events()
await tab.enable_network_events()
await tab.enable_dom_events()
await tab.enable_fetch_events()
await tab.enable_runtime_events()

# ✓ Bom: Filtrar cedo nos callbacks
async def handle_request(event):
    url = event['params']['request']['url']
    if '/api/' not in url:
        return  # Pular requisições não-API cedo
    # Processar requisição de API...

# ✓ Bom: Desabilitar quando terminar
await tab.disable_network_events()
```

## Juntando Tudo

Esses conceitos principais trabalham juntos para criar um framework de automação poderoso:

```python
import asyncio
import json
from functools import partial
from pydoll.browser.chromium import Chrome
from pydoll.protocol.network.events import NetworkEvent
from pydoll.constants import Keys

async def advanced_scraping():
    """Demonstra múltiplos conceitos principais trabalhando juntos."""
    async with Chrome() as browser:  # Gerenciador de contexto assíncrono
        tab = await browser.start()
        
        # Orientado a eventos: Capturar dados de API
        api_responses = []
        
        async def capture_data(tab, event):
            url = event['params']['response']['url']
            if '/api/products' in url:
                request_id = event['params']['requestId']
                body = await tab.get_network_response_body(request_id)
                api_responses.append(json.loads(body))
        
        await tab.enable_network_events()
        await tab.on(NetworkEvent.RESPONSE_RECEIVED, partial(capture_data, tab))
        
        # Navegar com simplicidade zero-webdriver
        await tab.go_to('https://example.com/products')
        
        # Interação semelhante à humana
        search = await tab.find(id='search')
        await search.type_text('laptop', interval=0.1)  # Digitação natural
        await search.press_keyboard_key(Keys.ENTER)
        
        # Esperar por respostas da API (eficiência assíncrona)
        await asyncio.sleep(2)
        
        print(f"Capturados {len(api_responses)} produtos da API")
        return api_responses

# Suporte a múltiplos navegadores: funciona com Chrome, Edge, etc.
asyncio.run(advanced_scraping())
```

Esses conceitos fundamentais fundamentam todo o resto no Pydoll. À medida que você explora funcionalidades específicas, verá esses princípios em ação, trabalhando juntos para criar automação de navegador confiável, eficiente e sustentável.

---

## O Que Vem a Seguir?

Agora que você entende o design principal do Pydoll, está pronto para explorar funcionalidades específicas:

- **[Localização de Elementos](element-finding.md)** - Aprenda as APIs intuitivas de localização de elementos do Pydoll
- **[Funcionalidades de Rede](../network/monitoring.md)** - Aproveite o sistema de eventos para análise de rede
- **[Gerenciamento do Navegador](../browser-management/tabs.md)** - Use padrões assíncronos para operações concorrentes

Para um entendimento técnico mais profundo, explore a seção [Análise Profunda](../../deep-dive/index.md).

================================================
FILE: docs/pt/features/element-finding.md
================================================
# Localização de Elementos

Encontrar elementos em uma página web é a base da automação de navegadores. O Pydoll introduz uma abordagem revolucionária e intuitiva que torna a localização de elementos mais poderosa e fácil de usar do que os métodos tradicionais baseados em seletores.

## Por que a Abordagem do Pydoll é Diferente

Ferramentas tradicionais de automação de navegador forçam você a pensar em termos de seletores CSS e expressões XPath desde o início. O Pydoll inverte isso: você descreve o que está procurando usando atributos HTML naturais, e o Pydoll descobre a estratégia de seletor ideal.

```python
# Abordagem tradicional (outras ferramentas)
element = driver.find_element(By.XPATH, "//input[@type='email' and @name='username']")

# Abordagem do Pydoll
element = await tab.find(tag_name="input", type="email", name="username")
```

Ambos encontram o mesmo elemento, mas a sintaxe do Pydoll é mais clara, mais fácil de manter e menos propensa a erros.

### Visão Geral dos Métodos de Localização de Elementos

O Pydoll oferece três abordagens principais para encontrar elementos:

| Método | Usar Quando | Exemplo |
|---|---|---|
| **`find()`** | Você conhece os atributos HTML | `await tab.find(id="username")` |
| **`query()`** | Você tem um seletor CSS/XPath | `await tab.query("div.content")` |
| **Travessia** | Você quer explorar a partir de um elemento conhecido | `await element.get_children_elements()` |

```mermaid
flowchart LR
    A["Precisa de Elemento?"] --> B{"O que você tem?"};
    B -->|"Atributos HTML"| C["Método find()"];
    B -->|"CSS/XPath"| D["Método query()"];
    B -->|"Elemento Pai"| E["Travessia"];
    
    C --> F["WebElement"];
    D --> F;
    E --> G["Lista de WebElements"];
```

!!! info "Análise Profunda: Como Funciona"
    Curioso sobre como o Pydoll implementa a localização de elementos internamente? Confira a documentação [FindElements Mixin](../deep-dive/find-elements-mixin.md) para aprender sobre a arquitetura, otimizações de desempenho e estratégias internas de seletores.

## O Método find(): Seleção Natural de Elementos

O método `find()` é sua principal ferramenta para localizar elementos. Ele aceita atributos HTML comuns como parâmetros e constrói automaticamente o seletor mais eficiente.

### Uso Básico

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def basic_finding():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com')
        
        # Encontrar por ID (mais comum e mais rápido)
        username = await tab.find(id="username")
        
        # Encontrar por nome de classe
        submit_button = await tab.find(class_name="btn-primary")
        
        # Encontrar por nome de tag
        first_paragraph = await tab.find(tag_name="p")
        
        # Encontrar por atributo name
        email_field = await tab.find(name="email")
        
        # Encontrar por conteúdo de texto
        login_link = await tab.find(text="Login")

asyncio.run(basic_finding())
```

### Combinando Atributos para Precisão

O verdadeiro poder do `find()` vem da combinação de múltiplos atributos para criar seletores precisos:

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def precise_finding():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com/form')
        
        # Combinar nome de tag com tipo
        password_input = await tab.find(tag_name="input", type="password")
        
        # Combinar tag, classe e atributos personalizados
        submit_button = await tab.find(
            tag_name="button",
            class_name="btn",
            type="submit"
        )
        
        # Usar atributos data
        product_card = await tab.find(
            tag_name="div",
            data_testid="product-card",
            data_category="electronics"
        )
        
        # Combinar múltiplas condições
        specific_link = await tab.find(
            tag_name="a",
            class_name="nav-link",
            href="/dashboard"
        )

asyncio.run(precise_finding())
```

!!! info "Lógica de Combinação: E (AND)"
    Combinar atributos no `find()` funciona como uma operação E (AND). O elemento deve corresponder a **todos** os atributos fornecidos.
    
    Para cenários mais complexos que exigem lógica OU (OR) — como encontrar um elemento que pode ter um `id` ou um `name` diferente — a abordagem correta é encadear múltiplas chamadas `find()`, como demonstrado na seção "Exemplo Completo".

!!! tip "Convenção de Nomenclatura de Atributos"
    Use underscores para nomes de atributos com hífens. Por exemplo, `data-testid` se torna `data_testid`, e `aria-label` se torna `aria_label`. O Pydoll os converte automaticamente para o formato correto.

### Como o find() Seleciona a Estratégia Ideal

O Pydoll escolhe automaticamente o seletor mais eficiente com base nos atributos que você fornece:

| Atributos Fornecidos | Estratégia Usada | Desempenho |
|---|---|---|
| Único: `id` | `By.ID` | ⚡ Mais Rápido |
| Único: `class_name` | `By.CLASS_NAME` | ⚡ Rápido |
| Único: `name` | `By.NAME` | ⚡ Rápido |
| Único: `tag_name` | `By.TAG_NAME` | ⚡ Rápido |
| Único: `text` | `By.XPATH` | ⚡ Rápido |
| Múltiplos atributos | Expressão XPath | ✓ Eficiente |

```mermaid
flowchart LR
    A["Atributos do find()"] --> B{"Único ou Múltiplo?"};
    B -->|"Único"| C["Seletor Direto"];
    B -->|"Múltiplo"| D["Construir XPath"];
    C --> E["Execução Rápida"];
    D --> E;
```

### Encontrando Múltiplos Elementos

Use `find_all=True` para obter uma lista de todos os elementos correspondentes:

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def find_multiple():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com/products')
        
        # Encontrar todos os cards de produto
        products = await tab.find(class_name="product-card", find_all=True)
        print(f"Encontrados {len(products)} produtos")
        
        # Encontrar todos os links na navegação
        nav_links = await tab.find(
            tag_name="a",
            class_name="nav-link",
            find_all=True
        )
        
        # Processar cada elemento
        for link in nav_links:
            text = await link.text
            href = await link.get_attribute("href")
            print(f"Link: {text} → {href}")

asyncio.run(find_multiple())
```

### Esperando por Elementos Dinâmicos

Aplicações web modernas carregam conteúdo dinamicamente. Use `timeout` para esperar que os elementos apareçam:

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def wait_for_elements():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com/dashboard')
        
        # Esperar até 10 segundos pelo elemento aparecer
        dynamic_content = await tab.find(
            class_name="dynamic-content",
            timeout=10
        )
        
        # Esperar por dados carregados via AJAX
        user_profile = await tab.find(
            id="user-profile",
            timeout=15
        )
        
        # Lidar com elementos que podem não aparecer
        optional_banner = await tab.find(
            class_name="promo-banner",
            timeout=3,
            raise_exc=False  # Retorna None se não encontrado
        )
        
        if optional_banner:
            await optional_banner.click()
        else:
            print("Nenhum banner promocional presente")

asyncio.run(wait_for_elements())
```

!!! warning "Melhores Práticas de Timeout"
    Use valores de timeout razoáveis. Muito curtos e você perderá elementos de carregamento lento; muito longos e você desperdiçará tempo esperando por elementos que não existem. Comece com 5-10 segundos para a maioria dos conteúdos dinâmicos.

## O Método query(): Acesso Direto a Seletores

Para desenvolvedores que preferem seletores tradicionais ou precisam de lógicas de seleção mais complexas, o método `query()` fornece acesso direto a seletores CSS e expressões XPath.

### Seletores CSS

Seletores CSS são rápidos, amplamente compreendidos e perfeitos para a maioria dos casos de uso:

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def css_selector_examples():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com')
        
        # Seletores simples
        main_nav = await tab.query("nav.main-menu")
        first_article = await tab.query("article:first-child")
        
        # Seletores de atributo
        submit_button = await tab.query("button[type='submit']")
        required_inputs = await tab.query("input[required]", find_all=True)
        
        # Seletores complexos
        nested = await tab.query("div.container > .content .item:nth-child(2)")
        
        # Pseudo-classes
        first_enabled_button = await tab.query("button:not([disabled])")

asyncio.run(css_selector_examples())
```

### Expressões XPath

XPath se destaca em relações complexas e correspondência de texto:

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def xpath_examples():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com/table')
        
        # Correspondência de texto
        button = await tab.query("//button[contains(text(), 'Submit')]")
        
        # Navegar para o pai
        input_parent = await tab.query("//input[@name='email']/parent::div")
        
        # Encontrar elementos irmãos
        label_input = await tab.query(
            "//label[text()='Email:']/following-sibling::input"
        )
        
        # Consultas complexas de tabela
        edit_button = await tab.query(
            "//tr[td[text()='John Doe']]//button[@class='btn-edit']"
        )

asyncio.run(xpath_examples())
```

!!! info "CSS vs XPath: Qual Usar?"
    Para um guia completo sobre como escolher entre seletores CSS e XPath, incluindo referências de sintaxe e exemplos do mundo real, veja o [Guia de Seletores](../deep-dive/selectors-guide.md).

## Travessia do DOM: Filhos e Irmãos

Às vezes, você precisa explorar a árvore DOM a partir de um ponto de partida conhecido. O Pydoll fornece métodos dedicados para atravessar relações entre elementos.

### Estrutura da Árvore DOM

Entender a estrutura da árvore DOM ajuda a escolher o método de travessia correto:

```mermaid
graph TB
    Root[Raiz do Documento]
    Root --> Container[div id='container']
    
    Container --> Child1[div class='card']
    Container --> Child2[div class='card']
    Container --> Child3[div class='card']
    
    Child1 --> GrandChild1[h2 title]
    Child1 --> GrandChild2[p description]
    Child1 --> GrandChild3[button action]
    
    Child2 --> GrandChild4[h2 title]
    Child2 --> GrandChild5[p description]
    
    Child3 --> GrandChild6[h2 title]
```

### Obtendo Elementos Filhos

O método `get_children_elements()` recupera descendentes de um elemento:

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def traverse_children():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com/cards')
        
        # Obter contêiner
        container = await tab.find(id="cards-container")
        
        # Obter apenas filhos diretos (max_depth=1)
        direct_children = await container.get_children_elements(max_depth=1)
        print(f"Contêiner tem {len(direct_children)} filhos diretos")
        
        # Incluir netos (max_depth=2)
        descendants = await container.get_children_elements(max_depth=2)
        print(f"Encontrados {len(descendants)} elementos até 2 níveis de profundidade")
        
        # Filtrar por nome de tag
        links = await container.get_children_elements(
            max_depth=3,
            tag_filter=["a"]
        )
        print(f"Encontrados {len(links)} links no contêiner")
        
        # Combinar filtros para elementos específicos
        nav_links = await container.get_children_elements(
            max_depth=2,
            tag_filter=["a", "button"]
        )

asyncio.run(traverse_children())
```

### Obtendo Elementos Irmãos

O método `get_siblings_elements()` encontra elementos no mesmo nível:

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def traverse_siblings():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com/list')
        
        # Encontrar item ativo
        active_item = await tab.find(class_name="item-active")
        
        # Obter todos os irmãos (excluindo o próprio active_item)
        all_siblings = await active_item.get_siblings_elements()
        print(f"Item ativo tem {len(all_siblings)} irmãos")
        
        # Filtrar irmãos por tag
        link_siblings = await active_item.get_siblings_elements(
            tag_filter=["a"]
        )
        
        # Processar elementos irmãos
        for sibling in all_siblings:
            text = await sibling.text
            print(f"Irmão: {text}")

asyncio.run(traverse_siblings())
```

!!! tip "Considerações de Desempenho"
    A travessia do DOM pode ser cara para árvores grandes. Prefira valores `max_depth` rasos e parâmetros `tag_filter` específicos para minimizar o número de nós processados. Para estruturas profundamente aninhadas, considere múltiplas chamadas `find()` direcionadas em vez de uma única travessia profunda.

## Encontrando Elementos Dentro de Elementos

Uma vez que você tem um elemento, pode pesquisar dentro de seu escopo usando os mesmos métodos `find()` e `query()`.

!!! warning "Importante: Comportamento de Profundidade de Busca"
    Quando você chama `element.find()` ou `element.query()`, o Pydoll busca em **TODOS os descendentes** (filhos, netos, bisnetos, etc.), não apenas nos filhos diretos. Este é o comportamento padrão do `querySelector()` e corresponde ao que a maioria dos desenvolvedores espera.

### Entendendo o Escopo de Busca

```mermaid
graph TB
    Container[div id='container']
    
    Container --> Child1[div class='card' ✓]
    Container --> Child2[div class='card' ✓]
    Container --> Child3[div class='other']
    
    Child1 --> GrandChild1[div class='card' ✓]
    Child1 --> GrandChild2[p class='text']
    
    Child3 --> GrandChild3[div class='card' ✓]
    Child3 --> GrandChild4[div class='card' ✓]
```

```python
# Isso encontra TODOS os 5 elementos com class='card' na árvore
# (2 filhos diretos + 3 descendentes aninhados)
cards = await container.find(class_name="card", find_all=True)
print(len(cards))  # Saída: 5
```

### Busca Básica com Escopo

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def scoped_search():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com/products')
        
        # Encontrar um contêiner de produto
        product_card = await tab.find(class_name="product-card")
        
        # Pesquisar dentro do card de produto (busca em TODOS os descendentes, retorna apenas a primeira correspondência)
        product_title = await product_card.find(class_name="title")
        product_price = await product_card.find(class_name="price")
        add_button = await product_card.find(tag_name="button", text="Add to Cart")
        
        # Fazer query dentro do escopo
        product_image = await product_card.query("img.product-image")
        
        # Encontrar todos os itens dentro de um contêiner (TODOS os descendentes)
        nav_menu = await tab.find(class_name="nav-menu")
        menu_items = await nav_menu.find(tag_name="li", find_all=True)
        
        print(f"Menu tem {len(menu_items)} itens")

asyncio.run(scoped_search())
```

### Encontrando Apenas Filhos Diretos

Se você precisa encontrar **apenas filhos diretos** (profundidade 1), use o combinador filho `>` do CSS ou XPath:

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def direct_children_only():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com/cards')
        
        container = await tab.find(id="cards-container")
        
        # Método 1: Combinador filho CSS (>)
        # Encontra APENAS filhos diretos com class='card'
        direct_cards = await container.query("> .card", find_all=True)
        print(f"Filhos diretos: {len(direct_cards)}")
        
        # Método 2: XPath filho direto
        direct_divs = await container.query("./div[@class='card']", find_all=True)
        
        # Método 3: Usar get_children_elements() com max_depth=1
        # (mas isso filtra apenas por tag, não por outros atributos)
        direct_children = await container.get_children_elements(
            max_depth=1,
            tag_filter=["div"]
        )
        
        # Então filtre manualmente por classe
        cards_only = [
            child for child in direct_children
            if 'card' in (await child.get_attribute('class') or '')
        ]

asyncio.run(direct_children_only())
```

### Comparação: find() vs get_children_elements()

| Funcionalidade | `find()` / `query()` | `get_children_elements()` |
|---|---|---|
| **Profundidade de Busca** | TODOS os descendentes | Configurável com `max_depth` |
| **Filtrar Por** | Qualquer atributo HTML | Apenas nome da tag |
| **Caso de Uso** | Encontrar elementos específicos em qualquer lugar na subárvore | Explorar estrutura DOM, obter filhos diretos |
| **Desempenho** | Otimizado para atributo único | Bom para exploração ampla |
| **Parâmetro** | `tag_name="a"` (string) | `tag_filter=["a"]` (lista) |

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def comparison_example():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com')
        
        container = await tab.find(id="container")
        
        # Cenário 1: Eu quero TODOS os links em qualquer lugar no contêiner
        # Use find() - busca em todos os descendentes
        all_links = await container.find(tag_name="a", find_all=True)
        
        # Cenário 2: Eu quero APENAS links filhos diretos
        # Use combinador filho CSS
        direct_links = await container.query("> a", find_all=True)
        
        # Cenário 3: Eu quero filhos diretos com classe específica
        # Use combinador filho CSS
        direct_cards = await container.query("> .card", find_all=True)
        
        # Cenário 4: Eu quero explorar a estrutura DOM
        # Use get_children_elements()
        direct_children = await container.get_children_elements(max_depth=1)
        
        # Cenário 5: Eu quero todos os descendentes até a profundidade 2, filtrados por tag
        # Use get_children_elements()
        shallow_links = await container.get_children_elements(
            max_depth=2,
            tag_filter=["a"]
        )

asyncio.run(comparison_example())
```

!!! tip "Quando Usar Cada Método"
    - **Use `find()`**: Quando você sabe os atributos (classe, id, etc.) e quer pesquisar toda a subárvore
    - **Use `query("> .class")`**: Quando você precisa apenas de filhos diretos com atributos específicos
    - **Use `get_children_elements()`**: Ao explorar a estrutura DOM ou filtrar apenas por tag

### Casos de Uso Comuns

Essa busca com escopo é incrivelmente útil para trabalhar com padrões repetitivos como:

- Cards de produtos em sites de e-commerce
- Linhas de tabela com múltiplas células
- Seções de formulário com múltiplos campos
- Menus de navegação com itens aninhados

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def practical_example():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com/products')
        
        # Encontrar todos os cards de produto na página
        product_cards = await tab.find(class_name="product-card", find_all=True)
        
        for card in product_cards:
            # Dentro de cada card, buscar em TODOS os descendentes (retorna apenas a primeira correspondência)
            title = await card.find(class_name="product-title")
            price = await card.find(class_name="product-price")
            
            # Obter o botão que está em qualquer lugar dentro deste card
            buy_button = await card.find(tag_name="button", text="Buy Now")
            
            title_text = await title.text
            price_text = await price.text
            
            print(f"Produto: {title_text}, Preço: {price_text}")
            
            # Clicar no botão de compra
            await buy_button.click()

asyncio.run(practical_example())
```


## Suporte a Shadow DOM

Muitas aplicações web modernas utilizam [Shadow DOM](https://developer.mozilla.org/pt-BR/docs/Web/API/Web_components/Using_shadow_DOM) para encapsular os internos de componentes. O Pydoll fornece acesso transparente a elementos dentro de árvores shadow através da classe `ShadowRoot`.

### Como o Shadow DOM Funciona

```mermaid
graph TB
    Host["div#my-component (shadow host)"]
    SR["ShadowRoot (open)"]
    Internal1["button.internal-btn"]
    Internal2["input.internal-input"]

    Host --> SR
    SR --> Internal1
    SR --> Internal2
```

Elementos dentro de um shadow root são ocultos de consultas DOM regulares. Você precisa primeiro acessar o shadow root e então buscar dentro dele.

### Acessando Shadow Roots

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def shadow_dom_example():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com/web-components')

        # Encontrar o elemento shadow host
        shadow_host = await tab.find(id='my-component')

        # Acessar seu shadow root
        shadow_root = await shadow_host.get_shadow_root()

        # Encontrar elementos dentro do shadow root usando query() com seletores CSS
        button = await shadow_root.query('.internal-btn')
        await button.click()

        input_field = await shadow_root.query('input[type="email"]')
        await input_field.type_text('user@example.com')

asyncio.run(shadow_dom_example())
```

### query() com Seletores CSS

`ShadowRoot` herda de `FindElementsMixin` com a restrição `_css_only`, o que significa que apenas `query()` com seletores CSS é suportado. O método `find()` e `query()` com XPath lançam `NotImplementedError`:

```python
# query() com seletores CSS — abordagem recomendada
element = await shadow_root.query('#inner-id')
element = await shadow_root.query('button.primary')
element = await shadow_root.query('div.container > .content')

# find_all para múltiplos elementos
items = await shadow_root.query('.item', find_all=True)

# Espera com timeout
element = await shadow_root.query('#dynamic', timeout=5)
```

!!! warning "find() e XPath não são suportados em ShadowRoot"
    Chamar `shadow_root.find()` ou `shadow_root.query('//xpath')` lançará `NotImplementedError`. Sempre use `query()` com seletores CSS ao trabalhar com shadow roots.

### Shadow Roots Aninhados

Web components podem conter outros web components com seus próprios shadow roots:

```python
async def nested_shadow():
    outer_host = await tab.find(tag_name='outer-component')
    outer_shadow = await outer_host.get_shadow_root()

    inner_host = await outer_shadow.query('inner-component')
    inner_shadow = await inner_host.get_shadow_root()

    deep_button = await inner_shadow.query('.deep-btn')
    await deep_button.click()
```

### Buscando Shadow Roots: find_shadow_roots()

Quando você precisa explorar quais shadow roots existem na página (útil para depuração ou páginas dinâmicas como desafios Cloudflare), use `find_shadow_roots()`:

```python
# Buscar todos os shadow roots na página
shadow_roots = await tab.find_shadow_roots()

for sr in shadow_roots:
    print(f'Modo: {sr.mode}, Host: {sr.host_element}')
    # Buscar dentro de cada shadow root
    btn = await sr.query('button', raise_exc=False)
    if btn:
        await btn.click()
```

#### Esperando Shadow Roots: `timeout`

Shadow hosts são frequentemente injetados de forma assíncrona (ex: Cloudflare Turnstile carregando dentro de um OOPIF). Use `timeout` para fazer polling até que os shadow roots apareçam:

```python
# Esperar até 10 segundos pelos shadow roots
shadow_roots = await tab.find_shadow_roots(timeout=10)
```

O método `get_shadow_root()` em elementos também suporta `timeout`:

```python
# Esperar pelo shadow root de um elemento
host = await tab.find(id='my-component', timeout=5)
shadow = await host.get_shadow_root(timeout=5)
```

#### Travessia Profunda: IFrames Cross-Origin (OOPIFs)

Por padrão, `find_shadow_roots()` percorre apenas a árvore DOM do documento principal (que inclui iframes same-origin via `contentDocument`, mas **não** iframes cross-origin). Passe `deep=True` para também descobrir shadow roots dentro de iframes cross-origin (OOPIFs):

```python
# Incluir shadow roots de iframes cross-origin (ex: Cloudflare Turnstile)
shadow_roots = await tab.find_shadow_roots(deep=True, timeout=10)

for sr in shadow_roots:
    print(f'Modo: {sr.mode}, Host: {sr.host_element}')
    # Elementos encontrados dentro desses shadow roots roteiam
    # automaticamente comandos CDP pela sessão OOPIF correta
    btn = await sr.query('input[type="checkbox"]', raise_exc=False)
    if btn:
        await btn.click()
```

!!! tip "Quando usar `deep=True`"
    Use `deep=True` ao automatizar páginas com widgets embutidos cross-origin, como captchas Cloudflare Turnstile, formulários de pagamento de terceiros ou botões de login social. Esses widgets tipicamente usam iframes cross-origin com shadow roots fechados dentro deles.

### Propriedades do Shadow Root

```python
shadow_root = await element.get_shadow_root()

# Verificar o modo do shadow root (open, closed ou user-agent)
print(shadow_root.mode)  # ShadowRootType.OPEN

# Acessar o elemento host
host = shadow_root.host_element

# Obter o HTML interno do shadow root
html = await shadow_root.inner_html
```

!!! note "Shadow Roots Fechados"
    Shadow roots fechados (`mode='closed'`) são acessíveis via CDP pois o protocolo ignora as restrições do JavaScript. Porém, alguns shadow roots internos do navegador (user-agent) podem ter acessibilidade limitada.

## Trabalhando com iFrames

!!! info "Guia Completo de IFrame Disponível"
    Esta seção cobre a interação básica com iframe para localização de elementos. Para um guia completo incluindo iframes aninhados, manejo de CAPTCHA, análise técnica profunda e solução de problemas, veja **[Trabalhando com IFrames](automation/iframes.md)**.

iFrames apresentam um desafio especial na automação de navegador porque eles têm contextos DOM separados. O Pydoll torna a interação com iframe transparente:

```mermaid
flowchart TB
    Principal[tab]
    IFrame["WebElement do iframe"]
    Conteudo["elementos dentro do iframe"]

    Principal -->|"find('iframe')"| IFrame
    IFrame -->|"find('button#submit')"| Conteudo
```

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def iframe_interacao():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com/pagina-com-iframe')

        iframe = await tab.query("iframe.conteudo", timeout=10)

        # Os utilitários de WebElement já executam dentro do iframe
        iframe_button = await iframe.find(tag_name="button", class_name="submit")
        await iframe_button.click()

        iframe_input = await iframe.find(id="captcha-input")
        await iframe_input.type_text("codigo-de-verificacao")

        # Iframe aninhado? Continue encadeando
        inner_iframe = await iframe.find(tag_name="iframe")
        download_link = await inner_iframe.find(text="Baixar PDF")
        await download_link.click()

asyncio.run(iframe_interacao())
```

!!! note "Screenshots em iframes"
    `tab.take_screenshot()` funciona apenas no alvo principal. Para capturar o conteúdo de um iframe, selecione um elemento dentro dele e chame `element.take_screenshot()`.

## Estratégias de Tratamento de Erros

Automação robusta requer o tratamento de casos onde elementos não existem ou demoram mais para aparecer do que o esperado.

### Fluxo de Localização de Elemento com Tratamento de Erros

```mermaid
flowchart TB
    Start[Iniciar Localizacao de Elemento] --> Immediate[Tentar Localizacao Imediata]
    
    Immediate --> Found1{Elemento Encontrado?}
    Found1 -->|Sim| Return1[Retornar WebElement]
    Found1 -->|Nao & timeout=0| Check1{raise_exc=True?}
    Found1 -->|Nao & timeout>0| Wait[Iniciar Loop de Espera]
    
    Check1 -->|Sim| Error1[Lancar ElementNotFound]
    Check1 -->|Nao| ReturnNone[Retornar None]
    
    Wait --> Sleep[Esperar 0.5 segundos]
    Sleep --> TryAgain[Tentar Localizar Novamente]
    TryAgain --> Found2{Elemento Encontrado?}
    
    Found2 -->|Sim| Return2[Retornar WebElement]
    Found2 -->|Nao| TimeCheck{Timeout Excedido?}
    
    TimeCheck -->|Nao| Sleep
    TimeCheck -->|Sim| Check2{raise_exc=True?}
    
    Check2 -->|Sim| Error2[Lancar WaitElementTimeout]
    Check2 -->|Nao| ReturnNone2[Retornar None]
```

### Usando o Parâmetro raise_exc

Controle se uma exceção deve ser lançada quando elementos não são encontrados:

```python
import asyncio
from pydoll.browser.chromium import Chrome
from pydoll.exceptions import ElementNotFound

async def error_handling():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com')
        
        # Lançar exceção se não encontrado (comportamento padrão)
        try:
            critical_element = await tab.find(id="must-exist")
        except ElementNotFound:
            print("Elemento crítico ausente! Não é possível continuar.")
            return
        
        # Retornar None se não encontrado (elementos opcionais)
        optional_banner = await tab.find(
            class_name="promo-banner",
            raise_exc=False
        )
        
        if optional_banner:
            print("Banner encontrado, fechando-o")
            close_button = await optional_banner.find(class_name="close-btn")
            await close_button.click()
        else:
            print("Nenhum banner presente, continuando")

asyncio.run(error_handling())
```

## Melhores Práticas

### 1. Prefira Seletores Estáveis

Use atributos que têm baixa probabilidade de mudar:

```python
# Bom: Atributos semânticos
await tab.find(id="user-profile")  # IDs geralmente são estáveis
await tab.find(data_testid="submit-button")  # IDs de teste são feitos para automação
await tab.find(name="username")  # Nomes de formulário são estáveis

# Evite: Dependências estruturais
await tab.query("div > div > div:nth-child(3) > input")  # Frágil, quebra facilmente
await tab.query("body > div:nth-child(2) > form > div:first-child")
```

### 2. Use o Seletor Mais Simples que Funciona

Comece simples e adicione complexidade apenas quando necessário:

```python
# Bom: Simples e claro
await tab.find(id="login-form")

# Desnecessário: Complicado demais
await tab.query("//div[@id='content']/descendant::form[@id='login-form']")
```

### 3. Escolha o Método Certo

- Use `find()` para buscas simples baseadas em atributos
- Use `query()` para padrões CSS ou XPath complexos
- Use métodos de travessia para explorar a partir de âncoras conhecidas

```python
# Use find() para casos diretos
username = await tab.find(id="username")

# Use query() para padrões complexos
active_nav_link = await tab.query("nav.menu a.active")

# Use travessia para buscas baseadas em relacionamento
container = await tab.find(id="cards")
child_links = await container.get_children_elements(tag_filter=["a"])
```

### 4. Adicione Timeouts Significativos

Não use timeouts zero para conteúdo dinâmico, e não espere para sempre por elementos opcionais:

```python
# Bom: Timeouts razoáveis
critical_data = await tab.find(id="data", timeout=10)
optional_popup = await tab.find(class_name="popup", timeout=2, raise_exc=False)

# Ruim: Sem timeout para conteúdo dinâmico
dynamic_element = await tab.find(class_name="ajax-loaded")  # Falhará imediatamente

# Ruim: Timeout muito longo para elemento opcional
banner = await tab.find(class_name="ad-banner", timeout=60)  # Desperdício de tempo
```

### 5. Trate Erros Graciosamente

Planeje para elementos que podem não existir:

```python
# Elementos críticos: deixe as exceções subirem
submit_button = await tab.find(id="submit-btn")

# Elementos opcionais: trate explicitamente
cookie_notice = await tab.find(class_name="cookie-notice", raise_exc=False)
if cookie_notice:
    accept_button = await cookie_notice.find(text="Accept")
    await accept_button.click()
```

## Exemplo Completo: Automação de Formulário

Aqui está um exemplo completo combinando múltiplas técnicas de localização de elementos:

```python
import asyncio
from pydoll.browser.chromium import Chrome
from pydoll.exceptions import ElementNotFound

async def automate_registration_form():
    async with Chrome() as browser:
        tab = await browser.start()
        
        try:
            # Navegar para a página de registro
            await tab.go_to('https://example.com/register', timeout=10)
            
            # Lidar com banner de cookie opcional
            cookie_banner = await tab.find(
                class_name="cookie-banner",
                timeout=2,
                raise_exc=False
            )
            if cookie_banner:
                accept = await cookie_banner.find(text="Accept")
                await accept.click()
                await asyncio.sleep(1)
            
            # Preencher o formulário de registro
            # Encontrar campos do formulário
            username_field = await tab.find(name="username", timeout=5)
            email_field = await tab.find(name="email")
            password_field = await tab.find(type="password", name="password")
            confirm_password = await tab.find(type="password", name="confirm_password")
            
            # Inserir informações
            await username_field.type_text("john_doe_2024", interval=0.1)
            await email_field.type_text("john@example.com", interval=0.1)
            await password_field.type_text("SecurePass123!", interval=0.1)
            await confirm_password.type_text("SecurePass123!", interval=0.1)
            
            # Encontrar e marcar checkbox de termos
            # Tentar múltiplas estratégias
            terms_checkbox = await tab.find(id="terms", raise_exc=False)
            if not terms_checkbox:
                terms_checkbox = await tab.find(name="accept_terms", raise_exc=False)
            if not terms_checkbox:
                terms_checkbox = await tab.query("input[type='checkbox']")
            
            await terms_checkbox.click()
            
            # Encontrar e clicar no botão de envio
            submit_button = await tab.find(
                tag_name="button",
                type="submit",
                timeout=2
            )
            await submit_button.click()
            
            # Esperar por mensagem de sucesso com timeout maior (processamento do formulário)
            success_message = await tab.find(
                class_name="success-message",
                timeout=15
            )
            
            message_text = await success_message.text
            print(f"Registro bem-sucedido: {message_text}")
            
            # Verificar redirecionamento para o dashboard
            await asyncio.sleep(2)
            current_url = await tab.current_url
            
            if "dashboard" in current_url:
                print("Redirecionado com sucesso para o dashboard")
                
                # Encontrar mensagem de boas-vindas
                welcome = await tab.find(class_name="welcome-message", timeout=5)
                welcome_text = await welcome.text
                print(f"Mensagem de boas-vindas: {welcome_text}")
            else:
                print(f"URL inesperada após registro: {current_url}")
                
        except ElementNotFound as e:
            print(f"Elemento não encontrado: {e}")
            # Tirar screenshot para depuração
            await tab.take_screenshot("error_screenshot.png")
        except Exception as e:
            print(f"Erro inesperado: {e}")
            await tab.take_screenshot("unexpected_error.png")

asyncio.run(automate_registration_form())
```

## Aprenda Mais

Quer mergulhar mais fundo na localização de elementos?

- **[Análise aprofundada em FindElements Mixin](../deep-dive/find-elements-mixin.md)**: Aprenda sobre a arquitetura, estratégias internas de seletores e otimizações de desempenho
- **[Guia de Seletores](../deep-dive/selectors-guide.md)**: Guia completo de seletores CSS e XPath com referências de sintaxe e exemplos do mundo real
- **[Domínio WebElement](../deep-dive/webelement-domain.md)**: Entenda o que você pode fazer com os elementos depois de encontrá-los

A localização de elementos é a base para uma automação de navegador bem-sucedida. Domine essas técnicas, e você será capaz de localizar confiavelmente qualquer elemento em qualquer página web, não importa quão complexa seja a estrutura.

================================================
FILE: docs/pt/features/index.md
================================================
# Guia de Funcionalidades

Bem-vindo à documentação abrangente de funcionalidades do Pydoll! Aqui você descobrirá tudo o que torna o Pydoll uma ferramenta de automação de navegador poderosa e flexível. Esteja você apenas começando ou procurando aproveitar capacidades avançadas, você encontrará guias detalhados, exemplos práticos e melhores práticas para cada funcionalidade.

## O Que Você Encontrará Aqui

Este guia está organizado em seções lógicas que refletem sua jornada na automação: de conceitos básicos a técnicas avançadas. Cada página é projetada para ser autocontida, para que você possa pular diretamente para o que lhe interessa ou seguir sequencialmente.

## Conceitos Principais

Antes de mergulhar em funcionalidades específicas, vale a pena entender o que diferencia o Pydoll. Esses conceitos fundamentais informam como toda a biblioteca funciona.

**[Conceitos Principais](core-concepts.md)**: Descubra as decisões arquitetônicas que tornam o Pydoll diferente: a abordagem "zero-webdriver" que elimina dores de cabeça de compatibilidade, o design "async-first" que permite operações concorrentes verdadeiras, e o suporte nativo para múltiplos navegadores baseados em Chromium.

## Localização e Interação com Elementos

Encontrar e interagir com elementos da página é o arroz com feijão da automação. O Pydoll torna isso surpreendentemente intuitivo com APIs modernas que simplesmente fazem sentido.

**[Localização de Elementos](element-finding.md)**: Domine as estratégias de localização de elementos do Pydoll, desde o intuitivo método `find()` que usa atributos HTML naturais, até o poderoso método `query()` para seletores CSS e XPath. Você também aprenderá sobre auxiliares de travessia do DOM que permitem navegar pela estrutura da página eficientemente.

## Capacidades de Automação

Estas são as funcionalidades que dão vida à sua automação: simular interações do usuário, controle de teclado, lidar com operações de arquivo, trabalhar com iframes e capturar conteúdo visual.

**[Interações Semelhantes a Humanas](automation/human-interactions.md)**: Aprenda como criar interações que parecem genuinamente humanas: digitar com variações naturais de tempo, clicar com movimentos realistas do mouse e usar atalhos de teclado exatamente como um usuário real faria. Isso é crucial para evitar detecção em sites sensíveis à automação.

**[Controle de Teclado](automation/keyboard-control.md)**: Domine as interações de teclado com suporte abrangente para combinações de teclas, modificadores e teclas especiais. Essencial para formulários, atalhos e testes de acessibilidade.

**[Operações com Arquivos](automation/file-operations.md)**: O manuseio de arquivos pode ser complicado na automação de navegador. O Pydoll fornece soluções robustas tanto para uploads quanto para downloads, com o gerenciador de contexto `expect_download` oferecendo um manuseio elegante da conclusão assíncrona de downloads.

**[Interação com IFrames](automation/iframes.md)**: Trate iframes como qualquer elemento—encontre o iframe e continue pesquisando a partir dele. Sem targets extras, sem abas adicionais.

**[Capturas de Tela e PDF](automation/screenshots-and-pdfs.md)**: Capture conteúdo visual de suas sessões de automação. Se você precisa de capturas de tela de página inteira para testes de regressão visual, capturas de elementos específicos para depuração, ou exportações de PDF para arquivamento, o Pydoll tem o que você precisa.

## Funcionalidades de Rede

As capacidades de rede do Pydoll são onde ele realmente brilha, dando a você visibilidade e controle sem precedentes sobre o tráfego HTTP.

**[Monitoramento de Rede](network/monitoring.md)**: Observe e analise toda a atividade de rede em sua sessão de navegador. Extraia respostas de API, rastreie o tempo de requisição, identifique requisições falhas e entenda exatamente quais dados estão sendo trocados. Essencial para depuração, testes e extração de dados.

**[Interceptação de Requisições](network/interception.md)**: Vá além da observação para modificar ativamente o comportamento da rede. Bloqueie recursos indesejados, injete cabeçalhos personalizados, modifique payloads de requisição, ou até mesmo atenda requisições com dados mockados. Isso é poderoso para testes, otimização e controle de privacidade.

**[Requisições HTTP no Contexto do Navegador](network/http-requests.md)**: Faça requisições HTTP que executam dentro do contexto JavaScript do navegador, herdando automaticamente estado de sessão, cookies e autenticação. Esta abordagem híbrida combina a familiaridade da biblioteca `requests` do Python com os benefícios da execução no contexto do navegador.

## Gerenciamento do Navegador

O gerenciamento eficaz do navegador e das abas é essencial para cenários complexos de automação, processamento paralelo e testes multiusuário.

**[Gerenciamento de Múltiplas Abas](browser-management/tabs.md)**: Trabalhe com múltiplas abas do navegador simultaneamente, garantindo o uso eficiente de recursos enquanto lhe dá controle total sobre o ciclo de vida das abas, detecção de abas abertas pelo usuário e operações de scraping concorrentes.

**[Contextos do Navegador](browser-management/contexts.md)**: Crie ambientes de navegação completamente isolados dentro de um único processo de navegador. Cada contexto mantém cookies, armazenamento, cache e permissões separados: perfeito para testes de múltiplas contas, testes A/B, ou scraping paralelo com diferentes configurações.


**[Cookies e Sessões](browser-management/cookies-sessions.md)**: Gerencie o estado da sessão tanto no nível do navegador quanto no da aba. Defina cookies programaticamente, extraia dados de sessão e mantenha diferentes sessões entre contextos de navegador para cenários de testes sofisticados.


## Configuração

Personalize cada aspecto do comportamento do navegador para corresponder às suas necessidades de automação, desde preferências de baixo nível do Chromium até argumentos de linha de comando e estratégias de carregamento de página.

**[Opções do Navegador](configuration/browser-options.md)**: Configure os parâmetros de inicialização do Chromium, argumentos de linha de comando e controle do estado de carregamento da página. Faça o ajuste fino do comportamento do navegador, ative recursos experimentais e otimize o desempenho para suas necessidades de automação.

**[Preferências do Navegador](configuration/browser-preferences.md)**: O acesso direto ao sistema interno de preferências do Chromium lhe dá controle sobre centenas de configurações. Configure downloads, desative funcionalidades, otimize o desempenho ou crie fingerprints de navegador realistas para automação furtiva.

**[Configuração de Proxy](configuration/proxy.md)**: Suporte nativo a proxy com capacidades completas de autenticação. Essencial para projetos de web scraping que exigem rotação de IP, testes geo-direcionados ou automação focada em privacidade.


## Funcionalidades Avançadas

Estas capacidades sofisticadas abordam desafios complexos de automação e casos de uso especializados.

**[Contorno de Captcha Comportamental](advanced/behavioral-captcha-bypass.md)**: O manejo nativo de captcha comportamental do Pydoll é uma de suas funcionalidades mais solicitadas. Aprenda como interagir com Cloudflare Turnstile, reCAPTCHA v3 e desafios invisíveis hCaptcha usando duas abordagens - gerenciador de contexto síncrono para conclusão garantida, e processamento em segundo plano para operação não bloqueante.

**[Sistema de Eventos](advanced/event-system.md)**: Construa automação reativa que responde a eventos do navegador em tempo real. Monitore carregamentos de página, atividade de rede, mudanças no DOM e execução de JavaScript para criar scripts de automação inteligentes e adaptativos.

**[Conexões Remotas](advanced/remote-connections.md)**: Conecte-se a navegadores já em execução via WebSocket para cenários de automação híbrida. Perfeito para pipelines de CI/CD, ambientes conteinerizados, ou integração do Pydoll em ferramentas CDP existentes.


## Como Usar Este Guia

Cada página de funcionalidade segue uma estrutura consistente:

1.  **Visão Geral** - O que a funcionalidade faz e por que ela é importante
2.  **Uso Básico** - Comece rapidamente com exemplos simples
3.  **Padrões Avançados** - Aproveite todo o potencial da funcionalidade
4.  **Melhores Práticas** - Dicas para uso eficaz e eficiente
5.  **Armadilhas Comuns** - Aprenda com os erros comuns

Sinta-se à vontade para explorar as funcionalidades em qualquer ordem com base em suas necessidades. Os exemplos de código são completos e estão prontos para rodar - apenas copie, cole e adapte ao seu caso de uso.

Pronto para mergulhar fundo nas capacidades do Pydoll? Escolha uma funcionalidade que lhe interessa e comece a explorar! 🚀

================================================
FILE: docs/pt/features/network/http-requests.md
================================================
# Requisições HTTP no Contexto do Navegador

Faça requisições HTTP que herdam automaticamente o estado de sessão, cookies e autenticação do seu navegador. Perfeito para automação híbrida, combinando navegação de UI com a eficiência de APIs.

!!! tip "Uma Revolução para Automação Híbrida"
    Já desejou poder fazer requisições HTTP que automaticamente obtêm todos os cookies e autenticação do seu navegador? Agora você pode! A propriedade `tab.request` oferece uma bela interface semelhante ao `requests` que executa chamadas HTTP **diretamente no contexto JavaScript do navegador**.

## Por que Usar Requisições no Contexto do Navegador?

A automação tradicional frequentemente exige que você extraia cookies e cabeçalhos manualmente para fazer chamadas de API. As requisições no contexto do navegador eliminam esse incômodo:

| Abordagem Tradicional | Requisições no Contexto do Navegador |
|---|---|
| Extrair cookies manualmente | Cookies herdados automaticamente |
| Gerenciar tokens de sessão | Estado da sessão preservado |
| Lidar com CORS separadamente | Políticas CORS respeitadas |
| Lidar com dois clientes HTTP | Uma interface unificada |
| Sincronizar estado de autenticação | Sempre autenticado |

**Perfeito para:**

- Raspar APIs autenticadas após login via UI
- Fluxos de trabalho híbridos misturando interação de navegador e chamadas de API
- Testar endpoints autenticados sem gerenciamento de token
- Contornar fluxos complexos de autenticação
- Trabalhar com aplicações de página única (SPAs)

## Guia Rápido

O exemplo mais simples: fazer login via UI e, em seguida, fazer chamadas de API autenticadas:

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def hybrid_automation():
    async with Chrome() as browser:
        tab = await browser.start()
        
        # 1. Faça login normalmente através da UI
        await tab.go_to('https://example.com/login')
        await (await tab.find(id='username')).type_text('user@example.com')
        await (await tab.find(id='password')).type_text('password123')
        await (await tab.find(id='login-btn')).click()
        
        # Aguarde o redirecionamento após o login
        await asyncio.sleep(2)
        
        # 2. Agora faça chamadas de API com a sessão autenticada!
        response = await tab.request.get('https://example.com/api/user/profile')
        user_data = response.json()
        
        print(f"Logado como: {user_data['name']}")
        print(f"Email: {user_data['email']}")

asyncio.run(hybrid_automation())
```

!!! success "Nenhum Gerenciamento de Cookie Necessário"
    Percebeu como não extraímos ou passamos nenhum cookie? A requisição herdou automaticamente a sessão autenticada do navegador!

## Casos de Uso Comuns

### 1. Raspagem de APIs Autenticadas

Use a UI para fazer login e, em seguida, dispare requisições às APIs para extração de dados:

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def scrape_user_data():
    async with Chrome() as browser:
        tab = await browser.start()
        
        # Login via UI (lida com fluxos de autenticação complexos)
        await tab.go_to('https://app.example.com/login')
        await (await tab.find(id='email')).type_text('user@example.com')
        await (await tab.find(id='password')).type_text('password')
        await (await tab.find(type='submit')).click()
        await asyncio.sleep(2)
        
        # Agora extraia dados via API (muito mais rápido que raspar UI)
        all_users = []
        for page in range(1, 6):
            response = await tab.request.get(
                'https://app.example.com/api/users',
                params={'page': str(page), 'limit': '100'}
            )
            users = response.json()['users']
            all_users.extend(users)
            print(f"Página {page}: buscou {len(users)} usuários")
        
        print(f"Total de usuários raspados: {len(all_users)}")

asyncio.run(scrape_user_data())
```

### 2. Testando Endpoints Protegidos

Teste endpoints de API sem gerenciar tokens de autenticação:

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def test_api_endpoints():
    async with Chrome() as browser:
        tab = await browser.start()
        
        # Autentique uma vez
        await tab.go_to('https://api.example.com/login')
        # ... realize o login ...
        await asyncio.sleep(2)
        
        # Teste múltiplos endpoints
        endpoints = [
            '/api/users/me',
            '/api/settings',
            '/api/notifications',
            '/api/dashboard/stats'
        ]
        
        for endpoint in endpoints:
            response = await tab.request.get(f'https://api.example.com{endpoint}')
            
            if response.ok:
                print(f"Sucesso {endpoint}: {response.status_code}")
            else:
                print(f"Falha {endpoint}: {response.status_code}")
                print(f"   Erro: {response.text[:100]}")

asyncio.run(test_api_endpoints())
```

### 3. Enviando Formulários via API

Preencha formulários mais rapidamente postando diretamente para a API:

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def bulk_form_submission():
    async with Chrome() as browser:
        tab = await browser.start()
        
        # Faça login primeiro
        await tab.go_to('https://crm.example.com/login')
        # ... lógica de login ...
        await asyncio.sleep(2)
        
        # Envie múltiplas entradas via API (muito mais rápido que preencher formulários)
        contacts = [
            {'name': 'John Doe', 'email': 'john@example.com', 'company': 'Acme Inc'},
            {'name': 'Jane Smith', 'email': 'jane@example.com', 'company': 'Tech Corp'},
            {'name': 'Bob Wilson', 'email': 'bob@example.com', 'company': 'StartupXYZ'},
        ]
        
        for contact in contacts:
            response = await tab.request.post(
                'https://crm.example.com/api/contacts',
                json=contact
            )
            
            if response.ok:
                print(f"Adicionado: {contact['name']}")
            else:
                print(f"Falha: {contact['name']} - {response.status_code}")

asyncio.run(bulk_form_submission())
```

### 4. Baixando Arquivos com Sessão

Baixe arquivos que exigem autenticação:

```python
import asyncio
from pathlib import Path
from pydoll.browser.chromium import Chrome

async def download_authenticated_file():
    async with Chrome() as browser:
        tab = await browser.start()
        
        # Autentique
        await tab.go_to('https://portal.example.com/login')
        # ... lógica de login ...
        await asyncio.sleep(2)
        
        # Baixe o arquivo que requer autenticação
        response = await tab.request.get(
            'https://portal.example.com/api/reports/monthly.pdf'
        )
        
        if response.ok:
            # Salve o arquivo
            output_path = Path('/tmp/monthly_report.pdf')
            output_path.write_bytes(response.content)
            print(f"Baixado: {output_path} ({len(response.content)} bytes)")
        else:
            print(f"Download falhou: {response.status_code}")

asyncio.run(download_authenticated_file())
```

### 5. Trabalhando com Cabeçalhos Personalizados

Adicione cabeçalhos personalizados às suas requisições:

```python
import asyncio
from pydoll.browser.chromium import Chrome
from pydoll.protocol.fetch.types import HeaderEntry

async def custom_headers_example():
    async with Chrome() as browser:
        tab = await browser.start()
        
        # Faça login primeiro
        await tab.go_to('https://api.example.com/login')
        # ... lógica de login ...
        
        # Faça requisição com cabeçalhos personalizados
        headers: list[HeaderEntry] = [
            {'name': 'X-API-Version', 'value': '2.0'},
            {'name': 'X-Request-ID', 'value': 'unique-id-123'},
            {'name': 'Accept-Language', 'value': 'pt-BR,pt;q=0.9'},
        ]
        
        response = await tab.request.get(
            'https://api.example.com/data',
            headers=headers
        )
        
        print(f"Status: {response.status_code}")
        print(f"Data: {response.json()}")

asyncio.run(custom_headers_example())
```

### 6. Lidando com Diferentes Tipos de Resposta

Acesse dados de resposta em múltiplos formatos:

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def response_formats():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://api.example.com')
        
        # Resposta JSON
        json_response = await tab.request.get('/api/users/1')
        user = json_response.json()
        print(f"JSON: {user}")
        
        # Resposta de texto
        text_response = await tab.request.get('/api/status')
        status_text = text_response.text
        print(f"Texto: {status_text}")
        
        # Resposta binária (ex: imagem)
        image_response = await tab.request.get('/api/avatar/1')
        image_bytes = image_response.content
        print(f"Binário: {len(image_bytes)} bytes")
        
        # Verificar status da resposta
        if json_response.ok:
            print("Requisição bem-sucedida!")
        
        # Acessar URL da resposta (útil após redirecionamentos)
        print(f"URL Final: {json_response.url}")

asyncio.run(response_formats())
```

## Métodos HTTP

Todos os métodos HTTP padrão são suportados:

### GET - Recuperar Dados

```python
# GET simples
response = await tab.request.get('https://api.example.com/users')

# GET com parâmetros de consulta
response = await tab.request.get(
    'https://api.example.com/search',
    params={'q': 'python', 'limit': '10'}
)
```

### POST - Criar Recursos

```python
# POST com dados JSON
response = await tab.request.post(
    'https://api.example.com/users',
    json={'name': 'John Doe', 'email': 'john@example.com'}
)

# POST com dados de formulário
response = await tab.request.post(
    'https://api.example.com/login',
    data={'username': 'john', 'password': 'secret'}
)
```

### PUT - Atualizar Recursos

```python
# Atualizar recurso inteiro
response = await tab.request.put(
    'https://api.example.com/users/123',
    json={'name': 'Jane Doe', 'email': 'jane@example.com', 'role': 'admin'}
)
```

### PATCH - Atualizações Parciais

```python
# Atualizar campos específicos
response = await tab.request.patch(
    'https://api.example.com/users/123',
    json={'email': 'newemail@example.com'}
)
```

### DELETE - Remover Recursos

```python
# Deletar um recurso
response = await tab.request.delete('https://api.example.com/users/123')
```

### HEAD - Obter Apenas Cabeçalhos

```python
# Verificar se o recurso existe sem baixá-lo
response = await tab.request.head('https://example.com/large-file.zip')
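content_length = next(
    (h['value'] for h in response.headers if h['name'].lower() == 'content-length'),
    None,
)
print(f"Content-Length: {content_length}")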
```

### OPTIONS - Verificar Capacidades

```python
# Verificar métodos permitidos
response = await tab.request.options('https://api.example.com/users')
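allowed_methods = next(
    (h['value'] for h in response.headers if h['name'].lower() == 'allow'),
    None,
)
print(f"Métodos permitidos: {allowed_methods}")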
```

!!! info "Como Isso Funciona?"
    Requisições no contexto do navegador executam chamadas HTTP diretamente no contexto JavaScript do navegador usando a API Fetch, enquanto monitoram eventos de rede CDP para capturar metadados abrangentes (cabeçalhos, cookies, tempo).
    
    Para uma explicação detalhada da arquitetura interna, monitoramento de eventos e detalhes de implementação, veja a [Arquitetura de Requisições do Navegador](../../deep-dive/browser-requests-architecture.md).

## Objeto Response

O objeto `Response` fornece uma interface familiar semelhante ao `requests.Response`:

```python
response = await tab.request.get('https://api.example.com/users')

# Código de status
print(response.status_code)  # 200, 404, 500, etc.

# Verificar se foi bem-sucedido (2xx ou 3xx)
if response.ok:
    print("Sucesso!")

# Corpo da resposta
text_data = response.text      # Como string
byte_data = response.content   # Como bytes
json_data = response.json()    # JSON parseado

# Cabeçalhos
for header in response.headers:
    print(f"{header['name']}: {header['value']}")

# Cabeçalhos da requisição (o que foi realmente enviado)
for header in response.request_headers:
    print(f"{header['name']}: {header['value']}")

# Cookies definidos pela resposta
for cookie in response.cookies:
    print(f"{cookie['name']} = {cookie['value']}")

# URL final (após redirecionamentos)
print(response.url)

# Lançar exceção para códigos de status de erro
response.raise_for_status()  # Lança HTTPError se for 4xx ou 5xx
```

!!! note "Redirecionamentos e Rastreamento de URL"
    A propriedade `response.url` contém apenas a **URL final** após todos os redirecionamentos. Se você precisar rastrear a cadeia completa de redirecionamento (URLs intermediárias, códigos de status, tempo), use o [Monitoramento de Rede](monitoring.md) para observar todas as requisições em detalhes.

## Cabeçalhos e Cookies

### Trabalhando com Cabeçalhos

Cabeçalhos são representados como objetos `HeaderEntry`:

```python
import asyncio
from pydoll.browser.chromium import Chrome
from pydoll.protocol.fetch.types import HeaderEntry

async def header_example():
    async with Chrome() as browser:
        tab = await browser.start()
        
        # Usando o tipo HeaderEntry para autocompletar da IDE e verificação de tipo
        headers: list[HeaderEntry] = [
            {'name': 'Authorization', 'value': 'Bearer token-123'},
            {'name': 'X-Custom-Header', 'value': 'custom-value'},
        ]
        
        response = await tab.request.get(
            'https://api.example.com/protected',
            headers=headers
        )
        
        # Inspecionar cabeçalhos de resposta (também são dicts tipados HeaderEntry)
        for header in response.headers:
            if header['name'] == 'Content-Type':
                print(f"Content-Type: {header['value']}")

asyncio.run(header_example())
```

!!! tip "Dicas de Tipo para Cabeçalhos"
    `HeaderEntry` é um `TypedDict` de `pydoll.protocol.fetch.types`. Usá-lo como uma dica de tipo oferece a você:
    
    - **Autocompletar**: IDE sugere chaves `name` e `value`
    - **Segurança de tipo**: Pega erros de digitação e chaves faltantes antes de rodar
    - **Documentação**: Estrutura clara para cabeçalhos
    
    Embora você possa passar dicionários simples, usar a dica de tipo melhora a qualidade do código e o suporte da IDE.

!!! tip "Comportamento de Cabeçalhos Personalizados"
    Cabeçalhos personalizados são enviados **juntamente com** os cabeçalhos automáticos do navegador (como `User-Agent`, `Accept`, `Referer`, etc.). 
    
    Se você tentar definir um cabeçalho padrão do navegador (ex: `User-Agent`), o comportamento depende do cabeçalho específico; alguns podem ser sobrescritos, outros ignorados, e alguns podem causar conflitos. Para a maioria dos casos de uso, atenha-se a cabeçalhos personalizados (ex: `X-API-Key`, `Authorization`) para evitar comportamentos inesperados.

### Entendendo Cookies

Cookies são gerenciados automaticamente pelo navegador:

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def cookie_example():
    async with Chrome() as browser:
        tab = await browser.start()
        
        # Primeira requisição define cookies
        login_response = await tab.request.post(
            'https://api.example.com/login',
            json={'username': 'user', 'password': 'pass'}
        )
        
        # Verificar cookies definidos pelo servidor
        print("Cookies definidos pelo servidor:")
        for cookie in login_response.cookies:
            print(f"  {cookie['name']} = {cookie['value']}")
        
        # Requisições subsequentes incluem cookies automaticamente
        profile_response = await tab.request.get(
            'https://api.example.com/profile'
        )
        # Não é preciso passar cookies - o navegador cuida disso!
        
        print(f"Dados do perfil: {profile_response.json()}")

asyncio.run(cookie_example())
```

## Comparação com Requisições Tradicionais

| Funcionalidade | Biblioteca `requests` | Requisições no Contexto do Navegador |
|---|---|---|
| **Gerenciamento de Sessão** | Manual (cookies) | Automático via navegador |
| **Autenticação** | Extrair e passar tokens | Herdada do navegador |
| **CORS** | Não aplicável | Navegador impõe políticas |
| **JavaScript** | Não pode executar | Acesso total ao contexto do navegador |
| **Armazenamento de Cookies** | Instância separada | Armazenamento nativo de cookies do navegador |
| **Cabeçalhos** | Definidos manualmente | Navegador adiciona cabeçalhos padrão |
| **Caso de Uso** | Scripts do lado do servidor | Automação de navegador |
| **Configuração** | Biblioteca externa | Embutido no Pydoll |

## Veja Também

- **[Arquitetura de Requisições do Navegador](../../deep-dive/browser-requests-architecture.md)** - Implementação interna e arquitetura
- **[Monitoramento de Rede](monitoring.md)** - Observe todo o tráfego de rede
- **[Interceptação de Requisições](interception.md)** - Modifique requisições antes de serem enviadas
- **[Sistema de Eventos](../advanced/event-system.md)** - Reaja a eventos do navegador
- **[Análise Profunda: Capacidades de Rede](../../deep-dive/network-capabilities.md)** - Detalhes técnicos

Requisições no contexto do navegador são uma virada de jogo para automação híbrida. Combine o poder da automação de UI com a velocidade de chamadas diretas de API, tudo isso mantendo a continuidade perfeita da sessão!

================================================
FILE: docs/pt/features/network/interception.md
================================================
# Interceptação de Requisições

A interceptação de requisições permite que você intercepte, modifique, bloqueie ou simule (mock) requisições e respostas HTTP em tempo real. Isso é essencial para testes, otimização de desempenho, filtragem de conteúdo e simulação de várias condições de rede.

!!! info "Domínio Network vs Fetch"
    O **domínio Network** é para monitoramento passivo (observar o tráfego). O **domínio Fetch** é para interceptação ativa (modificar/bloquear requisições). Este guia foca na interceptação. Para monitoramento passivo, veja [Monitoramento de Rede](monitoring.md).

## Entendendo a Interceptação de Requisições

Quando você habilita a interceptação de requisições, o Pydoll pausa as requisições correspondentes antes que elas sejam enviadas ao servidor (ou após receber a resposta). Você então tem três opções:

1.  **Continuar**: Deixar a requisição prosseguir (opcionalmente com modificações)
2.  **Bloquear**: Falhar a requisição com um erro
3.  **Simular (Mock)**: Atender à requisição com uma resposta personalizada

```mermaid
sequenceDiagram
    participant Browser
    participant Pydoll
    participant Server
    
    Browser->>Pydoll: Requisição iniciada
    Note over Pydoll: Requisição Pausada
    Pydoll->>Pydoll: Callback executado
    
    alt Continuar
        Pydoll->>Server: Encaminhar requisição
        Server-->>Browser: Resposta
    else Bloquear
        Pydoll-->>Browser: Resposta de erro
    else Simular (Mock)
        Pydoll-->>Browser: Resposta personalizada
    end
```

!!! warning "Impacto no Desempenho"
    A interceptação de requisições adiciona latência a cada requisição correspondente. Intercepte apenas o que você precisa e desabilite quando terminar para evitar lentidão no carregamento das páginas.

## Habilitando a Interceptação de Requisições

Antes de interceptar requisições, você deve habilitar o domínio Fetch:

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def main():
    async with Chrome() as browser:
        tab = await browser.start()
        
        # Habilitar eventos fetch (intercepta todas as requisições por padrão)
        await tab.enable_fetch_events()
        
        await tab.go_to('https://example.com')
        
        # Desabilitar quando terminar
        await tab.disable_fetch_events()

asyncio.run(main())
```

### Interceptação Seletiva

Você pode filtrar quais requisições interceptar por tipo de recurso:

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def selective_interception():
    async with Chrome() as browser:
        tab = await browser.start()
        
        # Interceptar apenas imagens
        await tab.enable_fetch_events(
            resource_type='Image'  # Ou 'Stylesheet', 'Script', etc.
        )
        
        await tab.go_to('https://example.com')
        await tab.disable_fetch_events()

asyncio.run(selective_interception())
```

!!! tip "Tipos de Recurso"
    Veja a seção [Referência de Tipos de Recurso](#referência-de-tipos-de-recurso) para uma lista completa de tipos de recursos interceptáveis.

## Interceptando Requisições

Use o evento `RequestPaused` para interceptar requisições:

```python
import asyncio
from pydoll.browser.chromium import Chrome
from pydoll.protocol.fetch.events import FetchEvent, RequestPausedEvent

async def basic_interception():
    async with Chrome() as browser:
        tab = await browser.start()
        
        # Callback com dica de tipo para suporte da IDE
        async def handle_request(event: RequestPausedEvent):
            request_id = event['params']['requestId']
            url = event['params']['request']['url']
            
            print(f"Interceptado: {url}")
            
            # Continuar a requisição sem modificações
            await tab.continue_request(request_id)
        
        await tab.enable_fetch_events()
        await tab.on(FetchEvent.REQUEST_PAUSED, handle_request)
        
        await tab.go_to('https://example.com')
        await asyncio.sleep(3)
        
        await tab.disable_fetch_events()

asyncio.run(basic_interception())
```

!!! info "Dicas de Tipo para Melhor Suporte da IDE"
    Use dicas de tipo como `RequestPausedEvent` para obter autocompletar para as chaves do evento. Todos os tipos de evento estão em `pydoll.protocol.fetch.events`.

!!! note "Espera Pronta para Produção"
    Os exemplos neste guia usam `asyncio.sleep()` por simplicidade. Em código de produção, considere usar estratégias de espera mais explícitas, como esperar por elementos específicos ou implementar detecção de ociosidade da rede. Veja o guia [Monitoramento de Rede](monitoring.md) para técnicas avançadas.

## Casos de Uso Comuns

### 1. Bloqueando Recursos para Economizar Banda

Bloqueie imagens, folhas de estilo ou outros recursos para acelerar o carregamento da página:

```python
import asyncio
from pydoll.browser.chromium import Chrome
from pydoll.protocol.fetch.events import FetchEvent, RequestPausedEvent
from pydoll.protocol.network.types import ErrorReason

async def block_images():
    async with Chrome() as browser:
        tab = await browser.start()
        
        blocked_count = 0
        
        async def block_resource(event: RequestPausedEvent):
            nonlocal blocked_count
            request_id = event['params']['requestId']
            resource_type = event['params']['resourceType']
            url = event['params']['request']['url']
            
            # Bloquear imagens e folhas de estilo
            if resource_type in ['Image', 'Stylesheet']:
                blocked_count += 1
                print(f"🚫 Bloqueado {resource_type}: {url[:60]}")
                await tab.fail_request(request_id, ErrorReason.BLOCKED_BY_CLIENT)
            else:
                # Continuar outras requisições
                await tab.continue_request(request_id)
        
        await tab.enable_fetch_events()
        await tab.on(FetchEvent.REQUEST_PAUSED, block_resource)
        
        await tab.go_to('https://example.com')
        await asyncio.sleep(3)
        
        print(f"\n📊 Total bloqueado: {blocked_count} recursos")
        
        await tab.disable_fetch_events()

asyncio.run(block_images())
```

### 2. Modificando Cabeçalhos de Requisição

Adicione, modifique ou remova cabeçalhos antes que as requisições sejam enviadas:

```python
import asyncio
from pydoll.browser.chromium import Chrome
from pydoll.protocol.fetch.events import FetchEvent, RequestPausedEvent
from pydoll.protocol.fetch.types import HeaderEntry

async def modify_headers():
    async with Chrome() as browser:
        tab = await browser.start()
        
        async def add_custom_headers(event: RequestPausedEvent):
            request_id = event['params']['requestId']
            url = event['params']['request']['url']
            
            # Modificar apenas requisições de API
            if '/api/' in url:
                # Construir cabeçalhos personalizados (usando dica de tipo HeaderEntry para suporte da IDE)
                headers: list[HeaderEntry] = [
                    {'name': 'X-Custom-Header', 'value': 'MyValue'},
                    {'name': 'Authorization', 'value': 'Bearer my-token-123'},
                ]
                
                print(f"✨ Cabeçalhos modificados para: {url}")
                await tab.continue_request(request_id, headers=headers)
            else:
                await tab.continue_request(request_id)
        
        await tab.enable_fetch_events()
        await tab.on(FetchEvent.REQUEST_PAUSED, add_custom_headers)
        
        await tab.go_to('https://your-app.com')
        await asyncio.sleep(3)
        
        await tab.disable_fetch_events()

asyncio.run(modify_headers())
```

!!! tip "Dicas de Tipo para Cabeçalhos"
    `HeaderEntry` é um `TypedDict` de `pydoll.protocol.fetch.types`. Usá-lo como uma dica de tipo oferece autocompletar da IDE para as chaves `name` e `value`. Você também pode usar dicionários simples sem a dica de tipo.

!!! tip "Gerenciamento de Cabeçalhos"
    Quando você fornece cabeçalhos personalizados, eles **substituem** todos os cabeçalhos existentes. Certifique-se de incluir também os cabeçalhos padrão de que a requisição depende, como `User-Agent`, `Accept`, etc.

### 3. Simulando (Mocking) Respostas de API

Substitua respostas reais de API por dados simulados personalizados:

```python
import asyncio
import json
import base64
from pydoll.browser.chromium import Chrome
from pydoll.protocol.fetch.events import FetchEvent, RequestPausedEvent
from pydoll.protocol.fetch.types import HeaderEntry

async def mock_api_responses():
    async with Chrome() as browser:
        tab = await browser.start()
        
        async def mock_response(event: RequestPausedEvent):
            request_id = event['params']['requestId']
            url = event['params']['request']['url']
            
            # Simular endpoint de API específico
            if '/api/users' in url:
                # Criar dados de resposta simulada
                mock_data = {
                    'users': [
                        {'id': 1, 'name': 'Mock User 1'},
                        {'id': 2, 'name': 'Mock User 2'},
                    ],
                    'total': 2
                }
                
                # Converter para JSON e codificar em base64
                body_json = json.dumps(mock_data)
                body_base64 = base64.b64encode(body_json.encode()).decode()
                
                # Cabeçalhos da resposta
                headers: list[HeaderEntry] = [
                    {'name': 'Content-Type', 'value': 'application/json'},
                    {'name': 'Access-Control-Allow-Origin', 'value': '*'},
                ]
                
                print(f"🎭 Resposta simulada para: {url}")
                await tab.fulfill_request(
                    request_id=request_id,
                    response_code=200,
                    response_headers=headers,
                    body=body_base64,
                    response_phrase='OK'
                )
            else:
                # Continuar outras requisições normalmente
                await tab.continue_request(request_id)
        
        await tab.enable_fetch_events()
        await tab.on(FetchEvent.REQUEST_PAUSED, mock_response)
        
        await tab.go_to('https://your-app.com')
        await asyncio.sleep(3)
        
        await tab.disable_fetch_events()

asyncio.run(mock_api_responses())
```

!!! warning "Codificação Base64 Obrigatória"
    O parâmetro `body` em `fulfill_request()` deve ser codificado em base64. Use o módulo `base64` do Python para codificar seus dados de resposta.

### 4. Modificando URLs de Requisição

Redirecione requisições para URLs diferentes:

```python
import asyncio
from pydoll.browser.chromium import Chrome
from pydoll.protocol.fetch.events import FetchEvent, RequestPausedEvent

async def redirect_requests():
    async with Chrome() as browser:
        tab = await browser.start()
        
        async def redirect_url(event: RequestPausedEvent):
            request_id = event['params']['requestId']
            original_url = event['params']['request']['url']
            
            # Redirecionar requisições de CDN para servidor local
            if 'cdn.example.com' in original_url:
                new_url = original_url.replace(
                    'cdn.example.com',
                    'localhost:8080'
                )
                print(f"🔀 Redirecionado: {original_url} → {new_url}")
                await tab.continue_request(request_id, url=new_url)
            else:
                await tab.continue_request(request_id)
        
        await tab.enable_fetch_events()
        await tab.on(FetchEvent.REQUEST_PAUSED, redirect_url)
        
        await tab.go_to('https://example.com')
        await asyncio.sleep(3)
        
        await tab.disable_fetch_events()

asyncio.run(redirect_requests())
```

### 5. Modificando Corpo da Requisição

Modifique dados POST antes de enviar:

```python
import asyncio
import base64
from pydoll.browser.chromium import Chrome
from pydoll.protocol.fetch.events import FetchEvent, RequestPausedEvent

async def modify_post_data():
    async with Chrome() as browser:
        tab = await browser.start()
        
        async def modify_body(event: RequestPausedEvent):
            request_id = event['params']['requestId']
            method = event['params']['request']['method']
            url = event['params']['request']['url']
            
            # Modificar requisições POST
            if method == 'POST' and '/api/submit' in url:
                # Criar novos dados POST
                new_data = '{"modified": true, "timestamp": 123456789}'
                post_data_base64 = base64.b64encode(new_data.encode()).decode()
                
                print(f"✏️  Dados POST modificados para: {url}")
                await tab.continue_request(
                    request_id,
                    post_data=post_data_base64
                )
            else:
                await tab.continue_request(request_id)
        
        await tab.enable_fetch_events()
        await tab.on(FetchEvent.REQUEST_PAUSED, modify_body)
        
        await tab.go_to('https://your-app.com/form')
        await asyncio.sleep(3)
        
        await tab.disable_fetch_events()

asyncio.run(modify_post_data())
```

### 6. Lidando com Desafios de Autenticação

Responda manualmente a desafios de autenticação HTTP (Basic Auth, Digest Auth, etc.):

```python
import asyncio
from pydoll.browser.chromium import Chrome
from pydoll.protocol.fetch.events import FetchEvent, AuthRequiredEvent
from pydoll.protocol.fetch.types import AuthChallengeResponseType

async def handle_auth():
    async with Chrome() as browser:
        tab = await browser.start()
        
        async def respond_to_auth(event: AuthRequiredEvent):
            request_id = event['params']['requestId']
            auth_challenge = event['params']['authChallenge']
            
            print(f"🔐 Desafio de autenticação de: {auth_challenge['origin']}")
            print(f"   Esquema: {auth_challenge['scheme']}")
            print(f"   Realm: {auth_challenge.get('realm', 'N/A')}")
            
            # Fornecer credenciais para o desafio de autenticação
            await tab.continue_with_auth(
                request_id=request_id,
                auth_challenge_response=AuthChallengeResponseType.PROVIDE_CREDENTIALS,
                proxy_username='myuser',
                proxy_password='mypassword'
            )
        
        # Habilitar com tratamento de autenticação
        await tab.enable_fetch_events(handle_auth=True)
        await tab.on(FetchEvent.AUTH_REQUIRED, respond_to_auth)
        
        await tab.go_to('https://httpbin.org/basic-auth/myuser/mypassword')
        await asyncio.sleep(3)
        
        await tab.disable_fetch_events()

asyncio.run(handle_auth())
```

!!! note "Autenticação Automática de Proxy"
    **O Pydoll lida automaticamente com a autenticação de proxy** (407 Proxy Authentication Required) quando você configura credenciais de proxy através das opções do navegador. Este exemplo demonstra o **tratamento manual** de desafios de autenticação, que é útil para:
    
    - Autenticação HTTP Basic/Digest de servidores (401 Unauthorized)
    - Fluxos de autenticação personalizados
    - Seleção dinâmica de credenciais com base no desafio
    - Testar cenários de falha de autenticação
    
    Para uso padrão de proxy, simplesmente configure suas credenciais de proxy nas opções do navegador - não é necessário tratamento manual!

### 7. Simulando Erros de Rede

Teste como sua aplicação lida com falhas de rede:

```python
import asyncio
from pydoll.browser.chromium import Chrome
from pydoll.protocol.fetch.events import FetchEvent, RequestPausedEvent
from pydoll.protocol.network.types import ErrorReason

async def simulate_errors():
    async with Chrome() as browser:
        tab = await browser.start()
        
        request_count = 0
        
        async def fail_some_requests(event: RequestPausedEvent):
            nonlocal request_count
            request_id = event['params']['requestId']
            url = event['params']['request']['url']
            
            request_count += 1
            
            # Falhar a cada 3ª requisição
            if request_count % 3 == 0:
                print(f"❌ Simulando timeout para: {url[:60]}")
                await tab.fail_request(request_id, ErrorReason.TIMED_OUT)
            else:
                await tab.continue_request(request_id)
        
        await tab.enable_fetch_events()
        await tab.on(FetchEvent.REQUEST_PAUSED, fail_some_requests)
        
        await tab.go_to('https://example.com')
        await asyncio.sleep(3)
        
        await tab.disable_fetch_events()

asyncio.run(simulate_errors())
```

## Estágios da Requisição

Você pode interceptar requisições em diferentes estágios:

```python
import asyncio
from pydoll.browser.chromium import Chrome
from pydoll.protocol.fetch.types import RequestStage

async def intercept_responses():
    async with Chrome() as browser:
        tab = await browser.start()
        
        # Interceptar respostas em vez de requisições
        await tab.enable_fetch_events(request_stage=RequestStage.RESPONSE)
        
        # Agora você pode modificar respostas antes que elas cheguem à página
        await tab.go_to('https://example.com')
        await asyncio.sleep(3)
        
        await tab.disable_fetch_events()

asyncio.run(intercept_responses())
```

| Estágio | Quando Interceptado | Casos de Uso |
|---|---|---|
| `Request` (padrão) | Antes da requisição ser enviada | Modificar cabeçalhos, bloquear requisições, mudar URL |
| `Response` | Após a resposta ser recebida | Modificar corpo da resposta, mudar códigos de status |

!!! tip "Interceptação de Resposta"
    Ao interceptar no estágio `Request`, você pode passar `intercept_response=True` para `continue_request()` para também interceptar a resposta daquela requisição específica.

## Referência de Tipos de Recurso

| Tipo de Recurso | Descrição | Extensões de Arquivo Comuns |
|---|---|---|
| `Document` | Documentos HTML | `.html` |
| `Stylesheet` | Arquivos CSS | `.css` |
| `Image` | Recursos de imagem | `.jpg`, `.png`, `.gif`, `.webp`, `.svg` |
| `Media` | Áudio/vídeo | `.mp4`, `.webm`, `.mp3`, `.ogg` |
| `Font` | Fontes web | `.woff`, `.woff2`, `.ttf`, `.otf` |
| `Script` | JavaScript | `.js` |
| `TextTrack` | Legendas | `.vtt`, `.srt` |
| `XHR` | XMLHttpRequest | Requisições AJAX |
| `Fetch` | API Fetch | Chamadas de API modernas |
| `EventSource` | Server-Sent Events | Streams em tempo real |
| `WebSocket` | WebSocket | Comunicação bidirecional |
| `Manifest` | Manifesto de aplicativo web | Configuração de PWA |
| `Other` | Outros tipos | Diversos |

## Referência de Razões de Erro

Use estes valores de `ErrorReason` com `fail_request()` para simular diferentes falhas de rede:

| Razão do Erro | Descrição | Caso de Uso |
|---|---|---|
| `FAILED` | Falha genérica | Erro geral |
| `ABORTED` | Requisição abortada | Usuário cancelou |
| `TIMED_OUT` | Timeout da requisição | Timeout de rede |
| `ACCESS_DENIED` | Acesso negado | Erro de permissão |
| `CONNECTION_CLOSED` | Conexão fechada | Servidor desconectou |
| `CONNECTION_RESET` | Conexão resetada | Reset de rede |
| `CONNECTION_REFUSED` | Conexão recusada | Servidor inacessível |
| `NAME_NOT_RESOLVED` | Falha no DNS | Hostname inválido |
| `INTERNET_DISCONNECTED` | Sem internet | Modo offline |
| `BLOCKED_BY_CLIENT` | Bloqueado pelo cliente | Simulação de ad blocker |
| `BLOCKED_BY_RESPONSE` | Resposta bloqueada | Violação de CORS/CSP |

## Melhores Práticas

### 1. Sempre Continue ou Falhe as Requisições

```python
# Bom: Toda requisição pausada é tratada
async def handle_request(event: RequestPausedEvent):
    request_id = event['params']['requestId']
    try:
        # Sua lógica aqui
        await tab.continue_request(request_id)
    except Exception as e:
        # Falhar em caso de erro para evitar travamento
        await tab.fail_request(request_id, ErrorReason.FAILED)

# Ruim: Requisição pode travar se o callback lançar exceção
async def handle_request(event: RequestPausedEvent):
    request_id = event['params']['requestId']
    # Se isso lançar exceção, a requisição trava para sempre
    await tab.continue_request(request_id)
```

### 2. Use Interceptação Seletiva

```python
# Bom: Intercepte apenas o que você precisa
await tab.enable_fetch_events(resource_type='Image')

# Ruim: Intercepta tudo, torna todas as requisições mais lentas
await tab.enable_fetch_events()
```

### 3. Desabilite Quando Terminar

```python
# Bom: Limpe depois de usar
await tab.enable_fetch_events()
# ... faça o trabalho ...
await tab.disable_fetch_events()

# Ruim: Deixa a interceptação habilitada
await tab.enable_fetch_events()
# ... faça o trabalho ...
# (nunca desabilitado)
```

### 4. Trate Erros Graciosamente

```python
# Bom: Envolva em try/except
async def safe_handler(event: RequestPausedEvent):
    request_id = event['params']['requestId']
    try:
        # Lógica complexa que pode falhar
        modified_url = transform_url(event['params']['request']['url'])
        await tab.continue_request(request_id, url=modified_url)
    except Exception as e:
        print(f"Erro ao tratar requisição: {e}")
        # Continue sem modificações em caso de erro
        await tab.continue_request(request_id)
```

## Exemplo Completo: Controle Avançado de Requisições

Aqui está um exemplo completo combinando múltiplas técnicas de interceptação:

```python
import asyncio
import base64
import json
from pydoll.browser.chromium import Chrome
from pydoll.protocol.fetch.events import FetchEvent, RequestPausedEvent
from pydoll.protocol.fetch.types import HeaderEntry
from pydoll.protocol.network.types import ErrorReason

async def advanced_interception():
    async with Chrome() as browser:
        tab = await browser.start()
        
        stats = {
            'blocked': 0,
            'mocked': 0,
            'modified': 0,
            'continued': 0
        }
        
        async def intelligent_handler(event: RequestPausedEvent):
            request_id = event['params']['requestId']
            url = event['params']['request']['url']
            resource_type = event['params']['resourceType']
            method = event['params']['request']['method']
            
            try:
                # Bloquear anúncios e rastreadores
                if any(tracker in url for tracker in ['analytics', 'ads', 'tracking']):
                    stats['blocked'] += 1
                    print(f"🚫 Bloqueado rastreador: {url[:50]}")
                    await tab.fail_request(request_id, ErrorReason.BLOCKED_BY_CLIENT)
                
                # Simular (mock) respostas de API
                elif '/api/config' in url:
                    stats['mocked'] += 1
                    mock_config = {'feature_x': True, 'debug_mode': False}
                    body = base64.b64encode(json.dumps(mock_config).encode()).decode()
                    headers: list[HeaderEntry] = [
                        {'name': 'Content-Type', 'value': 'application/json'},
                    ]
                    print(f"🎭 API de configuração simulada")
                    await tab.fulfill_request(
                        request_id, 200, headers, body, 'OK'
                    )
                
                # Adicionar cabeçalhos de autenticação a requisições de API
                elif '/api/' in url and method == 'GET':
                    stats['modified'] += 1
                    headers: list[HeaderEntry] = [
                        {'name': 'Authorization', 'value': 'Bearer token-123'},
                    ]
                    print(f"✨ Adicionado auth para: {url[:50]}")
                    await tab.continue_request(request_id, headers=headers)
                
                # Continuar todo o resto normalmente
                else:
                    stats['continued'] += 1
                    await tab.continue_request(request_id)
                    
            except Exception as e:
                print(f"⚠️  Erro ao tratar requisição: {e}")
                # Sempre continuar em caso de erro para evitar travamento
                await tab.continue_request(request_id)
        
        # Habilitar interceptação
        await tab.enable_fetch_events()
        await tab.on(FetchEvent.REQUEST_PAUSED, intelligent_handler)
        
        # Navegar
        await tab.go_to('https://example.com')
        await asyncio.sleep(5)
        
        # Imprimir estatísticas
        print(f"\n📊 Estatísticas de Interceptação:")
        print(f"   Bloqueados: {stats['blocked']}")
        print(f"   Simulados: {stats['mocked']}")
        print(f"   Modificados: {stats['modified']}")
        print(f"   Continuados: {stats['continued']}")
        print(f"   Total: {sum(stats.values())}")
        
        # Limpeza
        await tab.disable_fetch_events()

asyncio.run(advanced_interception())
```

## Veja Também

- **[Monitoramento de Rede](monitoring.md)** - Observação passiva de tráfego de rede
- **[Domínio Fetch do CDP](../../deep-dive/network-capabilities.md#fetch-domain)** - Análise profunda sobre o domínio Fetch
- **[Sistema de Eventos](../advanced/event-system.md)** - Entendendo a arquitetura de eventos do Pydoll

A interceptação de requisições é uma ferramenta poderosa para testes, otimização e simulação (mocking). Domine essas técnicas para construir scripts de automação de navegador robustos e eficientes.

================================================
FILE: docs/pt/features/network/monitoring.md
================================================
# Monitoramento de Rede

O monitoramento de rede no Pydoll permite observar e analisar requisições HTTP, respostas e outras atividades de rede durante a automação do navegador. Isso é essencial para depuração, análise de desempenho, testes de API e para entender como as aplicações web se comunicam com os servidores.

!!! info "Domínio Network vs Fetch"
    O **domínio Network** é para monitoramento passivo (observar o tráfego). O **domínio Fetch** é para interceptação ativa (modificar requisições/respostas). Este guia foca no monitoramento. Para interceptação de requisições, veja **[Interceptação de Requisições](interception.md)**.

## Habilitando Eventos de Rede

Antes de poder monitorar a atividade de rede, você deve habilitar o domínio Network:

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def main():
    async with Chrome() as browser:
        tab = await browser.start()
        
        # Habilitar monitoramento de rede
        await tab.enable_network_events()
        
        # Agora navegue
        await tab.go_to('https://api.github.com')
        
        # Não se esqueça de desabilitar quando terminar (opcional, mas recomendado)
        await tab.disable_network_events()

asyncio.run(main())
```

!!! warning "Habilite Antes de Navegar"
    Sempre habilite os eventos de rede **antes** de navegar para capturar todas as requisições. Requisições feitas antes da habilitação não serão capturadas.

## Obtendo Logs de Rede

O Pydoll armazena automaticamente os logs de rede quando os eventos de rede estão habilitados. Você pode recuperá-los usando `get_network_logs()`:

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def analyze_requests():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.enable_network_events()
        
        # Navegar para uma página
        await tab.go_to('https://httpbin.org/json')
        
        # Esperar a página carregar completamente
        await asyncio.sleep(2)
        
        # Obter todos os logs de rede
        logs = await tab.get_network_logs()
        
        print(f"Total de requisições capturadas: {len(logs)}")
        
        for log in logs:
            request = log['params']['request']
            print(f"→ {request['method']} {request['url']}")

asyncio.run(analyze_requests())
```

!!! note "Espera Pronta para Produção"
    Os exemplos acima usam `asyncio.sleep(2)` por simplicidade. Em código de produção, considere usar estratégias de espera mais explícitas:
    
    - Esperar por elementos específicos aparecerem
    - Usar o [Sistema de Eventos](../advanced/event-system.md) para detectar quando todos os recursos foram carregados
    - Implementar detecção de ociosidade da rede (veja a seção Monitoramento de Rede em Tempo Real)
    
    Isso garante que sua automação espere exatamente o tempo necessário, nem mais, nem menos.

### Filtrando Logs de Rede

Você pode filtrar logs por padrão de URL:

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def filter_logs_example():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.enable_network_events()
        await tab.go_to('https://example.com')
        await asyncio.sleep(2)
        
        # Obter todos os logs
        all_logs = await tab.get_network_logs()
        
        # Obter logs para um domínio específico
        api_logs = await tab.get_network_logs(filter='api.example.com')
        
        # Obter logs para um endpoint específico
        user_logs = await tab.get_network_logs(filter='/api/users')

asyncio.run(filter_logs_example())
```

## Entendendo a Estrutura de Eventos de Rede

Os logs de rede contêm informações detalhadas sobre cada requisição. Aqui está a estrutura:

### Evento RequestWillBeSent

Este evento é disparado quando uma requisição está prestes a ser enviada:

```python
{
    'method': 'Network.requestWillBeSent',
    'params': {
        'requestId': 'unique-request-id',
        'loaderId': 'loader-id',
        'documentURL': 'https://example.com',
        'request': {
            'url': 'https://api.example.com/data',
            'method': 'GET',  # ou 'POST', 'PUT', 'DELETE', etc.
            'headers': {
                'User-Agent': 'Chrome/...',
                'Accept': 'application/json',
                ...
            },
            'postData': '...',  # Presente apenas para requisições POST/PUT
            'initialPriority': 'High',
            'referrerPolicy': 'strict-origin-when-cross-origin'
        },
        'timestamp': 1234567890.123,
        'wallTime': 1234567890.123,
        'initiator': {
            'type': 'script',  # ou 'parser', 'other'
            'stack': {...}  # Call stack se iniciado por script
        },
        'type': 'XHR',  # Tipo de recurso: Document, Script, Image, XHR, etc.
        'frameId': 'frame-id',
        'hasUserGesture': False
    }
}
```

### Referência de Campos Chave

| Campo | Localização | Tipo | Descrição |
|---|---|---|---|
| `requestId` | `params.requestId` | `str` | Identificador único para esta requisição |
| `url` | `params.request.url` | `str` | URL completa da requisição |
| `method` | `params.request.method` | `str` | Método HTTP (GET, POST, etc.) |
| `headers` | `params.request.headers` | `dict` | Cabeçalhos da requisição |
| `postData` | `params.request.postData` | `str` | Corpo da requisição (POST/PUT) |
| `timestamp` | `params.timestamp` | `float` | Timestamp monotônico do momento em que a requisição foi iniciada |
| `type` | `params.type` | `str` | Tipo de recurso (Document, XHR, Image, etc.) |
| `initiator` | `params.initiator` | `dict` | O que disparou esta requisição |

## Obtendo Corpos de Resposta

Para obter o conteúdo real da resposta, use `get_network_response_body()`:

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def fetch_api_response():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.enable_network_events()
        
        # Navegar para o endpoint da API
        await tab.go_to('https://httpbin.org/json')
        await asyncio.sleep(2)
        
        # Obter todas as requisições
        logs = await tab.get_network_logs()
        
        for log in logs:
            request_id = log['params']['requestId']
            url = log['params']['request']['url']
            
            # Obter resposta apenas para o endpoint JSON
            if 'httpbin.org/json' in url:
                try:
                    # Obter corpo da resposta
                    response_body = await tab.get_network_response_body(request_id)
                    print(f"Resposta de {url}:")
                    print(response_body)
                except Exception as e:
                    print(f"Não foi possível obter o corpo da resposta: {e}")

asyncio.run(fetch_api_response())
```

!!! warning "Disponibilidade do Corpo da Resposta"
    Corpos de resposta estão disponíveis apenas para requisições que foram concluídas. Além disso, alguns tipos de resposta (como imagens ou redirecionamentos) podem não ter corpos acessíveis.

## Casos de Uso Práticos

### 1. Teste e Validação de API

Monitore chamadas de API para verificar se as requisições corretas estão sendo feitas:

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def validate_api_calls():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.enable_network_events()
        
        # Navegar para sua aplicação
        await tab.go_to('https://your-app.com')
        
        # Disparar alguma ação que faça chamadas de API
        button = await tab.find(id='load-data-button')
        await button.click()
        await asyncio.sleep(2)
        
        # Obter logs da API
        api_logs = await tab.get_network_logs(filter='/api/')
        
        print(f"\n📊 Resumo das Chamadas de API:")
        print(f"Total de chamadas de API: {len(api_logs)}")
        
        for log in api_logs:
            request = log['params']['request']
            method = request['method']
            url = request['url']
            
            # Verificar se o cabeçalho de autenticação correto está presente
            headers = request.get('headers', {})
            has_auth = 'Authorization' in headers or 'authorization' in headers
            
            print(f"\n{method} {url}")
            print(f"  ✓ Possui Autorização: {has_auth}")
            
            # Validar dados POST se aplicável
            if method == 'POST' and 'postData' in request:
                print(f"  📤 Corpo: {request['postData'][:100]}...")

asyncio.run(validate_api_calls())
```

### 2. Análise de Desempenho

Analise o tempo das requisições e identifique recursos lentos:

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def analyze_performance():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.enable_network_events()
        
        await tab.go_to('https://example.com')
        await asyncio.sleep(5)
        
        logs = await tab.get_network_logs()
        
        # Armazenar dados de tempo
        timings = []
        
        for log in logs:
            params = log['params']
            request_id = params['requestId']
            url = params['request']['url']
            resource_type = params.get('type', 'Other')
            
            timings.append({
                'url': url,
                'type': resource_type,
                'timestamp': params['timestamp']
            })
        
        # Ordenar por timestamp
        timings.sort(key=lambda x: x['timestamp'])
        
        print("\n⏱️  Linha do Tempo das Requisições:")
        start_time = timings[0]['timestamp'] if timings else 0
        
        for timing in timings[:20]:  # Mostrar as primeiras 20
            elapsed = (timing['timestamp'] - start_time) * 1000  # Converter para ms
            print(f"{elapsed:7.0f}ms | {timing['type']:12} | {timing['url'][:80]}")

asyncio.run(analyze_performance())
```

### 3. Detectando Recursos Externos

Encontre todos os domínios externos aos quais sua página se conecta:

```python
import asyncio
from urllib.parse import urlparse
from collections import Counter
from pydoll.browser.chromium import Chrome

async def analyze_domains():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.enable_network_events()
        
        await tab.go_to('https://news.ycombinator.com')
        await asyncio.sleep(5)
        
        logs = await tab.get_network_logs()
        
        # Contar requisições por domínio
        domains = Counter()
        
        for log in logs:
            url = log['params']['request']['url']
            try:
                domain = urlparse(url).netloc
                if domain:
                    domains[domain] += 1
            except:
                pass
        
        print("\n🌐 Domínios Externos:")
        for domain, count in domains.most_common(10):
            print(f"  {count:3} requisições | {domain}")

asyncio.run(analyze_domains())
```

### 4. Monitorando Tipos Específicos de Recursos

Rastreie tipos específicos de recursos, como imagens ou scripts:

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def track_resource_types():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.enable_network_events()
        
        await tab.go_to('https://example.com')
        await asyncio.sleep(3)
        
        logs = await tab.get_network_logs()
        
        # Agrupar por tipo de recurso
        by_type = {}
        
        for log in logs:
            params = log['params']
            resource_type = params.get('type', 'Other')
            url = params['request']['url']
            
            if resource_type not in by_type:
                by_type[resource_type] = []
            
            by_type[resource_type].append(url)
        
        print("\n📦 Recursos por Tipo:")
        for rtype in sorted(by_type.keys()):
            urls = by_type[rtype]
            print(f"\n{rtype}: {len(urls)} recurso(s)")
            for url in urls[:3]:  # Mostrar os 3 primeiros
                print(f"  • {url}")
            if len(urls) > 3:
                print(f"  ... e mais {len(urls) - 3}")

asyncio.run(track_resource_types())
```

## Monitoramento de Rede em Tempo Real

Para monitoramento em tempo real, use callbacks de eventos em vez de consultar `get_network_logs()`:

!!! info "Entendendo Eventos"
    O monitoramento em tempo real usa o sistema de eventos do Pydoll para reagir à atividade de rede assim que ela acontece. Para uma análise profunda de como os eventos funcionam, veja **[Sistema de Eventos](../advanced/event-system.md)**.

```python
import asyncio
from pydoll.browser.chromium import Chrome
from pydoll.protocol.network.events import (
    NetworkEvent,
    RequestWillBeSentEvent,
    ResponseReceivedEvent,
    LoadingFailedEvent
)

async def real_time_monitoring():
    async with Chrome() as browser:
        tab = await browser.start()
        
        # Estatísticas
        stats = {
            'requests': 0,
            'responses': 0,
            'failed': 0
        }
        
        # Callback de requisição
        async def on_request(event: RequestWillBeSentEvent):
            stats['requests'] += 1
            url = event['params']['request']['url']
            method = event['params']['request']['method']
            print(f"→ {method:6} | {url}")
        
        # Callback de resposta
        async def on_response(event: ResponseReceivedEvent):
            stats['responses'] += 1
            response = event['params']['response']
            status = response['status']
            url = response['url']
            
            # Código de cor por status
            if 200 <= status < 300:
                color = '\033[92m'  # Verde
            elif 300 <= status < 400:
                color = '\033[93m'  # Amarelo
            else:
                color = '\033[91m'  # Vermelho
            reset = '\033[0m'
            
            print(f"← {color}{status}{reset} | {url}")
        
        # Callback de falha
        async def on_failed(event: LoadingFailedEvent):
            stats['failed'] += 1
            error = event['params']['errorText']
            print(f"✗ FALHOU: {error}")
        
        # Habilitar e registrar callbacks
        await tab.enable_network_events()
        await tab.on(NetworkEvent.REQUEST_WILL_BE_SENT, on_request)
        await tab.on(NetworkEvent.RESPONSE_RECEIVED, on_response)
        await tab.on(NetworkEvent.LOADING_FAILED, on_failed)
        
        # Navegar
        await tab.go_to('https://example.com')
        await asyncio.sleep(5)
        
        print(f"\n📊 Resumo:")
        print(f"  Requisições: {stats['requests']}")
        print(f"  Respostas: {stats['responses']}")
        print(f"  Falhas: {stats['failed']}")

asyncio.run(real_time_monitoring())
```

## Referência de Tipos de Recurso

O Pydoll captura os seguintes tipos de recurso:

| Tipo | Descrição | Exemplos |
|---|---|---|
| `Document` | Documentos HTML principais | Carregamentos de página, fontes de iframe |
| `Stylesheet` | Arquivos CSS | .css externo, estilos inline |
| `Image` | Recursos de imagem | .jpg, .png, .gif, .webp, .svg |
| `Media` | Arquivos de áudio/vídeo | .mp4, .webm, .mp3, .ogg |
| `Font` | Fontes web | .woff, .woff2, .ttf, .otf |
| `Script` | Arquivos JavaScript | Arquivos .js, scripts inline |
| `TextTrack` | Arquivos de legenda | .vtt, .srt |
| `XHR` | XMLHttpRequest | Requisições AJAX, chamadas de API legadas |
| `Fetch` | Requisições da API Fetch | Chamadas de API modernas |
| `EventSource` | Server-Sent Events | Streams em tempo real |
| `WebSocket` | Conexões WebSocket | Comunicação bidirecional |
| `Manifest` | Manifestos de aplicativos web | Configuração de PWA |
| `Other` | Outros tipos de recurso | Diversos |

## Avançado: Extraindo Tempos de Resposta

Eventos de rede incluem informações detalhadas de tempo:

```python
import asyncio
from pydoll.browser.chromium import Chrome
from pydoll.protocol.network.events import NetworkEvent, ResponseReceivedEvent

async def analyze_timing():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.enable_network_events()
        
        # Callback personalizado para capturar tempos
        timing_data = []
        
        async def on_response(event: ResponseReceivedEvent):
            response = event['params']['response']
            timing = response.get('timing')
            
            if timing:
                # Calcular diferentes fases
                dns_time = timing.get('dnsEnd', 0) - timing.get('dnsStart', 0)
                connect_time = timing.get('connectEnd', 0) - timing.get('connectStart', 0)
                ssl_time = timing.get('sslEnd', 0) - timing.get('sslStart', 0)
                send_time = timing.get('sendEnd', 0) - timing.get('sendStart', 0)
                wait_time = timing.get('receiveHeadersStart', 0) - timing.get('sendEnd', 0)
                receive_time = timing.get('receiveHeadersEnd', 0) - timing.get('receiveHeadersStart', 0)
                
                timing_data.append({
                    'url': response['url'][:50],
                    'dns': dns_time if dns_time > 0 else 0,
                    'connect': connect_time if connect_time > 0 else 0,
                    'ssl': ssl_time if ssl_time > 0 else 0,
                    'send': send_time,
                    'wait': wait_time,
                    'receive': receive_time,
                    'total': receive_time + wait_time + send_time
                })
        
        await tab.on(NetworkEvent.RESPONSE_RECEIVED, on_response)
        await tab.go_to('https://github.com')
        await asyncio.sleep(5)
        
        # Imprimir detalhamento de tempo
        print("\n⏱️  Detalhamento de Tempo da Requisição (ms):")
        print(f"{'URL':<50} | {'DNS':>6} | {'Connect':>8} | {'SSL':>6} | {'Send':>6} | {'Wait':>6} | {'Receive':>8} | {'Total':>7}")
        print("-" * 120)
        
        for data in sorted(timing_data, key=lambda x: x['total'], reverse=True)[:10]:
            print(f"{data['url']:<50} | {data['dns']:6.1f} | {data['connect']:8.1f} | {data['ssl']:6.1f} | "
                  f"{data['send']:6.1f} | {data['wait']:6.1f} | {data['receive']:8.1f} | {data['total']:7.1f}")

asyncio.run(analyze_timing())
```

## Explicação dos Campos de Tempo

| Fase | Campos | Descrição |
|---|---|---|
| **DNS** | `dnsStart` → `dnsEnd` | Tempo de lookup DNS |
| **Connect** | `connectStart` → `connectEnd` | Estabelecimento da conexão TCP |
| **SSL** | `sslStart` → `sslEnd` | Handshake SSL/TLS |
| **Send** | `sendStart` → `sendEnd` | Tempo para enviar a requisição |
| **Wait** | `sendEnd` → `receiveHeadersStart` | Esperando pela resposta do servidor (TTFB) |
| **Receive** | `receiveHeadersStart` → `receiveHeadersEnd` | Tempo para receber os cabeçalhos da resposta |

!!! tip "Time to First Byte (TTFB)"
    TTFB é a fase "Wait" - o tempo entre enviar a requisição e receber o primeiro byte da resposta. Isso é crucial para análise de desempenho.

## Melhores Práticas

### 1. Habilite Eventos de Rede Apenas Quando Necessário

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def best_practice_enable():
    async with Chrome() as browser:
        tab = await browser.start()
        
        # Bom: Habilitar antes da navegação, desabilitar depois
        await tab.enable_network_events()
        await tab.go_to('https://example.com')
        await asyncio.sleep(2)
        logs = await tab.get_network_logs()
        await tab.disable_network_events()
        
        # Ruim: Deixar habilitado durante toda a sessão
        # await tab.enable_network_events()
        # ... longa sessão de automação ...
```

### 2. Filtre Logs para Reduzir o Uso de Memória

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def best_practice_filter():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.enable_network_events()
        await tab.go_to('https://example.com')
        await asyncio.sleep(2)
        
        # Bom: Filtrar por requisições específicas
        api_logs = await tab.get_network_logs(filter='/api/')
        
        # Ruim: Obter todos os logs quando você só precisa de específicos
        all_logs = await tab.get_network_logs()
        filtered = [log for log in all_logs if '/api/' in log['params']['request']['url']]
```

### 3. Acesse Campos Faltantes com Segurança

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def best_practice_safe_access():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.enable_network_events()
        await tab.go_to('https://example.com')
        await asyncio.sleep(2)
        
        logs = await tab.get_network_logs()
        
        # Bom: Acesso seguro com .get()
        for log in logs:
            params = log.get('params', {})
            request = params.get('request', {})
            url = request.get('url', 'Unknown')
            post_data = request.get('postData')  # Pode ser None
            
            if post_data:
                print(f"Dados POST: {post_data}")
        
        # Ruim: Acesso direto pode levantar KeyError
        # url = log['params']['request']['url']
        # post_data = log['params']['request']['postData']  # Pode não existir!
```

### 4. Use Callbacks de Evento para Necessidades em Tempo Real

```python
import asyncio
from pydoll.protocol.network.events import NetworkEvent, RequestWillBeSentEvent

# Bom: Monitoramento em tempo real com callbacks
async def on_request(event: RequestWillBeSentEvent):
    print(f"Nova requisição: {event['params']['request']['url']}")

await tab.on(NetworkEvent.REQUEST_WILL_BE_SENT, on_request)

# Ruim: Consultar logs repetidamente (ineficiente)
while True:
    logs = await tab.get_network_logs()
    # Processar logs...
    await asyncio.sleep(0.5)  # Desperdício!
```

## Veja Também

- **[Domínio de Rede CDP](../../deep-dive/network-capabilities.md)** - Análise profunda sobre as capacidades de rede
- **[Sistema de Eventos](../advanced/event-system.md)** - Entendendo a arquitetura de eventos do Pydoll
- **[Interceptação de Requisições](interception.md)** - Modificando requisições e respostas

================================================
FILE: docs/pt/features/network/network-recording.md
================================================
# Gravação de Rede HAR

Capture toda a atividade de rede durante uma sessão do navegador e exporte como um arquivo HAR (HTTP Archive) 1.2 padrão. Perfeito para depuração, análise de desempenho e fixtures de teste.

!!! tip "Depure Como um Profissional"
    Arquivos HAR são o padrão da indústria para gravar tráfego de rede. Você pode importá-los diretamente no Chrome DevTools, Charles Proxy ou qualquer visualizador HAR para análise detalhada.

## Por que Usar Gravacao HAR?

| Caso de Uso | Beneficio |
|-------------|-----------|
| Depurar requisicoes com falha | Veja headers exatos, timing e corpos de resposta |
| Analise de desempenho | Identifique requisicoes lentas e gargalos |
| Documentacao de API | Capture pares reais de requisicao/resposta |
| Fixtures de teste | Grave trafego real para mocking em testes |

## Inicio Rapido

Grave todo o tráfego de rede durante uma navegação:

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def gravar_trafego():
    async with Chrome() as browser:
        tab = await browser.start()

        async with tab.request.record() as capture:
            await tab.go_to('https://example.com')

        # Salve a captura como arquivo HAR
        capture.save('flow.har')
        print(f'Capturadas {len(capture.entries)} requisicoes')

asyncio.run(gravar_trafego())
```

## API de Gravacao

### `tab.request.record(resource_types=None)`

Gerenciador de contexto que captura o tráfego de rede na aba.

| Parametro | Tipo | Descricao |
|-----------|------|-----------|
| `resource_types` | `list[ResourceType] \| None` | Lista opcional de tipos de recurso a capturar. Quando `None` (padrao), todos os tipos sao capturados. |

```python
async with tab.request.record() as capture:
    # Toda atividade de rede dentro deste bloco e capturada
    await tab.go_to('https://example.com')
    await (await tab.find(id='search')).type_text('pydoll')
    await (await tab.find(type='submit')).click()
```

O objeto `capture` (`HarCapture`) fornece:

| Propriedade/Metodo | Descricao |
|-------------------|-----------|
| `capture.entries` | Lista de entradas HAR capturadas |
| `capture.to_dict()` | Dict HAR 1.2 completo (para processamento customizado) |
| `capture.save(path)` | Salvar como arquivo JSON HAR |

### Filtrando por Tipo de Recurso

Grave apenas tipos de recurso específicos ao invés de todo o tráfego:

```python
from pydoll.protocol.network.types import ResourceType

# Gravar apenas requisicoes fetch/XHR (ignorar documentos, imagens, etc.)
async with tab.request.record(
    resource_types=[ResourceType.FETCH, ResourceType.XHR]
) as capture:
    await tab.go_to('https://example.com')

# Gravar apenas documentos e folhas de estilo
async with tab.request.record(
    resource_types=[ResourceType.DOCUMENT, ResourceType.STYLESHEET]
) as capture:
    await tab.go_to('https://example.com')
```

Valores disponiveis de `ResourceType`:

| Valor | Descricao |
|-------|-----------|
| `ResourceType.DOCUMENT` | Documentos HTML |
| `ResourceType.STYLESHEET` | Folhas de estilo CSS |
| `ResourceType.SCRIPT` | Arquivos JavaScript |
| `ResourceType.IMAGE` | Imagens |
| `ResourceType.FONT` | Fontes web |
| `ResourceType.MEDIA` | Audio/video |
| `ResourceType.FETCH` | Requisicoes Fetch API |
| `ResourceType.XHR` | Chamadas XMLHttpRequest |
| `ResourceType.WEB_SOCKET` | Conexoes WebSocket |
| `ResourceType.OTHER` | Outros tipos de recurso |

### Salvando Capturas

```python
# Salvar como arquivo HAR (pode ser aberto no Chrome DevTools)
capture.save('flow.har')

# Salvar em diretorio aninhado (criado automaticamente)
capture.save('recordings/session1/flow.har')

# Acessar o dict HAR bruto para processamento customizado
har_dict = capture.to_dict()
print(har_dict['log']['version'])  # "1.2"
```

### Inspecionando Entradas

```python
async with tab.request.record() as capture:
    await tab.go_to('https://example.com')

for entry in capture.entries:
    req = entry['request']
    resp = entry['response']
    print(f"{req['method']} {req['url']} -> {resp['status']}")
```

## Uso Avancado

### Filtrando Entradas Capturadas

```python
async with tab.request.record() as capture:
    await tab.go_to('https://example.com')

# Filtrar apenas chamadas de API
api_entries = [
    e for e in capture.entries
    if '/api/' in e['request']['url']
]

# Filtrar apenas requisicoes com falha
falhas = [
    e for e in capture.entries
    if e['response']['status'] >= 400
]
```

### Processamento HAR Customizado

```python
har = capture.to_dict()

# Contar requisicoes por tipo
from collections import Counter
tipos = Counter(
    e.get('_resourceType', 'Other')
    for e in har['log']['entries']
)
print(tipos)  # Counter({'Document': 1, 'Script': 5, 'Stylesheet': 3, ...})
```

## Formato de Arquivo HAR

O HAR exportado segue a [especificação HAR 1.2](http://www.softwareishard.com/blog/har-12-spec/). Cada entrada contém:

- **Request**: método, URL, headers, parâmetros de query, dados POST
- **Response**: status, headers, corpo da resposta (texto ou codificado em base64)
- **Timings**: DNS, conexão, SSL, envio, espera (TTFB), recebimento
- **Metadata**: IP do servidor, ID de conexão, tipo de recurso

!!! note "Corpos de Resposta"
    Os corpos de resposta são capturados automaticamente após cada requisição ser concluída. Conteúdo binário (imagens, fontes, etc.) é armazenado como strings codificadas em base64.


================================================
FILE: docs/pt/index.md
================================================
<p align="center">
    <img src="../resources/images/logo.png" alt="Pydoll Logo" /> <br><br>
</p>

<p align="center">
    <a href="https://codecov.io/gh/autoscrape-labs/pydoll">
        <img src="https://codecov.io/gh/autoscrape-labs/pydoll/graph/badge.svg?token=40I938OGM9"/>
    </a>
    <img src="https://github.com/thalissonvs/pydoll/actions/workflows/tests.yml/badge.svg" alt="Testes">
    <img src="https://github.com/thalissonvs/pydoll/actions/workflows/ruff-ci.yml/badge.svg" alt="Ruff CI">
    <img src="https://github.com/thalissonvs/pydoll/actions/workflows/release.yml/badge.svg" alt="Release">
    <img src="https://github.com/thalissonvs/pydoll/actions/workflows/mypy.yml/badge.svg" alt="MyPy CI">
</p>


# Bem-vindo ao Pydoll

Olá! Obrigado por conferir o Pydoll, a próxima geração de automação de navegadores para Python. Se você está cansado de lidar com webdrivers e procura uma maneira mais suave e confiável de automatizar navegadores, você está no lugar certo.

## O que é o Pydoll?

O Pydoll está revolucionando a automação de navegadores, **eliminando completamente a necessidade de webdrivers**! Ao contrário de outras soluções que dependem de dependências externas, o Pydoll se conecta diretamente aos navegadores usando o Chrome DevTools Protocol, proporcionando uma experiência de automação perfeita e confiável com desempenho assíncrono nativo.

Seja para extrair dados, [testar aplicativos web](https://www.lambdatest.com/web-testing) ou automatizar tarefas repetitivas, o Pydoll torna tudo surpreendentemente fácil com sua API intuitiva e recursos poderosos. 

## Instalação

Crie e ative um [ambiente virtual](https://docs.python.org/3/tutorial/venv.html) primeiro e, em seguida, instale o Pydoll:

<div class="termy">
```bash
$ pip install pydoll-python

---> 100%
```
</div>

Para a versão de desenvolvimento mais recente, você pode instalar diretamente do GitHub:

```bash
$ pip install git+https://github.com/autoscrape-labs/pydoll.git
```

## Por que escolher o Pydoll?

- **Simplicidade Genuína**: Não queremos que você perca tempo configurando drivers ou lidando com problemas de compatibilidade. Com o Pydoll, você instala e está pronto para automatizar.
- **Interações Verdadeiramente Humanas**: Nossos algoritmos simulam padrões de comportamento humano reais, desde o tempo entre os cliques até a forma como o mouse se move pela tela.
- **Desempenho Assíncrono Nativo**: Construído do zero com `asyncio`, o Pydoll não apenas suporta operações assíncronas, mas foi projetado para elas.
- **Inteligência Integrada**: Bypass automático de captchas Cloudflare Turnstile e reCAPTCHA v3, sem serviços externos ou configurações complexas.
- **Monitoramento de Rede Poderoso**: Intercepte, modifique e analise todo o tráfego de rede com facilidade, dando a você controle total sobre as requisições.
- **Arquitetura Orientada a Eventos**: Reaja a eventos da página, requisições de rede e interações do usuário em tempo real.
- **Localização de Elementos Intuitiva**: Métodos modernos `find()` e `query()` que fazem sentido e funcionam como você esperaria.
- **Segurança de Tipos Robusta**: Sistema de tipos abrangente para melhor suporte da IDE e prevenção de erros.


Pronto para começar? As páginas a seguir guiarão você pela instalação, uso básico e recursos avançados para ajudá-lo a aproveitar ao máximo o Pydoll.

Vamos começar a automatizar a web, da maneira certa! 🚀

## Guia de Início Rápido: Um exemplo simples

Vamos começar com um exemplo prático. O script a seguir abrirá o repositório Pydoll no GitHub e o marcará como favorito:

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def main():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://github.com/autoscrape-labs/pydoll')

        star_button = await tab.find(
            tag_name='button',
            timeout=5,
            raise_exc=False
        )
        if not star_button:
            print("Ops! O botão não foi encontrado.")
            return

        await star_button.click()
        await asyncio.sleep(3)

asyncio.run(main())
```

Este exemplo demonstra como navegar até um site, esperar que um elemento apareça e interagir com ele. Você pode adaptar esse padrão para automatizar diversas tarefas web.

??? note "Ou use sem o gerenciador de contexto..."
    Se preferir não usar o padrão de gerenciador de contexto, você pode gerenciar a instância do navegador manualmente:
    ```python
    import asyncio
    from pydoll.browser.chromium import Chrome

    async def main():
        browser = Chrome()
        tab = await browser.start()
        await tab.go_to('https://github.com/autoscrape-labs/pydoll')

        star_button = await tab.find(
            tag_name='button',
            timeout=5,
            raise_exc=False
        )
        if not star_button:
            print("Ops! O botão não foi encontrado.")
            return

        await star_button.click()
        await asyncio.sleep(3)
        await browser.stop()

    asyncio.run(main())
    ```
    Observe que, ao não usar o gerenciador de contexto, você precisará chamar explicitamente `browser.stop()` para liberar os recursos.


## Exemplo Estendido: Configuração personalizada do navegador

Para cenários de uso mais avançados, o Pydoll permite personalizar a configuração do seu navegador usando a classe `ChromiumOptions`. Isso é útil quando você precisa:

- Executar em modo headless (sem janela do navegador visível)
- Especificar um caminho personalizado para o executável do navegador
- Configurar proxies, user agents ou outras configurações do navegador
- Definir as dimensões da janela ou argumentos de inicialização

Aqui está um exemplo mostrando como usar opções personalizadas para o Chrome:

```python hl_lines="8-12 30-32 34-38"
import asyncio
import os
from pydoll.browser.chromium import Chrome
from pydoll.browser.options import ChromiumOptions

async def main():
    options = ChromiumOptions()
    options.binary_location = '/usr/bin/google-chrome-stable'
    options.add_argument('--headless=new')
    options.add_argument('--start-maximized')
    options.add_argument('--disable-notifications')

    async with Chrome(options=options) as browser:
        tab = await browser.start()
        await tab.go_to('https://github.com/autoscrape-labs/pydoll')

        star_button = await tab.find(
            tag_name='button',
            timeout=5,
            raise_exc=False
        )
        if not star_button:
            print("Ops! O botão não foi encontrado.")
            return

        await star_button.click()
        await asyncio.sleep(3)

        screenshot_path = os.path.join(os.getcwd(), 'pydoll_repo.png')
        await tab.take_screenshot(path=screenshot_path)
        print(f"Captura de tela salva em: {screenshot_path}")

        base64_screenshot = await tab.take_screenshot(as_base64=True)

        repo_description_element = await tab.find(
            class_name='f4.my-3'
        )
        repo_description = await repo_description_element.text
        print(f"Descrição do repositório: {repo_description}")

if __name__ == "__main__":
    asyncio.run(main())
```

Este exemplo estendido demonstra:

1. Criação e configuração de opções do navegador
2. Definição de um caminho personalizado para o binário do Chrome
3. Habilitação do modo headless para operação invisível
4. Definição de sinalizadores adicionais do navegador
5. Captura de tela (especialmente útil em modo headless)

??? info "Sobre as Opções do Chromium"
    O método `options.add_argument()` permite que você passe qualquer argumento de linha de comando do Chromium para personalizar o comportamento do navegador. Existem centenas de opções disponíveis para controlar tudo, desde rede até comportamento de renderização. 

    Opções comuns do Chrome

    ```python
    # Opções de Desempenho e Comportamento
    options.add_argument('--headless=new')         # Executar o Chrome em modo headless
    options.add_argument('--disable-gpu')          # Desabilitar a aceleração de hardware da GPU
    options.add_argument('--no-sandbox')           # Desabilitar o sandbox (use com cuidado)
    options.add_argument('--disable-dev-shm-usage') # Superar problemas de recursos limitados

    # Opções de Aparência
    options.add_argument('--start-maximized')      # Iniciar com a janela maximizada
    options.add_argument('--window-size=1920,1080') # Definir tamanho específico da janela
    options.add_argument('--hide-scrollbars')      # Ocultar barras de rolagem

    # Opções de Rede
    options.add_argument('--proxy-server=socks5://127.0.0.1:9050') # Usar proxy
    options.add_argument('--disable-extensions')   # Desabilitar extensões
    options.add_argument('--disable-notifications') # Desabilitar notificações

    # Privacidade e Segurança
    options.add_argument('--incognito')            # Executar em modo anônimo
    options.add_argument('--disable-infobars')     # Desabilitar barras de informações
    ```

    Guias de Referência Completos

    Para obter uma lista completa de todos os argumentos de linha de comando do Chrome disponíveis, consulte estes recursos:

    - [Opções de Linha de Comando do Chromium](https://peter.sh/experiments/chromium-command-line-switches/) - Lista de referência completa
    - [Flags do Chrome](chrome://flags) - Digite isso na barra de endereço do seu navegador Chrome para ver os recursos experimentais
    - [Flags do Código-Fonte do Chromium](https://source.chromium.org/chromium/chromium/src/+/main:chrome/common/chrome_switches.cc) - Referência direta ao código-fonte

    Lembre-se de que algumas opções podem se comportar de maneira diferente em diferentes versões do Chrome, portanto, é uma boa prática testar sua configuração ao atualizar o Chrome. 

Com essas configurações, você pode executar o Pydoll em diversos ambientes, incluindo pipelines de CI/CD, servidores sem interface gráfica ou contêineres Docker.

Continue lendo a documentação para explorar os recursos poderosos do Pydoll para lidar com captchas, trabalhar com várias abas, interagir com elementos e muito mais.

## Dependências Mínimas

Uma das vantagens do Pydoll é sua leveza. Ao contrário de outras ferramentas de automação de navegador que exigem inúmeras dependências, o Pydoll foi projetado intencionalmente para ser minimalista, mantendo recursos poderosos.

### Dependências Principais

O Pydoll depende de apenas alguns pacotes cuidadosamente selecionados:

```
python = "^3.10"
websockets = "^13.1"
aiohttp = "^3.9.5"
aiofiles = "^23.2.1"
bs4 = "^0.0.2"
```

É só isso! Essa dependência mínima do Pydoll significa:

- **Instalação mais rápida** - Sem árvore de dependências complexa para resolver
- **Menos conflitos** - Menor chance de conflitos de versão com outros pacotes
- **Menor consumo de recursos** - Menor uso de espaço em disco
- **Melhor segurança** - Menor superfície de ataque e vulnerabilidades relacionadas a dependências
- **Atualizações mais fáceis** - Manutenção mais simples e menos alterações que quebram a compatibilidade

O pequeno número de dependências também contribui para a confiabilidade e o desempenho do Pydoll, pois há menos fatores externos que podem impactar seu funcionamento.

## Top Sponsors

<a href="https://substack.thewebscraping.club/p/pydoll-webdriver-scraping?utm_source=github&utm_medium=repo&utm_campaign=pydoll" target="_blank" rel="noopener nofollow sponsored">
  <img src="../resources/images/banner-the-webscraping-club.png" alt="The Web Scraping Club" />
</a>

<sub>Leia uma review completa do Pydoll no <b><a href="https://substack.thewebscraping.club/p/pydoll-webdriver-scraping?utm_source=github&utm_medium=repo&utm_campaign=pydoll" target="_blank" rel="noopener nofollow sponsored">The Web Scraping Club</a></b>, a newsletter #1 dedicada a web scraping.</sub>

## Patrocinadores

O apoio dos patrocinadores é essencial para manter o projeto vivo, em constante evolução e acessível a toda a comunidade. Cada parceria ajuda a cobrir custos, impulsionar novos recursos e garantir o desenvolvimento contínuo. Somos muito gratos a todos que acreditam e apoiam o projeto!

<div class="sponsors-grid">
  <a href="https://www.thordata.com/?ls=github&lk=pydoll" target="_blank" rel="noopener nofollow sponsored">
    <img src="../resources/images/Thordata-logo.png" alt="Thordata" />
  </a>
  <a href="https://www.testmuai.com/?utm_medium=sponsor&utm_source=pydoll" target="_blank" rel="noopener nofollow sponsored">
    <img src="../resources/images/logo-lamda-test.svg" alt="LambdaTest" />
  </a>
  <a href="https://dashboard.capsolver.com/passport/register?inviteCode=WPhTbOsbXEpc" target="_blank" rel="noopener nofollow sponsored">
    <img src="../resources/images/capsolver-logo.png" alt="CapSolver" />
  </a>
</div>

<p>
  <a href="https://github.com/sponsors/thalissonvs" target="_blank" rel="noopener">Seja um patrocinador</a>
</p>


## Licença

O Pydoll é lançado sob a Licença MIT, que lhe dá a liberdade de usar, modificar e distribuir o código com restrições mínimas. Esta licença permissiva torna o Pydoll adequado para projetos pessoais e comerciais.

??? info "Ver o texto completo da Licença MIT"
    ```
    MIT License
    
    Copyright (c) 2023 Pydoll Contributors
    
    Permission is hereby granted, free of charge, to any person obtaining a copy
    of this software and associated documentation files (the "Software"), to deal
    in the Software without restriction, including without limitation the rights
    to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
    copies of the Software, and to permit persons to whom the Software is
    furnished to do so, subject to the following conditions:
    
    The above copyright notice and this permission notice shall be included in all
    copies or substantial portions of the Software.
    
    THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
    IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
    FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
    AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
    LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
    OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
    SOFTWARE.
    ```

================================================
FILE: docs/resources/scripts/extra.js
================================================
/**
 * Turn terminal-style code samples on the page into animated Termynal widgets.
 *
 * Two kinds of elements are handled:
 *   - `.use-termynal` nodes are made visible and animated immediately.
 *   - `<code>` nodes inside `.termy .highlight` are parsed line by line,
 *     replaced with a fresh `<div>`, and animated lazily once that div
 *     scrolls into the viewport.
 *
 * Line syntax recognised inside a `.termy` code sample:
 *   - `---> 100%`        -> a progress bar line
 *   - `$ command`        -> an input line with the default prompt
 *   - `// text`          -> a comment line (prefixed with a speech bubble)
 *   - `# prompt$ command`-> an input line with a custom prompt
 *   - anything else      -> plain output, grouped with adjacent output lines
 */
function setupTermynal() {
    document.querySelectorAll(".use-termynal").forEach(node => {
        node.style.display = "block";
        new Termynal(node, {
            lineDelay: 500
        });
    });
    const progressLiteralStart = "---> 100%";
    const promptLiteralStart = "$ ";
    const customPromptLiteralStart = "# ";
    const termynalActivateClass = "termy";
    // Widgets that have been built but not yet started (still off-screen).
    let termynals = [];

    /** Parse every `.termy` code sample and build a non-started Termynal for it. */
    function createTermynals() {
        document
            .querySelectorAll(`.${termynalActivateClass} .highlight code`)
            .forEach(node => {
                const text = node.textContent;
                const lines = text.split("\n");
                const useLines = [];
                // Consecutive plain-output lines waiting to be emitted as one entry.
                let buffer = [];

                /** Flush the pending output lines into a single line-data entry. */
                function saveBuffer() {
                    if (!buffer.length) {
                        return;
                    }
                    // Declared locally: the bare assignment used previously
                    // leaked an implicit global (and throws in strict mode).
                    const dataValue = {};
                    const isBlankSpace = buffer.every(line => !line);
                    if (isBlankSpace) {
                        // Pure spacing should not cost animation time.
                        dataValue["delay"] = 0;
                    }
                    if (buffer[buffer.length - 1] === "") {
                        // A last single <br> won't have effect
                        // so put an additional one
                        buffer.push("");
                    }
                    dataValue["value"] = buffer.join("<br>");
                    useLines.push(dataValue);
                    buffer = [];
                }

                for (const line of lines) {
                    if (line === progressLiteralStart) {
                        saveBuffer();
                        useLines.push({
                            type: "progress"
                        });
                    } else if (line.startsWith(promptLiteralStart)) {
                        saveBuffer();
                        const value = line.replace(promptLiteralStart, "").trimEnd();
                        useLines.push({
                            type: "input",
                            value: value
                        });
                    } else if (line.startsWith("// ")) {
                        saveBuffer();
                        const value = "💬 " + line.replace("// ", "").trimEnd();
                        useLines.push({
                            value: value,
                            class: "termynal-comment",
                            delay: 0
                        });
                    } else if (line.startsWith(customPromptLiteralStart)) {
                        const promptStart = line.indexOf(promptLiteralStart);
                        if (promptStart === -1) {
                            // No "$ " delimiter: slicing with -1 would produce a
                            // mangled prompt/value, so report it and keep the
                            // line as ordinary output instead.
                            console.error("Custom prompt found but no end delimiter", line);
                            buffer.push(line);
                            continue;
                        }
                        saveBuffer();
                        const prompt = line.slice(0, promptStart).replace(customPromptLiteralStart, "");
                        const value = line.slice(promptStart + promptLiteralStart.length);
                        useLines.push({
                            type: "input",
                            value: value,
                            prompt: prompt
                        });
                    } else {
                        buffer.push(line);
                    }
                }
                saveBuffer();
                const div = document.createElement("div");
                node.replaceWith(div);
                const termynal = new Termynal(div, {
                    lineData: useLines,
                    noInit: true,
                    lineDelay: 500
                });
                termynals.push(termynal);
            });
    }

    /**
     * Start every pending widget whose container top has reached the viewport,
     * and drop it from the pending list.
     */
    function loadVisibleTermynals() {
        termynals = termynals.filter(termynal => {
            if (termynal.container.getBoundingClientRect().top - innerHeight <= 0) {
                termynal.init();
                return false;
            }
            return true;
        });
        if (termynals.length === 0) {
            // Nothing left to start: detach so repeated setupTermynal() calls
            // do not pile up dead scroll listeners.
            window.removeEventListener("scroll", loadVisibleTermynals);
        }
    }
    window.addEventListener("scroll", loadVisibleTermynals);
    createTermynals();
    loadVisibleTermynals();
}

/**
 * Shuffle an array in place (Fisher–Yates) and return the same array.
 *
 * Walks from the end of the array towards the front; at each step a random
 * index within the not-yet-fixed prefix is chosen and swapped with the last
 * element of that prefix.
 *
 * @param {Array} array - Array to reorder; it is mutated.
 * @returns {Array} The same array instance, now shuffled.
 */
function shuffle(array) {
    for (let remaining = array.length; remaining !== 0; remaining -= 1) {
        const pick = Math.floor(Math.random() * remaining);
        const tail = remaining - 1;
        [array[tail], array[pick]] = [array[pick], array[tail]];
    }
    return array;
}

/**
 * Cycle through the children of an announcement container, showing one at a
 * time in a random (shuffled-once) order.
 *
 * The first child is shown immediately; afterwards the visible child advances
 * every `timeInterval` milliseconds, wrapping around at the end. Does nothing
 * when the container is missing or has no children.
 *
 * @param {string} groupId - Element id of the announcement container.
 * @param {number} timeInterval - Delay between rotations, in milliseconds.
 * @returns {Promise<void>}
 */
async function showRandomAnnouncement(groupId, timeInterval) {
    const announceGroup = document.getElementById(groupId);
    if (!announceGroup) {
        return;
    }
    const children = shuffle(Array.from(announceGroup.children));
    if (children.length === 0) {
        // An empty container has nothing to rotate; without this guard
        // `children[0].style` throws and the promise rejects unhandled.
        return;
    }
    let index = 0;
    const announceRandom = () => {
        children.forEach(el => { el.style.display = "none"; });
        children[index].style.display = "block";
        index = (index + 1) % children.length;
    };
    announceRandom();
    setInterval(announceRandom, timeInterval);
}

/**
 * Page bootstrap: set up the terminal widgets, then start the two rotating
 * announcement groups with their respective intervals.
 *
 * The announcement calls are fired without awaiting their promises.
 */
async function main() {
    setupTermynal();
    const announcementGroups = [
        ['announce-left', 5000],
        ['announce-right', 10000],
    ];
    for (const [groupId, intervalMs] of announcementGroups) {
        showRandomAnnouncement(groupId, intervalMs);
    }
}
// Run the page bootstrap on every emission of `document$`
// (presumably the Material for MkDocs page-load observable; confirm against the theme).
document$.subscribe(function () {
    main();
});

================================================
FILE: docs/resources/scripts/termynal.js
================================================
/**
 * termynal.js
 * A lightweight, modern and extensible animated terminal window, using
 * async/await.
 *
 * @author Ines Montani <ines@ines.io>
 * @version 0.0.1
 * @license MIT
 */

'use strict';

/**
 * Animated terminal widget.
 *
 * Collects the line elements found in a container (plus any lines supplied
 * as data objects), then replays them one by one: typed input lines,
 * progress bars, and plain output lines. A "fast" link zeroes the delays
 * while the animation runs, and a "restart" link replays it afterwards.
 */
class Termynal {
    /**
     * Construct the widget's settings.
     * @param {(string|Node)=} container - Query selector or container element.
     * @param {Object=} options - Custom settings.
     * @param {string} options.prefix - Prefix to use for data attributes.
     * @param {number} options.startDelay - Delay before animation, in ms.
     * @param {number} options.typeDelay - Delay between each typed character, in ms.
     * @param {number} options.lineDelay - Delay between each line, in ms.
     * @param {number} options.progressLength - Number of characters displayed as progress bar.
     * @param {string} options.progressChar - Character to use for progress bar, defaults to █.
     * @param {number} options.progressPercent - Max percent of progress.
     * @param {string} options.cursor - Character to use for cursor, defaults to ▋.
     * @param {Object[]} options.lineData - Dynamically loaded line data objects.
     * @param {boolean} options.noInit - Don't initialise the animation.
     */
    constructor(container = '#termynal', options = {}) {
        this.container = (typeof container === 'string') ? document.querySelector(container) : container;
        this.pfx = `data-${options.prefix || 'ty'}`;
        // Each setting resolves as: explicit option, then the container's
        // data attribute, then the built-in default. Because `||` is used,
        // falsy values (such as 0) fall through to the next source.
        // The `original*` copies let start() restore the delays after the
        // "fast" control has zeroed them.
        this.originalStartDelay = this.startDelay = options.startDelay
            || parseFloat(this.container.getAttribute(`${this.pfx}-startDelay`)) || 600;
        this.originalTypeDelay = this.typeDelay = options.typeDelay
            || parseFloat(this.container.getAttribute(`${this.pfx}-typeDelay`)) || 90;
        this.originalLineDelay = this.lineDelay = options.lineDelay
            || parseFloat(this.container.getAttribute(`${this.pfx}-lineDelay`)) || 1500;
        this.progressLength = options.progressLength
            || parseFloat(this.container.getAttribute(`${this.pfx}-progressLength`)) || 40;
        this.progressChar = options.progressChar
            || this.container.getAttribute(`${this.pfx}-progressChar`) || '█';
        this.progressPercent = options.progressPercent
            || parseFloat(this.container.getAttribute(`${this.pfx}-progressPercent`)) || 100;
        this.cursor = options.cursor
            || this.container.getAttribute(`${this.pfx}-cursor`) || '▋';
        this.lineData = this.lineDataToElements(options.lineData || []);
        this.loadLines();
        if (!options.noInit) this.init();
    }

    /**
     * Collect all line elements and lay them out, hidden, inside the
     * container so that its size is fixed before the animation starts.
     */
    loadLines() {
        // Load all the lines and create the container so that the size is fixed.
        // Otherwise it would keep changing and the user's viewport would
        // constantly move while scrolling.
        const finish = this.generateFinish();
        finish.style.visibility = 'hidden';
        this.container.appendChild(finish);
        // Appends dynamically loaded lines to existing line elements.
        this.lines = [...this.container.querySelectorAll(`[${this.pfx}]`)].concat(this.lineData);
        for (let line of this.lines) {
            line.style.visibility = 'hidden';
            this.container.appendChild(line);
        }
        const restart = this.generateRestart();
        restart.style.visibility = 'hidden';
        this.container.appendChild(restart);
        this.container.setAttribute('data-termynal', '');
    }

    /**
     * Initialise the widget, get lines, clear container and start animation.
     */
    init() {
        /**
         * Calculates width and height of Termynal container.
         * If container is empty and lines are dynamically loaded, defaults to browser `auto` or CSS.
         */
        const containerStyle = getComputedStyle(this.container);
        this.container.style.width = containerStyle.width !== '0px' ?
            containerStyle.width : undefined;
        this.container.style.minHeight = containerStyle.height !== '0px' ?
            containerStyle.height : undefined;

        this.container.setAttribute('data-termynal', '');
        // Empty the container; the line elements stay referenced in
        // `this.lines` and are re-appended one at a time by start().
        this.container.innerHTML = '';
        for (let line of this.lines) {
            line.style.visibility = 'visible';
        }
        this.start();
    }

    /**
     * Start the animation and render the lines depending on their data attributes.
     */
    async start() {
        this.addFinish();
        await this._wait(this.startDelay);

        for (let line of this.lines) {
            const type = line.getAttribute(this.pfx);
            // A per-line delay attribute overrides the widget-wide line delay.
            const delay = line.getAttribute(`${this.pfx}-delay`) || this.lineDelay;

            if (type == 'input') {
                line.setAttribute(`${this.pfx}-cursor`, this.cursor);
                await this.type(line);
                await this._wait(delay);
            }

            else if (type == 'progress') {
                await this.progress(line);
                await this._wait(delay);
            }

            else {
                this.container.appendChild(line);
                await this._wait(delay);
            }

            line.removeAttribute(`${this.pfx}-cursor`);
        }
        this.addRestart();
        this.finishElement.style.visibility = 'hidden';
        // Undo the effect of the "fast" control so a restart animates at
        // the configured speed again.
        this.lineDelay = this.originalLineDelay;
        this.typeDelay = this.originalTypeDelay;
        this.startDelay = this.originalStartDelay;
    }

    /**
     * Create the "restart" control, which clears the container and replays
     * the animation when clicked.
     * @returns {HTMLAnchorElement} The new, unattached link element.
     */
    generateRestart() {
        const restart = document.createElement('a');
        restart.onclick = (e) => {
            e.preventDefault();
            this.container.innerHTML = '';
            this.init();
        };
        restart.href = '#';
        restart.setAttribute('data-terminal-control', '');
        restart.innerHTML = "restart ↻";
        return restart;
    }

    /**
     * Create the "fast" control, which sets all delays to 0 when clicked.
     * The element is also stored as `this.finishElement`.
     * @returns {HTMLAnchorElement} The new, unattached link element.
     */
    generateFinish() {
        const finish = document.createElement('a');
        finish.onclick = (e) => {
            e.preventDefault();
            this.lineDelay = 0;
            this.typeDelay = 0;
            this.startDelay = 0;
        };
        finish.href = '#';
        finish.setAttribute('data-terminal-control', '');
        finish.innerHTML = "fast →";
        this.finishElement = finish;
        return finish;
    }

    /** Append a fresh "restart" control to the container. */
    addRestart() {
        const restart = this.generateRestart();
        this.container.appendChild(restart);
    }

    /** Append a fresh "fast" control to the container. */
    addFinish() {
        const finish = this.generateFinish();
        this.container.appendChild(finish);
    }

    /**
     * Animate a typed line.
     * @param {Node} line - The line element to render.
     */
    async type(line) {
        // Spread splits by code point, so astral characters stay intact.
        const chars = [...line.textContent];
        line.textContent = '';
        this.container.appendChild(line);

        for (let char of chars) {
            // Read the delay on every character so that the "fast" control
            // takes effect in the middle of a line.
            const delay = line.getAttribute(`${this.pfx}-typeDelay`) || this.typeDelay;
            await this._wait(delay);
            line.textContent += char;
        }
    }

    /**
     * Animate a progress bar.
     * @param {Node} line - The line element to render.
     */
    async progress(line) {
        const progressLength = line.getAttribute(`${this.pfx}-progressLength`)
            || this.progressLength;
        const progressChar = line.getAttribute(`${this.pfx}-progressChar`)
            || this.progressChar;
        const chars = progressChar.repeat(progressLength);
        const progressPercent = line.getAttribute(`${this.pfx}-progressPercent`)
            || this.progressPercent;
        line.textContent = '';
        this.container.appendChild(line);

        for (let i = 1; i < chars.length + 1; i++) {
            await this._wait(this.typeDelay);
            const percent = Math.round(i / chars.length * 100);
            line.textContent = `${chars.slice(0, i)} ${percent}%`;
            // Stop once the displayed value has passed the configured maximum.
            if (percent > progressPercent) {
                break;
            }
        }
    }

    /**
     * Helper function for animation delays, called with `await`.
     * @param {number} time - Timeout, in ms.
     */
    _wait(time) {
        return new Promise(resolve => setTimeout(resolve, time));
    }

    /**
     * Converts line data objects into line elements.
     *
     * NOTE: `line.value` is inserted as HTML without escaping, so it must
     * come from a trusted source.
     *
     * @param {Object[]} lineData - Dynamically loaded lines.
     * @returns {Element[]} - Array of line elements.
     */
    lineDataToElements(lineData) {
        return lineData.map(line => {
            let div = document.createElement('div');
            div.innerHTML = `<span ${this._attributes(line)}>${line.value || ''}</span>`;

            return div.firstElementChild;
        });
    }

    /**
     * Helper function for generating attributes string.
     *
     * `class` becomes a plain `class` attribute, `type` becomes the bare
     * prefix attribute, `value` is skipped (it is the element content), and
     * every other property becomes `<prefix>-<prop>`. All values are
     * double-quoted, with `"` escaped, so multi-word values such as
     * `class: 'a b'` stay inside a single attribute.
     *
     * @param {Object} line - Line data object.
     * @returns {string} - String of attributes.
     */
    _attributes(line) {
        const quote = (value) => `"${String(value).replace(/"/g, '&quot;')}"`;
        let attrs = '';
        for (let prop in line) {
            // Custom add class
            if (prop === 'class') {
                attrs += ` class=${quote(line[prop])} `;
                continue;
            }
            if (prop === 'type') {
                attrs += `${this.pfx}=${quote(line[prop])} `;
            } else if (prop !== 'value') {
                attrs += `${this.pfx}-${prop}=${quote(line[prop])} `;
            }
        }

        return attrs;
    }
}

/**
 * HTML API: If current script has container(s) specified, initialise Termynal.
 *
 * The `data-termynal-container` attribute holds one or more selectors
 * separated by `|`. `document.currentScript` is null when this code is not
 * running as a classic script (e.g. a module script or a callback), so that
 * case is skipped instead of throwing. Empty selector segments are ignored
 * because `querySelector('')` throws.
 */
if (document.currentScript && document.currentScript.hasAttribute('data-termynal-container')) {
    document.currentScript.getAttribute('data-termynal-container')
        .split('|')
        .map(selector => selector.trim())
        .filter(selector => selector !== '')
        .forEach(selector => new Termynal(selector));
}

================================================
FILE: docs/resources/stylesheets/extra.css
================================================
/* Comment lines inside a terminal block: teal, italic, on their own line. */
.termynal-comment {
  color: #4a968f;
  font-style: italic;
  display: block;
}

.termy {
  /* For right to left languages */
  direction: ltr;
}

/* Keep whitespace and line breaks as written, wrapping long lines. */
.termy [data-termynal] {
  white-space: pre-wrap;
}

/* Hide elements with the .linenos class inside .termy blocks. */
.termy .linenos {
  display: none;
}

/* Small monospace badges; the three variants differ only in background color. */

/* Blue badge. */
.label-class {
  background-color: #1e88e5;
  color: white;
  padding: 2px 6px;
  font-size: 0.75em;
  border-radius: 4px;
  font-family: monospace;
}

/* Orange badge. */
.label-attr {
  background-color: #fb8c00;
  color: white;
  padding: 2px 6px;
  font-size: 0.75em;
  border-radius: 4px;
  font-family: monospace;
}

/* Green badge. */
.label-meth {
  background-color: #43a047;
  color: white;
  padding: 2px 6px;
  font-size: 0.75em;
  border-radius: 4px;
  font-family: monospace;
}


/* Color variables for the "default" (light) color scheme. */
[data-md-color-scheme="default"] {
  --md-primary-fg-color:        #0D141C;
  --md-primary-fg-color--light: #3a7e9d;
  --md-primary-fg-color--dark:  #004059;
  
  --md-accent-fg-color: #0091d0;
  --md-accent-bg-color: rgba(0, 145, 208, 0.1);
  
  /* Custom background color */
  --md-default-bg-color: #E2ECED;
}

/* Color variables for the "slate" (dark) color scheme. */
[data-md-color-scheme="slate"] {
  --md-primary-fg-color:        #2b1d43;
  --md-primary-fg-color--light: #b4b7bc;
  --md-primary-fg-color--dark:  #2b1d43;

  --md-accent-fg-color: #8caabf;
  --md-accent-bg-color: rgba(140, 170, 191, 0.1);
  
  --md-default-bg-color: #0D141C;
  --md-default-fg-color: #ffffff;
}


/* Links inside headings in dark mode: inherit the heading color, no underline. */
[data-md-color-scheme="slate"] .md-content h3 a,
[data-md-color-scheme="slate"] .md-content h2 a,
[data-md-color-scheme="slate"] .md-content h1 a {
  color: inherit !important;
  text-decoration: none;
}

/* Underline and slightly fade heading links on hover (dark mode). */
[data-md-color-scheme="slate"] .md-content h3 a:hover,
[data-md-color-scheme="slate"] .md-content h2 a:hover,
[data-md-color-scheme="slate"] .md-content h1 a:hover {
  text-decoration: underline;
  opacity: 0.8;
}

/* Fix links inside headings in light mode */
[data-md-color-scheme="default"] .md-content h3 a,
[data-md-color-scheme="default"] .md-content h2 a,
[data-md-color-scheme="default"] .md-content h1 a {
  color: inherit !important; /* Inherit the color of the parent heading */
  text-decoration: none;
}

/* Underline and slightly fade heading links on hover (light mode). */
[data-md-color-scheme="default"] .md-content h3 a:hover,
[data-md-color-scheme="default"] .md-content h2 a:hover,
[data-md-color-scheme="default"] .md-content h1 a:hover {
  text-decoration: underline;
  opacity: 0.8;
}

/* Basic style for active links - light mode */
.md-nav__link--active {
  font-weight: bold;
  color: var(--md-accent-fg-color);
}

/* Override the color for dark mode only */
/* NOTE: later rules in this file set the active-link color with !important
   for both schemes, and those take precedence over the colors set here. */
[data-md-color-scheme="slate"] .md-nav__link--active {
  color: #b4c0dd; /* Light color for contrast in dark mode */
}

/* Custom logo */
/* Hide the logo image/SVG inside the header logo button; the logo is drawn
   as a background image on the button instead. */
.md-header__button.md-logo img,
.md-header__button.md-logo svg {
  display: none;
}

.md-header__button.md-logo {
  background-image: url('../images/logo.png');
  background-size: contain;
  background-repeat: no-repeat;
  background-position: center;
  width: 100px;
  height: 50px;
}

/* Empty pseudo-element that fills the button. */
.md-header__button.md-logo:before {
  content: '';
  display: block;
  width: 100%;
  height: 100%;
}

/* Hide the site name in the header */
.md-header__topic {
  display: none;
}

/* Automatic theme-based logo for the index page */
/* Hide all logo images by default */
.md-content img[alt="Pydoll Logo"] {
  display: none;
}

/* Light mode - show logo-black.png */
[data-md-color-scheme="default"] .md-content img[alt="Pydoll Logo"] {
  display: block;
  content: url('../images/logo-black.png');
}

/* Dark mode - show logo.png */
[data-md-color-scheme="slate"] .md-content img[alt="Pydoll Logo"] {
  display: block;
  content: url('../images/logo.png');
}

/* ===== SPONSORS GRID ===== */

/* Wrapping, vertically centered flex row with a 24px gap between items. */
.md-typeset .sponsors-grid {
  display: flex;
  flex-wrap: wrap;
  align-items: center;
  gap: 24px;
  margin: 16px 0;
}

/* Remove the max-width limit for images in the grid and let the height
   follow the image unless a per-sponsor rule below overrides it. */
.md-typeset .sponsors-grid img {
  max-width: none !important;
  height: auto !important;
}

/* Per-sponsor sizes, selected by the image alt text. */
.md-typeset .sponsors-grid img[alt="Thordata"] {
  height: 40px !important;
}

.md-typeset .sponsors-grid img[alt="LambdaTest"] {
  height: 40px !important;
  width: 160px !important;
}

.md-typeset .sponsors-grid img[alt="CapSolver"] {
  height: 60px !important;
}

/* ===== LINK IMPROVEMENTS FOR DARK MODE ===== */

/* General content links - dark mode */
[data-md-color-scheme="slate"] .md-content a {
  color: #64b5f6 !important; /* Light blue for good visibility */
  text-decoration: none;
}

[data-md-color-scheme="slate"] .md-content a:hover {
  color: #90caf9 !important; /* Lighter blue on hover */
  text-decoration: underline;
}

/* Sidebar navigation links - dark mode */
[data-md-color-scheme="slate"] .md-nav__link {
  color: #e0e0e0 !important; /* Light gray for normal links */
}

[data-md-color-scheme="slate"] .md-nav__link:hover {
  color: #ffffff !important; /* White on hover */
}

[data-md-color-scheme="slate"] .md-nav__link--active {
  color: #90caf9 !important; /* Light blue for the active link */
  font-weight: bold;
}

/* Links in tables - dark mode */
[data-md-color-scheme="slate"] .md-typeset table a {
  color: #64b5f6 !important;
}

[data-md-color-scheme="slate"] .md-typeset table a:hover {
  color: #90caf9 !important;
}

/* Links in lists - dark mode */
[data-md-color-scheme="slate"] .md-typeset ul a,
[data-md-color-scheme="slate"] .md-typeset ol a {
  color: #64b5f6 !important;
}

[data-md-color-scheme="slate"] .md-typeset ul a:hover,
[data-md-color-scheme="slate"] .md-typeset ol a:hover {
  color: #90caf9 !important;
}

/* Links in admonitions (callout boxes) - dark mode */
[data-md-color-scheme="slate"] .md-typeset .admonition a {
  color: #64b5f6 !important;
}

[data-md-color-scheme="slate"] .md-typeset .admonition a:hover {
  color: #90caf9 !important;
}

/* ===== LINK IMPROVEMENTS FOR LIGHT MODE ===== */

/* General content links - light mode */
[data-md-color-scheme="default"] .md-content a {
  color: #1976d2 !important; /* Dark blue for good visibility */
  text-decoration: none;
}

[data-md-color-scheme="default"] .md-content a:hover {
  color: #1565c0 !important; /* Darker blue on hover */
  text-decoration: underline;
}

/* Sidebar navigation links - light mode */
[data-md-color-scheme="default"] .md-nav__link {
  color: #424242 !important; /* Dark gray for normal links */
}

[data-md-color-scheme="default"] .md-nav__link:hover {
  color: #1976d2 !important; /* Blue on hover */
}

[data-md-color-scheme="default"] .md-nav__link--active {
  color: #2e7d32 !important; /* Dark green for the active link */
  font-weight: bold;
}

/* Links in tables - light mode */
[data-md-color-scheme="default"] .md-typeset table a {
  color: #1976d2 !important;
}

[data-md-color-scheme="default"] .md-typeset table a:hover {
  color: #1565c0 !important;
}


================================================
FILE: docs/resources/stylesheets/termynal.css
================================================
/**
 * termynal.js
 *
 * @author Ines Montani <ines@ines.io>
 * @version 0.0.1
 * @license MIT
 */

 /* Shared colors for the terminal window. */
 :root {
    --color-bg: #252a33;
    --color-text: #eee;
    --color-text-subtle: #a2a2a2;
}

/* The terminal window itself. */
[data-termynal] {
    width: 750px;
    max-width: 100%;
    background: var(--color-bg);
    color: var(--color-text);
    /* font-size: 18px; */
    font-size: 15px;
    /* font-family: 'Fira Mono', Consolas, Menlo, Monaco, 'Courier New', Courier, monospace; */
    font-family: 'Roboto Mono', 'Fira Mono', Consolas, Menlo, Monaco, 'Courier New', Courier, monospace;
    border-radius: 4px;
    /* Extra top padding leaves room for the window buttons and title. */
    padding: 75px 45px 35px;
    /* Positioning context for the absolutely positioned pseudo-elements. */
    position: relative;
    -webkit-box-sizing: border-box;
            box-sizing: border-box;
    /* Custom line-height */
    line-height: 1.2;
}

/* Window buttons in the top-left corner. */
[data-termynal]:before {
    content: '';
    position: absolute;
    top: 15px;
    left: 15px;
    display: inline-block;
    width: 15px;
    height: 15px;
    border-radius: 50%;
    /* A little hack to display the window buttons in one pseudo element. */
    background: #d9515d;
    -webkit-box-shadow: 25px 0 0 #f4c025, 50px 0 0 #3ec930;
            box-shadow: 25px 0 0 #f4c025, 50px 0 0 #3ec930;
}

/* Centered window title. */
[data-termynal]:after {
    content: 'bash';
    position: absolute;
    color: var(--color-text-subtle);
    top: 5px;
    left: 0;
    width: 100%;
    text-align: center;
}

/* Right-aligned control links (the script gives this attribute to its
   "fast" and "restart" links). */
a[data-terminal-control] {
    text-align: right;
    display: block;
    color: #aebbff;
}

/* Every terminal line is a block of its own. */
[data-ty] {
    display: block;
    line-height: 2;
}

[data-ty]:before {
    /* Set up defaults and ensure empty lines are displayed. */
    content: '';
    display: inline-block;
    vertical-align: middle;
}

/* Spacing and color of the prompt shown before input lines and lines with
   a custom prompt. */
[data-ty="input"]:before,
[data-ty-prompt]:before {
    margin-right: 0.75em;
    color: var(--color-text-subtle);
}

/* Default prompt for input lines. */
[data-ty="input"]:before {
    content: '$';
}

/* A data-ty-prompt attribute replaces the default prompt text. */
[data-ty][data-ty-prompt]:before {
    content: attr(data-ty-prompt);
}

/* Blinking cursor after a line that carries the cursor attribute. */
[data-ty-cursor]:after {
    content: attr(data-ty-cursor);
    font-family: monospace;
    margin-left: 0.5em;
    -webkit-animation: blink 1s infinite;
            animation: blink 1s infinite;
}


/* Cursor animation */

@-webkit-keyframes blink {
    50% {
        opacity: 0;
    }
}

@keyframes blink {
    50% {
        opacity: 0;
    }
}

================================================
FILE: docs/zh/api/browser/chrome.md
================================================
# Chrome Browser
 
::: pydoll.browser.chromium.Chrome
    options:
      show_root_heading: true
      show_source: false
      heading_level: 2 

================================================
FILE: docs/zh/api/browser/edge.md
================================================
# Edge Browser
 
::: pydoll.browser.chromium.Edge
    options:
      show_root_heading: true
      show_source: false
      heading_level: 2 

================================================
FILE: docs/zh/api/browser/managers.md
================================================
# 浏览器管理器

管理器模块提供专门的类来管理浏览器生命周期和配置。

## 总览

浏览器管理器在浏览器自动化中各自负责特定的职责：

::: pydoll.browser.managers
    options:
      show_root_heading: true
      show_source: false
      heading_level: 2
      filters:
        - "!^_"
        - "!^__"

## 管理器类

### 浏览器进程管理器
管理浏览器进程的生命周期，包括启动、停止和监控浏览器进程。

::: pydoll.browser.managers.browser_process_manager
    options:
      show_root_heading: true
      show_source: false
      heading_level: 3

### 浏览器选项管理器
处理浏览器配置选项和命令行参数。

::: pydoll.browser.managers.browser_options_manager
    options:
      show_root_heading: true
      show_source: false
      heading_level: 3

### 代理管理器
管理浏览器实例的代理配置和身份验证。

::: pydoll.browser.managers.proxy_manager
    options:
      show_root_heading: true
      show_source: false
      heading_level: 3

### 临时目录管理器
处理浏览器实例使用的临时目录的创建和清理。

::: pydoll.browser.managers.temp_dir_manager
    options:
      show_root_heading: true
      show_source: false
      heading_level: 3

## 用法
管理器通常由 Chrome 和 Edge 等浏览器类内部使用。它们提供可组合的模块化功能：

```python
from pydoll.browser.managers.proxy_manager import ProxyManager
from pydoll.browser.managers.temp_dir_manager import TempDirManager

# Managers are used internally by browser classes
# Direct usage is for advanced scenarios only
proxy_manager = ProxyManager()
temp_manager = TempDirManager()
```

!!! note "内部使用"
    这些管理器主要由浏览器类在内部使用。仅建议在高级场景或扩展本库时直接使用。

================================================
FILE: docs/zh/api/browser/options.md
================================================
# Browser Options

## ChromiumOptions

::: pydoll.browser.options.ChromiumOptions
    options:
      show_root_heading: true
      show_source: false
      heading_level: 3

## Options Interface

::: pydoll.browser.interfaces.Options
    options:
      show_root_heading: true
      show_source: false
      heading_level: 3

## BrowserOptionsManager Interface

::: pydoll.browser.interfaces.BrowserOptionsManager
    options:
      show_root_heading: true
      show_source: false
      heading_level: 3 

================================================
FILE: docs/zh/api/browser/requests.md
================================================
# 浏览器请求

请求模块在浏览器上下文中提供 HTTP 请求功能，支持继承浏览器会话状态、cookies 和身份验证的无缝 API 调用。

## 概述

浏览器请求模块为在浏览器 JavaScript 上下文中直接进行 HTTP 调用提供了类似 `requests` 的接口。这种方法相比传统 HTTP 库提供了几个优势：

- **会话继承**: 自动处理 cookie、身份验证和 CORS
- **浏览器上下文**: 请求在与页面相同的安全上下文中执行
- **无需会话管理**: 消除在自动化和 API 调用之间传输 cookies 和令牌的需要
- **SPA 兼容性**: 完美适配具有复杂身份验证流程的单页应用

## Request 类

在浏览器上下文中进行 HTTP 请求的主要接口。

::: pydoll.browser.requests.request.Request
    options:
      show_root_heading: true
      show_source: false
      heading_level: 3
      group_by_category: true
      members_order: source
      filters:
        - "!^__"

## Response 类

表示 HTTP 请求的响应，提供类似于 `requests` 库的熟悉接口。

::: pydoll.browser.requests.response.Response
    options:
      show_root_heading: true
      show_source: false
      heading_level: 3
      group_by_category: true
      members_order: source
      filters:
        - "!^__"

## 使用示例

### 基本 HTTP 方法

```python
from pydoll.browser.chromium import Chrome

async with Chrome() as browser:
    tab = await browser.start()
    await tab.go_to("https://api.example.com")
    
    # GET 请求
    response = await tab.request.get("/users/123")
    user_data = await response.json()
    
    # POST 请求
    response = await tab.request.post("/users", json={
        "name": "John Doe",
        "email": "john@example.com"
    })
    
    # 带 headers 的 PUT 请求
    response = await tab.request.put("/users/123", 
        json={"name": "Jane Doe"},
        headers={"Authorization": "Bearer token123"}
    )
```

### 响应处理

```python
# 检查响应状态
if response.ok:
    print(f"成功: {response.status_code}")
else:
    print(f"错误: {response.status_code}")
    response.raise_for_status()  # 对 4xx/5xx 抛出 HTTPError

# 访问响应数据
text_data = response.text
json_data = await response.json()
raw_bytes = response.content

# 检查 headers 和 cookies
print("响应 headers:", response.headers)
print("请求 headers:", response.request_headers)
for cookie in response.cookies:
    print(f"Cookie: {cookie.name}={cookie.value}")
```

### 高级功能

```python
# 带自定义 headers 和参数的请求
response = await tab.request.get("/search", 
    params={"q": "python", "limit": 10},
    headers={
        "User-Agent": "Custom Bot 1.0",
        "Accept": "application/json"
    }
)

# 文件上传模拟
response = await tab.request.post("/upload",
    data={"description": "Test file"},
    files={"file": ("test.txt", "file content", "text/plain")}
)

# 表单数据提交
response = await tab.request.post("/login",
    data={"username": "user", "password": "pass"}
)
```

## 与 Tab 的集成

请求功能通过 `tab.request` 属性访问，该属性为每个 tab 提供一个单例 `Request` 实例：

```python
# 每个 tab 都有自己的 request 实例
tab1 = await browser.get_tab(0)
tab2 = await browser.new_tab()

# 这些是独立的 Request 实例
request1 = tab1.request  # 绑定到 tab1 的 Request
request2 = tab2.request  # 绑定到 tab2 的 Request

# 请求继承 tab 的上下文
await tab1.go_to("https://site1.com")
await tab2.go_to("https://site2.com")

# 这些请求将具有不同的 cookie/会话上下文
response1 = await tab1.request.get("/api/data")  # 使用 site1.com 的 cookies
response2 = await tab2.request.get("/api/data")  # 使用 site2.com 的 cookies
```

!!! tip "混合自动化"
    该模块对于需要结合 UI 交互和 API 调用的混合自动化场景特别强大。例如，通过 UI 登录，然后使用已认证的会话进行 API 调用，无需手动处理 cookies 或令牌。

================================================
FILE: docs/zh/api/browser/tab.md
================================================
# Tab

::: pydoll.browser.tab.Tab
    options:
      show_root_heading: true
      show_source: false
      heading_level: 2

================================================
FILE: docs/zh/api/commands/browser.md
================================================
# 浏览器命令

浏览器命令提供对浏览器实例及其配置的底层控制。

## 概述

浏览器命令模块处理浏览器级别的操作，例如版本信息、目标管理和浏览器范围的设置。

::: pydoll.commands.browser_commands
    options:
      show_root_heading: true
      show_source: false
      heading_level: 2
      filters:
        - "!^_"
        - "!^__"

## 用法

浏览器命令通常由浏览器类在内部使用，用于管理浏览器实例：

```python
from pydoll.commands.browser_commands import get_version
from pydoll.connection.connection_handler import ConnectionHandler

# Get browser version information
connection = ConnectionHandler()
version_info = await get_version(connection)
```

## 可用命令

浏览器命令模块提供以下功能：

- 获取浏览器版本和用户代理信息
- 管理浏览器目标（标签页、窗口）
- 控制浏览器范围的设置和权限
- 处理浏览器生命周期事件

!!! note "内部使用"
    这些命令主要由 `Chrome` 和 `Edge` 浏览器类在内部使用。仅建议在高级场景下直接使用。

================================================
FILE: docs/zh/api/commands/dom.md
================================================
# DOM命令

DOM 命令模块提供了与网页文档对象模型交互的全面功能。

## 概述

DOM 命令模块是 Pydoll 中最重要的模块之一，它提供了查找、交互和操作网页上的 HTML 元素所需的所有功能。

::: pydoll.commands.dom_commands
    options:
      show_root_heading: true
      show_source: false
      heading_level: 2
      filters:
        - "!^_"
        - "!^__"

## 用法

`WebElement` 类和元素查找方法广泛使用 DOM 命令：

```python
from pydoll.commands.dom_commands import query_selector, get_attributes
from pydoll.connection.connection_handler import ConnectionHandler

# Find element and get its attributes
connection = ConnectionHandler()
node_id = await query_selector(connection, selector="#username")
attributes = await get_attributes(connection, node_id=node_id)
```

## 主要功能

DOM 命令模块提供以下功能：

### 元素定位
- `query_selector()` - 通过CSS选择器进行元素定位
- `query_selector_all()` - 通过CSS选择器进行元素定位（查找多个元素）
- `get_document()` - 获取document的根节点

### 元素交互
- `click_element()` - 点击元素
- `focus_element()` - 焦点置于元素
- `set_attribute_value()` - 设置元素属性
- `get_attributes()` - 获取元素属性

### 元素信息
- `get_box_model()` - 获取元素位置和尺寸
- `describe_node()` - 获取元素详细信息
- `get_outer_html()` - 获取元素的HTML内容

### DOM 操作
- `remove_node()` - 从DOM节点中删除元素
- `set_node_value()` - 设置元素值
- `request_child_nodes()` - 获取子元素

!!! tip "高级 API"
    虽然这些命令提供了强大的底层访问能力，但大多数用户应使用更高级的 `WebElement` 类方法，例如 `click()`、`type_text()` 和 `get_attribute()`，这些方法在内部使用这些命令。

================================================
FILE: docs/zh/api/commands/fetch.md
================================================
# Fetch 命令

Fetch 命令使用 Fetch API 域提供高级网络请求处理和拦截功能。

## 概述

Fetch 命令模块支持复杂的网络请求管理，包括请求修改、响应拦截和身份验证处理。

::: pydoll.commands.fetch_commands
    options:
      show_root_heading: true
      show_source: false
      heading_level: 2
      filters:
        - "!^_"
        - "!^__"

## 用法

Fetch 命令用于高级网络拦截和请求处理：

```python
from pydoll.commands.fetch_commands import enable, request_paused, continue_request
from pydoll.connection.connection_handler import ConnectionHandler

# Enable fetch domain
connection = ConnectionHandler()
await enable(connection, patterns=[{
    "urlPattern": "*",
    "requestStage": "Request"
}])

# Handle paused requests
async def handle_paused_request(request_id, request):
    # Modify request or continue as-is
    await continue_request(connection, request_id=request_id)
```

## 关键功能

fetch 命令模块提供以下功能：

### 请求拦截
- `enable()` - 激活fetch模式
- `disable()` - 关闭fetch模式
- `continue_request()` - 继续请求（放行）
- `fail_request()` - 使请求以指定的错误失败

### 修改请求
- 修改请求headers
- 更改请求 URL
- 更改请求方法（GET、POST 等）
- 修改请求body

### 响应处理
- `fulfill_request()` - 提供自定义响应
- `get_response_body()` - 获取响应内容
- 修改响应头
- 响应状态码控制

### 身份验证
- `continue_with_auth()` - 处理身份验证挑战
- 基本身份验证支持
- 自定义身份验证流程

## 高级功能

### 基于模式的拦截

```python
# Intercept specific URL patterns
patterns = [
    {"urlPattern": "*/api/*", "requestStage": "Request"},
    {"urlPattern": "*.js", "requestStage": "Response"},
    {"urlPattern": "https://example.com/*", "requestStage": "Request"}
]

await enable(connection, patterns=patterns)
```

### 请求修改
```python
# Modify intercepted requests
async def modify_request(request_id, request):
    # Add authentication header
    headers = request.headers.copy()
    headers["Authorization"] = "Bearer token123"
    
    # Continue with modified headers
    await continue_request(
        connection,
        request_id=request_id,
        headers=headers
    )
```

### 响应模拟
```python
# Mock API responses
await fulfill_request(
    connection,
    request_id=request_id,
    response_code=200,
    response_headers=[
        {"name": "Content-Type", "value": "application/json"},
        {"name": "Access-Control-Allow-Origin", "value": "*"}
    ],
    body='{"status": "success", "data": {"mocked": true}}'
)
```

### 身份验证处理
```python
# Handle authentication challenges
await continue_with_auth(
    connection,
    request_id=request_id,
    auth_challenge_response={
        "response": "ProvideCredentials",
        "username": "user",
        "password": "pass"
    }
)
```

## 请求阶段

Fetch 命令可以在不同阶段拦截请求：

| 阶段 | 描述 | 用例 |
|-------|-------------|-----------|
| Request（请求） | 请求发送前 | 修改标头、URL 和方法 |
| Response（响应） | 收到响应后 | 模拟响应，修改内容 |

## 错误处理

```python
# Fail requests with specific errors
await fail_request(
    connection,
    request_id=request_id,
    error_reason="ConnectionRefused"  # or "AccessDenied", "TimedOut", etc.
)
```

## 与网络命令集成

Fetch 命令与网络命令协同工作，但提供更精细的控制：

- **网络命令**：更广泛的网络监控和控制
- **Fetch 命令**：特定的请求/响应拦截和修改

!!! tip "性能注意事项"
    Fetch 拦截可能会影响页面加载性能。请使用具体的 URL 模式，并在不需要时禁用拦截，以尽量减少开销。

================================================
FILE: docs/zh/api/commands/index.md
================================================
# 命令概述

命令模块提供了与Chrome DevTools协议(CDP)域交互的高级接口。每个命令模块对应一个特定的CDP域，并提供执行各种浏览器操作的方法。

## 可用命令模块

### 浏览器命令
- **模块**: `browser_commands.py`
- **用途**: 浏览器级别操作和窗口管理
- **文档**: [浏览器命令](browser.md)

### DOM命令
- **模块**: `dom_commands.py`
- **用途**: DOM树操作和元素操作
- **文档**: [DOM命令](dom.md)

### 输入命令
- **模块**: `input_commands.py`
- **用途**: 输入事件模拟(键盘、鼠标、触摸)
- **文档**: [输入命令](input.md)

### 网络命令
- **模块**: `network_commands.py`
- **用途**: 网络监控和请求拦截
- **文档**: [网络命令](network.md)

### 页面命令
- **模块**: `page_commands.py`
- **用途**: 页面生命周期管理和导航
- **文档**: [页面命令](page.md)

### 运行时命令
- **模块**: `runtime_commands.py`
- **用途**: JavaScript执行和运行时管理
- **文档**: [运行时命令](runtime.md)

### 存储命令
- **模块**: `storage_commands.py`
- **用途**: 浏览器存储访问(cookies、本地存储等)
- **文档**: [存储命令](storage.md)

### 目标命令
- **模块**: `target_commands.py`
- **用途**: 目标管理和标签页操作
- **文档**: [目标命令](target.md)

### Fetch 命令
- **模块**: `fetch_commands.py`
- **用途**: 网络请求拦截和修改
- **文档**: [Fetch 命令](fetch.md)

## 使用模式

命令通常通过浏览器或标签页实例访问：

```python
from pydoll.browser.chromium import Chrome

# 初始化浏览器
browser = Chrome()
await browser.start()

# 获取活动标签页
tab = await browser.get_active_tab()

# 通过标签页使用命令
await tab.go_to("https://example.com")
element = await tab.find(id="button")
await element.click()
```

## 命令结构

每个命令模块遵循一致的模式：
- **静态方法**: 用于直接命令执行
- **类型提示**: 使用协议类型的完整类型安全
- **错误处理**: 对CDP错误的正确异常处理
- **文档**: 包含示例的全面文档字符串 

================================================
FILE: docs/zh/api/commands/input.md
================================================
# 输入命令

输入命令处理鼠标和键盘交互，提供真人仿真的输入模拟。

## 概述

输入命令模块提供模拟用户输入的功能，包括鼠标移动、点击、键盘输入和按键操作。

::: pydoll.commands.input_commands
    options:
      show_root_heading: true
      show_source: false
      heading_level: 2
      filters:
        - "!^_"
        - "!^__"

## 用法

输入命令由元素交互方法使用，可直接用于高级输入场景：

```python
from pydoll.commands.input_commands import dispatch_mouse_event, dispatch_key_event
from pydoll.connection.connection_handler import ConnectionHandler

# Simulate mouse click
connection = ConnectionHandler()
await dispatch_mouse_event(
    connection, 
    type="mousePressed", 
    x=100, 
    y=200, 
    button="left"
)

# Simulate keyboard typing
await dispatch_key_event(
    connection,
    type="keyDown",
    key="Enter"
)
```

## 主要功能

输入命令模块提供以下函数：

### 鼠标事件
- `dispatch_mouse_event()` - 鼠标点击、移动和滚轮事件
- 鼠标按键状态（左键、右键、中键）
- 基于坐标的定位
- 拖放操作


### 键盘事件
- `dispatch_key_event()` - 键盘按下和释放事件
- `insert_text()` - 直接插入文本
- 特殊键处理（Enter、Tab、箭头键等）
- 修饰键（Ctrl、Alt、Shift）


### 触摸事件
- 触摸屏模拟
- 多点触控手势
- 触摸坐标和压力控制

## 仿真行为

输入命令支持仿真行为模式：

- 平滑的鼠标移动曲线
- 真实的打字速度和模式
- 操作之间随机的微延迟
- 压力感应触摸事件

!!! tip "元素方法"
    在大多数情况下，建议使用更高级的元素方法，例如 `element.click()` 和 `element.type_text()`，它们提供了更便捷的 API，并能自动处理常见场景。

================================================
FILE: docs/zh/api/commands/network.md
================================================
# 网络命令

网络命令提供对网络请求、响应和浏览器网络行为的全面控制。

## 概述

网络命令模块支持请求拦截、响应修改、Cookie 管理和网络监控功能。

::: pydoll.commands.network_commands
    options:
      show_root_heading: true
      show_source: false
      heading_level: 2
      filters:
        - "!^_"
        - "!^__"

## 用法

网络命令用于请求拦截和网络监控等高级场景：

```python
from pydoll.commands.network_commands import enable, set_request_interception
from pydoll.connection.connection_handler import ConnectionHandler

# Enable network monitoring
connection = ConnectionHandler()
await enable(connection)

# Enable request interception
await set_request_interception(connection, patterns=[{"urlPattern": "*"}])
```

## 主要功能

网络命令模块提供以下功能：


### 请求管理
- `enable()` / `disable()` - 启用/禁用网络监控
- `set_request_interception()` - 拦截并修改请求
- `continue_intercepted_request()` - 继续或修改拦截的请求
- `get_request_post_data()` - 获取请求体数据


### 响应处理
- `get_response_body()` - 获取响应内容
- `fulfill_request()` - 提供自定义响应
- `fail_request()` - 模拟网络异常

### Cookie 管理
- `get_cookies()` - 获取浏览器 Cookie
- `set_cookies()` - 设置浏览器 Cookie
- `delete_cookies()` - 删除指定 Cookie
- `clear_browser_cookies()` - 清除所有 Cookie

### 缓存控制
- `clear_browser_cache()` - 清除浏览器缓存
- `set_cache_disabled()` - 禁用浏览器缓存
- `get_response_body_for_interception()` - 获取缓存的响应

### 安全和标头
- `set_user_agent_override()` - 覆盖用户代理
- `set_extra_http_headers()` - 添加自定义标头
- `emulate_network_conditions()` - 模拟网络连接状况

## 高级用例

### 请求拦截

```python
# 拦截修改请求
await set_request_interception(connection, patterns=[
    {"urlPattern": "*/api/*", "requestStage": "Request"}
])

# 拦截请求处理
async def handle_request(request):
    if "api/login" in request.url:
        # 修改请求头
        headers = request.headers.copy()
        headers["Authorization"] = "Bearer token"
        await continue_intercepted_request(
            connection, 
            request_id=request.request_id,
            headers=headers
        )
```

### 响应模拟
```python
# 模拟 API 响应
await fulfill_request(
    connection,
    request_id=request_id,
    response_code=200,
    response_headers={"Content-Type": "application/json"},
    body='{"status": "success"}'
)
```

!!! warning "性能影响"
    网络拦截可能会影响页面加载性能。请有选择地使用，并在不需要时禁用。

================================================
FILE: docs/zh/api/commands/page.md
================================================
# 页面命令

页面命令处理页面导航、生命周期事件和页面操作。

## 概述

页面命令模块提供页面间导航、管理页面生命周期、处理 JavaScript 执行以及控制页面行为的功能。

::: pydoll.commands.page_commands
    options:
      show_root_heading: true
      show_source: false
      heading_level: 2
      filters:
        - "!^_"
        - "!^__"

## 用法

`Tab` 类广泛使用页面命令进行导航和页面管理：

```python
from pydoll.commands.page_commands import navigate, reload, enable
from pydoll.connection.connection_handler import ConnectionHandler

# Navigate to a URL
connection = ConnectionHandler()
await enable(connection)  # Enable page events
await navigate(connection, url="https://example.com")

# Reload the page
await reload(connection)
```

## 关键功能

页面命令模块提供以下函数：

### 导航
- `navigate()` - 访问URL
- `reload()` - 重新加载当前页面
- `go_back()` - 后退一步
- `go_forward()` - 前进一步
- `stop_loading()` - 停止页面加载

### 页面生命周期
- `enable()` / `disable()` - 启用/禁用页面事件
- `get_frame_tree()` - 获取页面框架结构
- `get_navigation_history()` - 获取导航历史记录

### 内容管理
- `get_resource_content()` - 获取页面资源内容
- `search_in_resource()` - 在页面资源内搜索
- `set_document_content()` - 设置页面 HTML 内容

### 截图和 PDF
- `capture_screenshot()` - 页面截图
- `print_to_pdf()` - 将页面保存为PDF
- `capture_snapshot()` - 页面快照

### JavaScript 执行
- `add_script_to_evaluate_on_new_document()` - 添加启动脚本(在网页加载前注入js)
- `remove_script_to_evaluate_on_new_document()` - 移除启动脚本

### 页面设置
- `set_lifecycle_events_enabled()` - 控制生命周期事件
- `set_ad_blocking_enabled()` - 启用/禁用广告拦截
- `set_bypass_csp()` - 绕过内容安全策略

## 高级功能
### 框架管理

```python
# Get all frames in the page
frame_tree = await get_frame_tree(connection)
for frame in frame_tree.child_frames:
    print(f"Frame: {frame.frame.url}")
```

### 资源拦截
```python
# Get resource content
content = await get_resource_content(
    connection, 
    frame_id=frame_id, 
    url="https://example.com/script.js"
)
```

### 页面事件
页面命令可与各种页面事件配合使用：
- `Page.loadEventFired` - 页面加载完成
- `Page.domContentEventFired` - DOM 内容已加载
- `Page.frameNavigated` - 框架导航完成
- `Page.frameStartedLoading` - 框架加载开始


!!! tip "Tab 类集成"
    大多数页面操作都可以通过 `Tab` 类方法实现，例如 `tab.go_to()`、`tab.reload()` 和 `tab.screenshot()`，这些方法提供了更便捷的 API。

================================================
FILE: docs/zh/api/commands/runtime.md
================================================
# 运行时命令

运行时命令提供 JavaScript 执行功能和运行时环境管理。

## 概述

运行时命令模块支持在浏览器上下文中执行 JavaScript 代码、检查对象以及控制运行时环境。

::: pydoll.commands.runtime_commands
    options:
      show_root_heading: true
      show_source: false
      heading_level: 2
      filters:
        - "!^_"
        - "!^__"

## 用法

运行时命令用于 JavaScript 执行和运行时管理：

```python
from pydoll.commands.runtime_commands import evaluate, enable
from pydoll.connection.connection_handler import ConnectionHandler

# Enable runtime events
connection = ConnectionHandler()
await enable(connection)

# Execute JavaScript
result = await evaluate(
    connection, 
    expression="document.title",
    return_by_value=True
)
print(result.value)  # Page title
```

## 主要功能

运行时命令模块提供以下功能：

### JavaScript 执行
- `evaluate()` - 执行 JavaScript 表达式
- `call_function_on()` - 调用对象上的函数
- `compile_script()` - 编译 JavaScript 以供复用
- `run_script()` - 运行已编译的脚本

### 对象管理
- `get_properties()` - 获取对象属性
- `release_object()` - 释放对象引用
- `release_object_group()` - 释放对象组

### 运行时控制
- `enable()` / `disable()` - 启用/禁用运行时事件
- `discard_console_entries()` - 清除控制台记录
- `set_custom_object_formatter_enabled()` - 启用自定义格式化程序

### 异常处理
- `set_async_call_stack_depth()` - 设置调用堆栈深度
- 异常捕获和报告
- 错误对象检查

## 高级用法

### 复杂的 JavaScript 执行

```python
# 执行带有错误处理的复杂 JavaScript
script = """
try {
    const elements = document.querySelectorAll('.item');
    return Array.from(elements).map(el => ({
        text: el.textContent,
        href: el.href
    }));
} catch (error) {
    return { error: error.message };
}
"""

result = await evaluate(
    connection,
    expression=script,
    return_by_value=True,
    await_promise=True
)
```

### 对象检查
```python
# Get detailed object properties
properties = await get_properties(
    connection,
    object_id=object_id,
    own_properties=True,
    accessor_properties_only=False
)

for prop in properties:
    print(f"{prop.name}: {prop.value}")
```

### 控制台集成
运行时命令与浏览器控制台集成：
- 控制台消息和错误
- 控制台 API 方法调用
- 自定义控制台格式化程序

!!! note "性能注意事项"
    通过运行时命令执行 JavaScript 可能比浏览器原生执行更慢。对于复杂操作，请谨慎使用。

================================================
FILE: docs/zh/api/commands/storage.md
================================================
# 存储命令

存储命令提供全面的浏览器存储管理，包括 Cookie、localStorage、sessionStorage 和 IndexedDB。

## 概述

存储命令模块支持管理所有浏览器存储机制，提供数据持久化和检索功能。

::: pydoll.commands.storage_commands
    options:
      show_root_heading: true
      show_source: false
      heading_level: 2
      filters:
        - "!^_"
        - "!^__"

## 用法

存储命令用于跨不同机制管理浏览器存储：

```python
from pydoll.commands.storage_commands import get_cookies, set_cookies, clear_data_for_origin
from pydoll.connection.connection_handler import ConnectionHandler

# Get cookies for a domain
connection = ConnectionHandler()
cookies = await get_cookies(connection, urls=["https://example.com"])

# Set a new cookie
await set_cookies(connection, cookies=[{
    "name": "session_id",
    "value": "abc123",
    "domain": "example.com",
    "path": "/",
    "httpOnly": True,
    "secure": True
}])

# Clear all storage for an origin
await clear_data_for_origin(
    connection,
    origin="https://example.com",
    storage_types="all"
)
```

## 关键功能

存储命令模块提供以下函数：

### Cookie 管理
- `get_cookies()` - 通过 URL 或域名获取 Cookie
- `set_cookies()` - 设置新 Cookie
- `delete_cookies()` - 删除特定 Cookie
- `clear_cookies()` - 清除所有 Cookie


### 本地存储
- `get_dom_storage_items()` - 获取localStorage
- `set_dom_storage_item()` - 设置localStorage
- `remove_dom_storage_item()` - 移除localStorage
- `clear_dom_storage()` - 清除localStorage

### 会话存储
- 会话存储操作（类似于本地存储）
- 特定会话的数据管理
- 选项卡隔离存储

### IndexedDB
- `get_database_names()` - 获取 IndexedDB 数据库
- `request_database()` - 访问数据库结构
- `request_data()` - 查询数据库数据
- `clear_object_store()` - 清除对象存储

### 缓存存储
- `request_cache_names()` - 获取缓存名称
- `request_cached_response()` - 获取缓存响应
- `delete_cache()` - 删除缓存条目

### 应用程序缓存（已弃用）
- 支持旧版应用程序缓存
- 基于清单的缓存

## 高级功能

### 批量操作
```python
# Clear all storage types for multiple origins
origins = ["https://example.com", "https://api.example.com"]
for origin in origins:
    await clear_data_for_origin(
        connection,
        origin=origin,
        storage_types="cookies,local_storage,session_storage,indexeddb"
    )
```

### 存储配额
```python
# Get storage quota information
quota_info = await get_usage_and_quota(connection, origin="https://example.com")
print(f"Used: {quota_info.usage} bytes")
print(f"Quota: {quota_info.quota} bytes")
```

### Cross-Origin 存储
```python
# Manage storage across different origins
await set_cookies(connection, cookies=[{
    "name": "cross_site_token",
    "value": "token123",
    "domain": ".example.com",  # Applies to all subdomains
    "sameSite": "None",
    "secure": True
}])
```

## 存储类型

该模块支持多种存储机制：

| 存储类型 | 持久性 | 范围 | 容量 |
|-----------|----------|----------|----------|
| Cookies | 持久性 | 域/路径 | 每个 cookie 约 4KB |
| localStorage | 持久性 | 来源 | 约 5-10MB |
| sessionStorage | 会话 | Tab | 约 5-10MB |
| IndexedDB | 持久性 | 来源 | 大容量 (GB+) |
| Cache API | 持久性 | 来源 | 大容量 |

!!! warning "隐私注意事项"
    存储操作可能会影响用户隐私。请始终以负责任的方式处理存储数据，并遵守隐私法规。

================================================
FILE: docs/zh/api/commands/target.md
================================================
# Target命令

Target命令管理浏览器目标，包括标签页、窗口和其他浏览上下文。

## 概述

Target命令模块提供创建、管理和控制浏览器目标（例如标签页、弹出窗口和服务工作线程）的功能。

::: pydoll.commands.target_commands
    options:
      show_root_heading: true
      show_source: false
      heading_level: 2
      filters:
        - "!^_"
        - "!^__"

## 用法

Target命令由浏览器类内部使用，用于管理标签页和窗口：

```python
from pydoll.commands.target_commands import get_targets, create_target, close_target
from pydoll.connection.connection_handler import ConnectionHandler

# Get all browser targets
connection = ConnectionHandler()
targets = await get_targets(connection)

# Create a new tab
new_target = await create_target(connection, url="https://example.com")

# Close a target
await close_target(connection, target_id=new_target.target_id)
```

## 主要功能

Target命令模块提供以下功能：


### Target管理
- `get_targets()` - 列出所有浏览器Target
- `create_target()` - 创建新的标签页或窗口
- `close_target()` - 关闭特定Target
- `activate_target()` - 将Target置于前台

### Target 信息
- `get_target_info()` - 获取详细的Target信息
- Target类型：`page`、`background_page`、`service_worker`、`browser`
- Target状态：已连接、已分离、崩溃

### Session 管理
- `attach_to_target()` - 附加到Target进行控制
- `detach_from_target()` - 分离Target
- `send_message_to_target()` - 向Target发送命令

### 浏览器上下文
- `create_browser_context()` - 创建独立的浏览器上下文
- `dispose_browser_context()` - 移除浏览器上下文
- `get_browser_contexts()` - 列出浏览器上下文

## 目标类型

可以管理不同类型的目标：

### 页面 Targets
```python
# Create a new tab
page_target = await create_target(
    connection,
    url="https://example.com",
    width=1920,
    height=1080,
    browser_context_id=None  # Default context
)
```

### 弹窗
```python
# Create a popup window
popup_target = await create_target(
    connection,
    url="https://popup.example.com",
    width=800,
    height=600,
    new_window=True
)
```

### 无痕上下文
```python
# Create incognito browser context
incognito_context = await create_browser_context(connection)

# Create tab in incognito context
incognito_tab = await create_target(
    connection,
    url="https://private.example.com",
    browser_context_id=incognito_context.browser_context_id
)
```

!!! info "Headless 与 Headed：上下文如何呈现"
    浏览器上下文是逻辑上的隔离环境。在 Headed 模式下，在新的上下文中创建的第一个页面通常会打开一个新的系统窗口。 在 Headless 模式下不会显示窗口——隔离依然存在于后台（cookies、storage、缓存与认证状态仍按上下文分离）。在 CI/Headless 环境中优先使用上下文以获得更高性能与更干净的隔离。

## 高级特性

### 目标事件
Target命令可与各种Target事件配合使用：
- `Target.targetCreated` - 新Target创建
- `Target.targetDestroyed` - Target关闭
- `Target.targetInfoChanged` - Target信息更新
- `Target.targetCrashed` - Target崩溃

### 多Target协调

```python
# Manage multiple tabs
targets = await get_targets(connection)
page_targets = [t for t in targets if t.type == "page"]

for target in page_targets:
    # Perform operations on each tab
    await activate_target(connection, target_id=target.target_id)
    # ... do work in this tab
```

### Target 隔离
```python
# Create isolated browser context for testing
test_context = await create_browser_context(connection)

# All targets in this context are isolated
test_tab1 = await create_target(
    connection, 
    url="https://test1.com",
    browser_context_id=test_context.browser_context_id
)

test_tab2 = await create_target(
    connection,
    url="https://test2.com", 
    browser_context_id=test_context.browser_context_id
)
```

!!! note "浏览器集成"
    Target 命令主要由 `Chrome` 和 `Edge` 浏览器类在内部使用。高级浏览器 API 提供了更便捷的标签页管理方法。

================================================
FILE: docs/zh/api/connection/connection.md
================================================
# 连接处理器

::: pydoll.connection.connection_handler.ConnectionHandler
    options:
      show_root_heading: true
      show_source: false
      heading_level: 2

================================================
FILE: docs/zh/api/connection/managers.md
================================================
# 连接管理器

## 命令管理器

::: pydoll.connection.managers.commands_manager.CommandsManager
    options:
      show_root_heading: true
      show_source: false
      heading_level: 3

## 事件管理器

::: pydoll.connection.managers.events_manager.EventsManager
    options:
      show_root_heading: true
      show_source: false
      heading_level: 3 

================================================
FILE: docs/zh/api/core/constants.md
================================================
# 常量

本节记录了 Pydoll 中使用的所有常量、枚举和配置值。

::: pydoll.constants
    options:
      show_root_heading: true
      show_source: false
      heading_level: 2
      group_by_category: true
      members_order: source 

================================================
FILE: docs/zh/api/core/exceptions.md
================================================
# 异常

本节记录了 Pydoll 操作可能引发的所有自定义异常。

::: pydoll.exceptions
    options:
      show_root_heading: true
      show_source: false
      heading_level: 2
      group_by_category: true
      members_order: source 

================================================
FILE: docs/zh/api/core/utils.md
================================================
# 实用功能

本节记录了 Pydoll 中使用的实用程序函数和辅助类。

::: pydoll.utils
    options:
      show_root_heading: true
      show_source: false
      heading_level: 2
      group_by_category: true
      members_order: source 

================================================
FILE: docs/zh/api/elements/mixins.md
================================================
# 元素mixins

mixins 模块提供可复用的功能，可以将其混合到元素类中以扩展其功能。

## 元素定位mixins

`FindElementsMixin` 为包含它的类提供元素查找功能。

::: pydoll.elements.mixins.find_elements_mixin
    options:
      show_root_heading: true
      show_source: false
      heading_level: 2
      filters:
        - "!^_"
        - "!^__"

## 用法

Mixin 通常由库内部使用，用于组合功能。`Tab` 和 `WebElement` 等类使用 `FindElementsMixin` 来提供元素定位方法：

```python
# 这些方法来自 FindElementsMixin
element = await tab.find(id="username")
elements = await tab.find(class_name="item", find_all=True)
element = await tab.query("#submit-button")
```


## 可用方法

`FindElementsMixin` 提供了多种元素定位的方法：

- `find()` - 使用关键字参数的现代元素查找方法
- `query()` - CSS 选择器和 XPath 查询
- `find_element()` - 旧版元素定位方法
- `find_elements()` - 查找多个元素的旧版方法

!!! tip "现代 vs 传统"
    `find()` 方法是最新的、推荐的查找元素的方法。`find_element()` 和 `find_elements()` 方法保留下来，以实现向后兼容。

================================================
FILE: docs/zh/api/elements/shadow_root.md
================================================
# ShadowRoot

::: pydoll.elements.shadow_root.ShadowRoot
    options:
      show_root_heading: true
      show_source: false
      heading_level: 2
      members_order: source
      group_by_category: true


================================================
FILE: docs/zh/api/elements/web_element.md
================================================
# 网页元素

::: pydoll.elements.web_element.WebElement
    options:
      show_root_heading: true
      show_source: false
      heading_level: 2
      members_order: source
      group_by_category: true 

================================================
FILE: docs/zh/api/index.md
================================================
# API 参考

这里是Pydoll API 参考！本节提供 Pydoll 库中所有类、方法和函数的详尽文档。

## 概述

Pydoll 由几个关键模块组成，每个模块在浏览器自动化中都有特定的用途：

### 浏览器模块
浏览器模块可以管理浏览器实例和生命周期。

- **[Chrome](browser/chrome.md)** - Chrome 浏览器自动化
- **[Edge](browser/edge.md)** - Microsoft Edge 浏览器自动化  
- **[Options](browser/options.md)** - 浏览器配置选项  
- **[Tab](browser/tab.md)** - 页面标签和交互  
- **[Requests](browser/requests.md)** - 浏览器上下文中的 HTTP 请求
- **[Managers](browser/managers.md)** - 浏览器生命周期管理器  

### 元素模块
元素模块提供与网页元素交互的功能。

- **[WebElement](elements/web_element.md)** - 网页元素交互
- **[Mixins](elements/mixins.md)** - 可复用的元素交互功能

### 连接模块
连接模块通过 Chrome DevTools 协议处理与浏览器的通信。

- **[Connection Handler](connection/connection.md)** - WebSocket连接管理器
- **[Managers](connection/managers.md)** - 连接生命周期管理器

### 命令模块
命令模块提供低级 Chrome DevTools 协议命令实现。

- **[Commands Overview](commands/index.md)** - 按域划分的 CDP 命令实现

### 协议模块
协议模块实现了 Chrome DevTools 协议命令和事件。

- **[Base Types](protocol/base.md)** - Chrome DevTools 协议的基础类型
- **[Browser](protocol/browser.md)** - Browser 域命令和事件
- **[DOM](protocol/dom.md)** - DOM 域命令和事件
- **[Fetch](protocol/fetch.md)** - Fetch 域命令和事件
- **[Input](protocol/input.md)** - Input 域命令和事件
- **[Network](protocol/network.md)** - Network 域命令和事件
- **[Page](protocol/page.md)** - Page 域命令和事件
- **[Runtime](protocol/runtime.md)** - Runtime 域命令和事件
- **[Storage](protocol/storage.md)** - Storage 域命令和事件
- **[Target](protocol/target.md)** - Target 域命令和事件

### 核心模块
核心模块包含基础程序、常量和异常。

- **[Constants](core/constants.md)** - 库常量和枚举
- **[Exceptions](core/exceptions.md)** - 自定义异常类
- **[Utils](core/utils.md)** - 实用功能

## 快捷导航

### 常用类

| 类                 | 功能           | 模块                            |
|-------------------|--------------|-------------------------------|
| `Chrome`          | Chrome浏览器自动化 | `pydoll.browser.chromium`     |
| `Edge`            | Edge浏览器自动化   | `pydoll.browser.chromium`     |
| `Tab`             | 标签页交互和控制     | `pydoll.browser.tab`          |
| `WebElement`      | 元素交互         | `pydoll.elements.web_element` |
| `ChromiumOptions` | 浏览器配置        | `pydoll.browser.options`      |

### 关键枚举和常量

| 名称               | 功能 | 模块 |
|------------------|---------|--------|
| `By`             | 元素选择器策略 | `pydoll.constants` |
| `Key`            | 键盘按键常量 | `pydoll.constants` |
| `PermissionType` | 浏览器权限类型 | `pydoll.constants` |

### 常见异常类型

| 异常                   | 原因        | 模块                  |
|----------------------|-----------|---------------------|
| `ElementNotFound`    | 元素在DOM未找到 | `pydoll.exceptions` |
| `WaitElementTimeout` | 元素等待超时    | `pydoll.exceptions` |
| `BrowserNotStarted`  | 浏览器未开启    | `pydoll.exceptions` |

## 使用模式

### 基本浏览器自动化

```python
from pydoll.browser.chromium import Chrome

async with Chrome() as browser:
    tab = await browser.start()
    await tab.go_to("https://example.com")
    element = await tab.find(id="my-element")
    await element.click()
```

### 元素定位

```python
# Using the modern find() method
element = await tab.find(id="username")
element = await tab.find(tag_name="button", class_name="submit")

# Using CSS selectors or XPath
element = await tab.query("#username")
element = await tab.query("//button[@class='submit']")
```

### 事件处理

```python
await tab.enable_page_events()
await tab.on('Page.loadEventFired', handle_page_load)
```

## 类型提示

Pydoll 具有完整的类型支持，并提供全面的类型提示，以提供更好的 IDE 支持和代码安全性。所有公共 API 均包含正确的类型注释。

```python
from typing import Optional, List
from pydoll.elements.web_element import WebElement

# Methods return properly typed objects
element: Optional[WebElement] = await tab.find(id="test", raise_exc=False)
elements: List[WebElement] = await tab.find(class_name="item", find_all=True)
```

## Async/Await 支持

所有 Pydoll 操作都是异步的，必须与 `async`/`await` 一起使用：

```python
import asyncio

async def main():
    # All Pydoll operations are async
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to("https://example.com")
        
asyncio.run(main())
```

浏览以下部分以了解每个模块的完整 API 文档。

================================================
FILE: docs/zh/api/protocol/base.md
================================================
# 协议基础类型

Chrome DevTools 协议命令、响应和事件的基础类型和结构。

## 基础类型

::: pydoll.protocol.base
    options:
      show_root_heading: true
      show_source: false
      heading_level: 3
      group_by_category: true
      members_order: source
      filters:
        - "!^__"

================================================
FILE: docs/zh/api/protocol/browser.md
================================================
# 浏览器协议

Chrome DevTools 协议的浏览器域命令、事件和类型。

## 方法

::: pydoll.protocol.browser.methods
    options:
      show_root_heading: true
      show_source: false
      heading_level: 2

## 事件

::: pydoll.protocol.browser.events
    options:
      show_root_heading: true
      show_source: false
      heading_level: 2

## 类型

::: pydoll.protocol.browser.types
    options:
      show_root_heading: true
      show_source: false
      heading_level: 2

================================================
FILE: docs/zh/api/protocol/dom.md
================================================
# DOM 协议

Chrome DevTools 协议的 DOM 域命令、事件和类型。

## 方法

::: pydoll.protocol.dom.methods
    options:
      show_root_heading: true
      show_source: false
      heading_level: 2

## 事件

::: pydoll.protocol.dom.events
    options:
      show_root_heading: true
      show_source: false
      heading_level: 2

## 类型

::: pydoll.protocol.dom.types
    options:
      show_root_heading: true
      show_source: false
      heading_level: 2

================================================
FILE: docs/zh/api/protocol/fetch.md
================================================
# 获取协议

Chrome DevTools 协议的获取域命令、事件和类型。

## 方法

::: pydoll.protocol.fetch.methods
    options:
      show_root_heading: true
      show_source: false
      heading_level: 2

## 事件

::: pydoll.protocol.fetch.events
    options:
      show_root_heading: true
      show_source: false
      heading_level: 2

## 类型

::: pydoll.protocol.fetch.types
    options:
      show_root_heading: true
      show_source: false
      heading_level: 2

================================================
FILE: docs/zh/api/protocol/input.md
================================================
# 输入协议

Chrome DevTools 协议的输入域命令、事件和类型。

## 方法

::: pydoll.protocol.input.methods
    options:
      show_root_heading: true
      show_source: false
      heading_level: 2

## 事件

::: pydoll.protocol.input.events
    options:
      show_root_heading: true
      show_source: false
      heading_level: 2

## 类型

::: pydoll.protocol.input.types
    options:
      show_root_heading: true
      show_source: false
      heading_level: 2

================================================
FILE: docs/zh/api/protocol/network.md
================================================
# 网络协议

Chrome DevTools 协议的网络域命令、事件和类型。

## 方法

::: pydoll.protocol.network.methods
    options:
      show_root_heading: true
      show_source: false
      heading_level: 2

## 事件

::: pydoll.protocol.network.events
    options:
      show_root_heading: true
      show_source: false
      heading_level: 2

## 类型

::: pydoll.protocol.network.types
    options:
      show_root_heading: true
      show_source: false
      heading_level: 2

================================================
FILE: docs/zh/api/protocol/page.md
================================================
# 页面协议

Chrome DevTools 协议的页面域命令、事件和类型。

## 方法

::: pydoll.protocol.page.methods
    options:
      show_root_heading: true
      show_source: false
      heading_level: 2

## 事件

::: pydoll.protocol.page.events
    options:
      show_root_heading: true
      show_source: false
      heading_level: 2

## 类型

::: pydoll.protocol.page.types
    options:
      show_root_heading: true
      show_source: false
      heading_level: 2

================================================
FILE: docs/zh/api/protocol/runtime.md
================================================
# 运行时协议

Chrome DevTools 协议的运行时域命令、事件和类型。

## 方法

::: pydoll.protocol.runtime.methods
    options:
      show_root_heading: true
      show_source: false
      heading_level: 2

## 事件

::: pydoll.protocol.runtime.events
    options:
      show_root_heading: true
      show_source: false
      heading_level: 2

## 类型

::: pydoll.protocol.runtime.types
    options:
      show_root_heading: true
      show_source: false
      heading_level: 2

================================================
FILE: docs/zh/api/protocol/storage.md
================================================
# 存储协议

Chrome DevTools 协议的存储域命令、事件和类型。

## 方法

::: pydoll.protocol.storage.methods
    options:
      show_root_heading: true
      show_source: false
      heading_level: 2

## 事件

::: pydoll.protocol.storage.events
    options:
      show_root_heading: true
      show_source: false
      heading_level: 2

## 类型

::: pydoll.protocol.storage.types
    options:
      show_root_heading: true
      show_source: false
      heading_level: 2

================================================
FILE: docs/zh/api/protocol/target.md
================================================
# 目标协议

Chrome DevTools 协议的目标域命令、事件和类型。

## 方法

::: pydoll.protocol.target.methods
    options:
      show_root_heading: true
      show_source: false
      heading_level: 2

## 事件

::: pydoll.protocol.target.events
    options:
      show_root_heading: true
      show_source: false
      heading_level: 2

## 类型

::: pydoll.protocol.target.types
    options:
      show_root_heading: true
      show_source: false
      heading_level: 2

================================================
FILE: docs/zh/deep-dive/architecture/browser-domain.md
================================================
# 浏览器域架构

浏览器域代表 Pydoll 自动化层次结构的最高级别，管理浏览器进程生命周期、CDP 连接、上下文隔离和全局浏览器操作。本文档探讨了浏览器级控制的内部架构、设计决策和技术实现。

!!! info "实用指南"
    有关实际示例和使用模式，请参阅[浏览器管理](../features/browser-management/tabs.md)和[浏览器上下文](../features/browser-management/contexts.md)指南。

## 架构概述

浏览器域位于进程管理、协议通信和资源协调的交叉点。它协调多个专门的组件，为浏览器自动化提供统一的接口：

```mermaid
graph TB
    subgraph "Browser Domain"
        Browser[Browser Instance]
        Browser --> ConnectionHandler[Connection Handler]
        Browser --> ProcessManager[Process Manager]
        Browser --> ProxyManager[Proxy Manager]
        Browser --> TempDirManager[Temp Directory Manager]
        Browser --> TabRegistry[Tab Registry]
        Browser --> ContextAuth[Context Proxy Auth]
    end
    
    ConnectionHandler <--> |WebSocket| CDP[Chrome DevTools Protocol]
    ProcessManager --> |Manages| BrowserProcess[Browser Process]
    TabRegistry --> Tab1[Tab Instance 1]
    TabRegistry --> Tab2[Tab Instance 2]
    TabRegistry --> Tab3[Tab Instance N]
    
    CDP <--> BrowserProcess
```

### 层次结构与抽象

浏览器域被实现为一个**抽象基类**，定义了所有浏览器实现的契约：

```python
class Browser(ABC):
    """Abstract base class for browser automation via CDP."""
    
    @abstractmethod
    def _get_default_binary_location(self) -> str:
        """子类必须提供特定于浏览器的可执行文件路径。"""
        pass
    
    async def start(self, headless: bool = False) -> Tab:
        """所有浏览器共享的具体实现。"""
        # 1. 解析二进制位置
        # 2. 设置用户数据目录
        # 3. 启动浏览器进程
        # 4. 验证 CDP 连接
        # 5. 配置代理（如果需要）
        # 6. 返回初始标签页
```

这种设计实现了**多态性** - Chrome、Edge 和其他基于 Chromium 的浏览器共享 99% 的代码，仅在可执行文件路径和次要标志变化上有所不同。

## 组件架构

Browser 类协调多个专门的管理器，每个管理器负责浏览器自动化的特定方面。理解这些组件是理解 Pydoll 设计的关键。

### 连接处理器

ConnectionHandler 是 Pydoll 和浏览器进程之间的**通信桥梁**。它管理：

- **WebSocket 生命周期**：连接建立、保持活动、重新连接
- **命令执行**：发送 CDP 命令并等待响应
- **事件分发**：将 CDP 事件路由到已注册的回调
- **回调注册表**：维护每个连接的事件监听器

```python
class Browser:
    def __init__(self, ...):
        # ConnectionHandler 使用端口或 WebSocket 地址初始化
        self._connection_handler = ConnectionHandler(self._connection_port)
    
    async def _execute_command(self, command, timeout=10):
        """所有 CDP 命令都通过连接处理器流动。"""
        return await self._connection_handler.execute_command(command, timeout)
```

!!! info "连接层深入探讨"
    有关 WebSocket 通信、命令/响应流程和异步模式的详细信息，请参阅[连接层架构](./connection-layer.md)。

### 进程管理器

BrowserProcessManager 处理**操作系统进程生命周期**：

```python
class BrowserProcessManager:
    def start_browser_process(self, binary, port, arguments):
        """
        1. 使用二进制路径 + 参数构造命令行
        2. 使用适当的 stdio 处理生成子进程
        3. 监控进程启动
        4. 存储进程句柄以供后续终止
        """
        
    def stop_process(self):
        """
        1. 尝试优雅终止（SIGTERM）
        2. 等待进程退出
        3. 如果超时则强制终止（SIGKILL）
        4. 清理进程资源
        """
```

**为什么要分离进程管理？**

- **可测试性**：进程管理器可以在单元测试中被模拟
- **跨平台**：封装特定于操作系统的进程处理
- **可靠性**：处理僵尸进程、孤立子进程等边缘情况

### 标签页注册表

Browser 维护一个 **Tab 实例注册表**以确保每个目标的单例行为：

```python
class Browser:
    def __init__(self, ...):
        self._tabs_opened: dict[str, Tab] = {}
    
    async def new_tab(self, url='', browser_context_id=None) -> Tab:
        # 通过 CDP 创建目标
        response = await self._execute_command(
            TargetCommands.create_target(browser_context_id=browser_context_id)
        )
        target_id = response['result']['targetId']
        
        # 检查标签页是否已存在于注册表中
        if target_id in self._tabs_opened:
            return self._tabs_opened[target_id]
        
        # 创建新的 Tab 实例并注册它
        tab = Tab(self, target_id=target_id, ...)
        self._tabs_opened[target_id] = tab
        return tab
```

**为什么使用单例 Tab 实例？**

- **状态一致性**：对同一标签页的多个引用共享状态（已启用的域、回调）
- **内存效率**：防止同一目标的重复 Tab 实例
- **事件路由**：确保事件路由到正确的 Tab 实例

### 代理身份验证架构

Pydoll 通过 Fetch 域实现**自动代理身份验证**，以避免在 CDP 命令中暴露凭据。根据代理范围，实现使用**两种不同的机制**：

#### 机制 1：浏览器级代理身份验证（全局代理）

当通过 `ChromiumOptions` 配置代理时（适用于默认上下文中的所有标签页）：

```python
# 在 Browser.start() -> _configure_proxy() 中
async def _configure_proxy(self, private_proxy, proxy_credentials):
    # 在浏览器级别启用 Fetch
    await self.enable_fetch_events(handle_auth_requests=True)
    
    # 在浏览器级别注册回调（影响所有标签页）
    await self.on(FetchEvent.REQUEST_PAUSED, self._continue_request_callback, temporary=True)
    await self.on(FetchEvent.AUTH_REQUIRED, 
                  partial(self._continue_request_with_auth_callback,
                          proxy_username=proxy_credentials[0],
                          proxy_password=proxy_credentials[1]),
                  temporary=True)
```

**作用域：**浏览器级 WebSocket 连接 → 影响**默认上下文中的所有标签页**

#### 机制 2：标签页级代理身份验证（按上下文代理）

当通过 `create_browser_context(proxy_server=...)` 为每个上下文配置代理时：

```python
# 按上下文存储凭据
async def create_browser_context(self, proxy_server, ...):
    sanitized_proxy, extracted_auth = self._sanitize_proxy_and_extract_auth(proxy_server)
    
    response = await self._execute_command(
        TargetCommands.create_browser_context(proxy_server=sanitized_proxy)
    )
    context_id = response['result']['browserContextId']
    
    if extracted_auth:
        self._context_proxy_auth[context_id] = extracted_auth  # 按上下文存储
    
    return context_id

# 为该上下文中的每个标签页设置身份验证
async def _setup_context_proxy_auth_for_tab(self, tab, browser_context_id):
    creds = self._context_proxy_auth.get(browser_context_id)
    if not creds:
        return
    
    # 在标签页上启用 Fetch（标签页级 WebSocket）
    await tab.enable_fetch_events(handle_auth=True)
    
    # 在标签页上注册回调（仅影响此标签页）
    await tab.on(FetchEvent.REQUEST_PAUSED, 
                 partial(self._tab_continue_request_callback, tab=tab), 
                 temporary=True)
    await tab.on(FetchEvent.AUTH_REQUIRED,
                 partial(self._tab_continue_request_with_auth_callback,
                         tab=tab,
                         proxy_username=creds[0],
                         proxy_password=creds[1]),
                 temporary=True)
```

**作用域：**标签页级 WebSocket 连接 → 仅影响**该特定标签页**

#### 为什么使用两种机制？

| 方面 | 浏览器级 | 标签页级 |
|--------|---------------|-----------|
| **触发器** | `ChromiumOptions` 中的代理 | `create_browser_context()` 中的代理 |
| **WebSocket** | 浏览器级连接 | 标签页级连接 |
| **作用域** | 默认上下文中的所有标签页 | 仅该上下文中的标签页 |
| **效率** | 所有标签页一个监听器 | 每个标签页一个监听器 |
| **隔离** | 无上下文分离 | 每个上下文具有不同的凭据 |

**标签页级身份验证的设计理由：**

- **上下文隔离**：每个上下文可以有**不同的代理**和**不同的凭据**
- **CDP 限制**：Fetch 域不能在浏览器级别限定到特定上下文
- **权衡**：效率稍低（每个标签页一个监听器），但对于按上下文代理支持是必需的

这种架构确保**凭据永远不会出现在 CDP 日志中**，身份验证以透明方式处理。

!!! warning "Fetch 域副作用"
    - **浏览器级 Fetch**：暂时暂停默认上下文中**所有标签页的所有请求**，直到身份验证完成
    - **标签页级 Fetch**：暂时暂停**该特定标签页的所有请求**，直到身份验证完成
    
    这是 CDP 限制 - Fetch 启用请求拦截。身份验证完成后，Fetch 被禁用以最小化开销。

## 初始化和生命周期

### 构造函数设计

Browser 构造函数初始化所有内部组件，但**不启动浏览器进程**。这种分离允许在启动之前进行配置：

```python
class Browser(ABC):
    def __init__(
        self,
        options_manager: BrowserOptionsManager,
        connection_port: Optional[int] = None,
    ):
        # 1. 验证参数
        self._validate_connection_port(connection_port)
        
        # 2. 通过管理器初始化选项
        self.options = options_manager.initialize_options()
        
        # 3. 确定 CDP 端口（如果未指定则随机）
        self._connection_port = connection_port or randint(9223, 9322)
        
        # 4. 初始化专门的管理器
        self._proxy_manager = ProxyManager(self.options)
        self._browser_process_manager = BrowserProcessManager()
        self._temp_directory_manager = TempDirectoryManager()
        self._connection_handler = ConnectionHandler(self._connection_port)
        
        # 5. 初始化状态跟踪
        self._tabs_opened: dict[str, Tab] = {}
        self._context_proxy_auth: dict[str, tuple[str, str]] = {}
        self._ws_address: Optional[str] = None
```

**关键设计决策：**

- **延迟进程启动**：构造函数是同步的；`start()` 是异步的
- **端口灵活性**：随机端口防止并行自动化中的冲突
- **选项管理器模式**：用于浏览器特定配置的策略模式
- **组件组合**：专门的管理器而不是单体类

### 启动序列

`start()` 方法协调浏览器启动和连接：

```python
async def start(self, headless: bool = False) -> Tab:
    # 1. 解析二进制位置
    binary_location = self.options.binary_location or self._get_default_binary_location()
    
    # 2. 设置用户数据目录（临时或持久）
    self._setup_user_dir()
    
    # 3. 提取代理凭据（如果是私有代理）
    proxy_config = self._proxy_manager.get_proxy_credentials()
    
    # 4. 使用参数启动浏览器进程
    self._browser_process_manager.start_browser_process(
        binary_location, self._connection_port, self.options.arguments
    )
    
    # 5. 验证 CDP 端点是否响应
    await self._verify_browser_running()
    
    # 6. 配置代理身份验证（通过 Fetch 域）
    await self._configure_proxy(proxy_config[0], proxy_config[1])
    
    # 7. 获取第一个有效目标并创建 Tab
    valid_tab_id = await self._get_valid_tab_id(await self.get_targets())
    tab = Tab(self, target_id=valid_tab_id, connection_port=self._connection_port)
    self._tabs_opened[valid_tab_id] = tab
    
    return tab
```

!!! tip "为什么 start() 返回一个 Tab"
    这是出于易用性考虑的**设计妥协**。理想情况下，`start()` 只会启动浏览器，用户会单独调用 `new_tab()`。但是，返回初始标签页减少了 90% 用例（单标签页自动化）的样板代码。权衡：即使在多标签页场景中也无法避免初始标签页。

### 上下文管理器协议

Browser 实现了 `__aenter__` 和 `__aexit__` 以自动清理：

```python
async def __aexit__(self, exc_type, exc_val, exc_tb):
    # 1. 恢复备份首选项（如果已修改）
    if self._backup_preferences_dir:
        shutil.copy2(self._backup_preferences_dir, ...)
    
    # 2. 检查浏览器是否仍在运行
    if await self._is_browser_running(timeout=2):
        await self.stop()
    
    # 3. 关闭 WebSocket 连接
    await self._connection_handler.close()
```

这确保即使在自动化期间发生异常也能正确清理。

## 浏览器上下文架构

浏览器上下文是 Pydoll 最复杂的隔离机制，在单个浏览器进程内提供**完整的浏览环境分离**。理解它们的架构对于高级自动化至关重要。

### CDP 层次结构：浏览器、上下文、目标

CDP 将浏览器结构组织为三个级别：

```mermaid
graph TB
    Browser[Browser Process]
    Browser --> DefaultContext[Default BrowserContext]
    Browser --> Context1[BrowserContext ID: abc-123]
    Browser --> Context2[BrowserContext ID: def-456]
    
    DefaultContext --> Target1[Target/Page ID: page-1]
    DefaultContext --> Target2[Target/Page ID: page-2]
    
    Context1 --> Target3[Target/Page ID: page-3]
    
    Context2 --> Target4[Target/Page ID: page-4]
    Context2 --> Target5[Target/Page ID: page-5]
```

**关键概念：**

1. **浏览器进程**：具有一个 CDP 端点的单个 Chromium 实例
2. **BrowserContext**：隔离的存储/缓存/权限边界（类似于无痕模式）
3. **目标**：单个页面、弹出窗口、worker 或后台目标

### 上下文隔离边界

每个浏览器上下文维护以下内容的**严格隔离**：

| 资源 | 隔离级别 | 实现 |
|----------|----------------|----------------|
| Cookies | 完全 | 每个上下文单独的 cookie jar |
| localStorage | 完全 | 每个上下文每个源单独的存储 |
| IndexedDB | 完全 | 每个上下文每个源单独的数据库 |
| 缓存 | 完全 | 每个上下文独立的 HTTP 缓存 |
| 权限 | 完全 | 上下文特定的权限授予 |
| 网络代理 | 完全 | 按上下文的代理配置 |
| 身份验证 | 完全 | 每个上下文独立的身份验证状态 |

!!! info "为什么上下文是轻量级的"
    与启动多个浏览器进程不同，上下文共享**渲染引擎、GPU 进程和网络栈**。只有存储和状态被隔离。这使得创建上下文比启动新的浏览器实例快 10-100 倍。

### 上下文创建和目标绑定

创建上下文和目标涉及两个 CDP 命令：

```python
# 步骤 1：创建隔离的浏览上下文
response = await self._execute_command(
    TargetCommands.create_browser_context(
        proxy_server='http://proxy.example.com:8080',
        proxy_bypass_list='localhost,127.0.0.1'
    )
)
context_id = response['result']['browserContextId']

# 步骤 2：在该上下文中创建目标（页面）
response = await self._execute_command(
    TargetCommands.create_target(
        browser_context_id=context_id  # 将目标绑定到上下文
    )
)
target_id = response['result']['targetId']
```

**关键细节：**`browser_context_id` 参数**将目标绑定到上下文的隔离边界**。没有它，目标将在默认上下文中创建。

### 有头模式下的窗口实体化

在**有头模式**（可见 UI）中，浏览器上下文有一个重要的物理约束：

- 上下文最初仅存在于**内存中**（无窗口）
- 在上下文中创建的**第一个目标必须**打开一个顶级窗口
- **后续目标**可以作为该窗口内的标签页打开

这是一个 **CDP/Chromium 限制**，而不是 Pydoll 的设计选择：

```python
# 上下文中的第一个目标：必须创建窗口
tab1 = await browser.new_tab(browser_context_id=context_id)  # 打开新窗口

# 后续目标：可以作为现有窗口中的标签页打开
tab2 = await browser.new_tab(browser_context_id=context_id)  # 作为标签页打开
```

**为什么这很重要？**

- 在**无头模式**中：完全无关（不渲染窗口）
- 在**有头模式**中：每个上下文的第一个目标将打开一个可见窗口
- 在**测试环境**中：多个上下文 → 多个窗口（可能会令人困惑）

!!! tip "无头上下文更干净"
    对于 CI/CD、抓取或批量自动化，请使用无头模式。上下文隔离的工作方式相同，但没有窗口实体化开销。

### 上下文删除和清理

删除上下文会**立即关闭其中的所有目标**：

```python
await browser.delete_browser_context(context_id)
# 此上下文中的所有标签页现已关闭
# 此上下文的所有存储已清除
# 上下文不能重用（ID 无效）
```

**清理序列：**

1. Pydoll 通过 CDP 发送 `Target.disposeBrowserContext` 命令
2. 浏览器关闭该上下文中的所有目标
3. 浏览器清除该上下文的所有存储
4. 浏览器使上下文 ID 无效
5. Pydoll 从内部注册表中删除上下文

## 浏览器级别的事件系统

浏览器域支持跨所有标签页和上下文操作的**浏览器级事件监听器**。这与标签页级事件不同。

### 浏览器与标签页事件作用域

```python
# 浏览器级事件：适用于所有标签页
await browser.on('Target.targetCreated', handle_new_target)

# 标签页级事件：适用于一个标签页
await tab.on('Page.loadEventFired', handle_page_load)
```

**架构差异：**

- **浏览器事件**使用**浏览器级 WebSocket 连接**（基于端口或 `ws://host/devtools/browser/...`）
- **标签页事件**使用**标签页级 WebSocket 连接**（`ws://host/devtools/page/<target_id>`）

### Fetch 域：全局请求拦截

Fetch 域可以在**浏览器和标签页**两个级别启用，具有不同的作用域：

```python
# 浏览器级 Fetch：拦截所有标签页的请求
await browser.enable_fetch_events(handle_auth_requests=True)
await browser.on('Fetch.requestPaused', handle_request)

# 标签页级 Fetch：拦截一个标签页的请求
await tab.enable_fetch_events(handle_auth=True)
await tab.on('Fetch.requestPaused', handle_request)
```

**何时使用每种方式：**

| 用例 | 级别 | 原因 |
|----------|-------|--------|
| 代理身份验证 | 浏览器 | 全局应用于所有上下文 |
| 广告拦截 | 浏览器 | 在所有标签页中拦截广告 |
| API 模拟 | 标签页 | 为特定测试模拟特定 API |
| 请求日志 | 标签页 | 仅记录相关标签页的请求 |

!!! warning "Fetch 性能影响"
    在浏览器级别启用 Fetch 会**暂停所有标签页的所有请求**，直到回调执行。这会为每个请求增加延迟。尽可能使用标签页级 Fetch 以最小化影响。

### 命令路由

所有 CDP 命令都通过浏览器的连接处理器流动：

```python
async def _execute_command(self, command, timeout=10):
    """
    将命令路由到适当的连接：
    - 浏览器级命令 → 浏览器 WebSocket
    - 标签页级命令 → 委托给 Tab 实例
    """
    return await self._connection_handler.execute_command(command, timeout)
```

这种集中式路由实现：

- **请求/响应关联**：通过 ID 匹配响应与请求
- **超时管理**：取消超过超时的命令
- **错误处理**：将 CDP 错误转换为 Python 异常

## 资源管理

### Cookie 和存储操作

浏览器域公开**浏览器级**和**上下文特定**的存储操作：

```python
# 浏览器级操作（所有上下文）
await browser.set_cookies(cookies)
await browser.get_cookies()
await browser.delete_all_cookies()

# 上下文特定操作
await browser.set_cookies(cookies, browser_context_id=context_id)
await browser.get_cookies(browser_context_id=context_id)
await browser.delete_all_cookies(browser_context_id=context_id)
```

这些操作在底层使用 **Storage 域**：

- `Storage.getCookies`：检索上下文或所有上下文的 cookie
- `Storage.setCookies`：使用域/路径/过期时间设置 cookie
- `Storage.clearCookies`：清除上下文或所有上下文的 cookie

!!! info "浏览器与标签页存储作用域"
    - **浏览器级**：对整个浏览器或特定上下文操作
    - **标签页级**：限定于标签页的当前源
    
    使用浏览器级进行全局 cookie 管理（例如，为所有域设置会话 cookie）。使用标签页级进行特定于源的操作（例如，注销后清除 cookie）。

### 权限授予

浏览器域提供**编程式权限控制**，绕过浏览器提示：

```python
await browser.grant_permissions(
    [PermissionType.GEOLOCATION, PermissionType.NOTIFICATIONS],
    origin='https://example.com',
    browser_context_id=context_id
)
```

**架构：**

- 通过 `Browser.grantPermissions` CDP 命令授予权限
- 权限是**上下文特定的**（每个上下文隔离）
- 授予会覆盖默认提示行为
- `reset_permissions()` 恢复到默认行为

### 下载管理

下载行为通过 `Browser.setDownloadBehavior` 命令配置：

```python
await browser.set_download_behavior(
    behavior=DownloadBehavior.ALLOW,
    download_path='/path/to/downloads',
    events_enabled=True,  # 发出下载进度事件
    browser_context_id=context_id
)
```

**选项：**

- `ALLOW`：保存到指定路径
- `DENY`：取消所有下载
- `DEFAULT`：显示浏览器的默认下载 UI

### 窗口管理

窗口操作应用于目标的**物理操作系统窗口**：

```python
window_id = await browser.get_window_id_for_target(target_id)
await browser.set_window_bounds({
    'left': 100, 'top': 100,
    'width': 1920, 'height': 1080,
    'windowState': 'normal'  # 或 'minimized'、'maximized'、'fullscreen'
})
```

**实现细节：**

- 使用 `Browser.getWindowForTarget` 从目标 ID 解析窗口 ID
- `Browser.setWindowBounds` 修改窗口几何形状
- **无头模式**：窗口操作是无操作的（不存在物理窗口）

## 架构洞察和设计权衡

### 单例标签页注册表：为什么？

标签页注册表模式（`_tabs_opened: dict[str, Tab]`）确保：

1. **事件路由正确工作**：CDP 事件包含 `targetId` 但没有 Tab 引用。注册表映射 `targetId` → `Tab` 以实现正确的回调分发。
2. **状态一致性**：引用同一目标的多个代码路径获得**相同的 Tab 实例**，防止状态分歧。
3. **内存效率**：没有注册表，`get_opened_tabs()` 会在每次调用时创建重复的 Tab 实例。

**权衡：**内存使用随标签页数量增长，但对于有状态的 Tab 实例这是不可避免的。

### 为什么 start() 返回一个 Tab

这个设计决策牺牲了纯粹性以换取**易用性**：

- **缺点**：即使在多标签页自动化中也无法避免初始标签页
- **优点**：90% 的用户（单标签页脚本）不需要样板代码：

```python
# start() 返回 Tab
tab = await browser.start()

# 不返回（纯粹设计）
await browser.start()
tab = await browser.new_tab()
```

**探索的替代方案：**在 `new_tab()` 中自动关闭初始标签页。该方案因行为出人意料（隐式副作用）而被否决。

### 代理身份验证：两级架构权衡

Pydoll 的代理身份验证使用两种不同的 Fetch 域策略：

**浏览器级（全局代理）：**
- **安全优势**：凭据永远不会记录在 CDP 跟踪中
- **性能成本**：Fetch 暂停**所有标签页的所有请求**，直到身份验证完成
- **效率**：默认上下文中所有标签页的单个监听器
- **缓解**：第一次身份验证后禁用 Fetch，最小化开销

**标签页级（按上下文代理）：**
- **安全优势**：凭据永远不会记录在 CDP 跟踪中
- **性能成本**：Fetch 暂停**该标签页的所有请求**，直到身份验证完成
- **效率**：每个标签页单独的监听器（效率较低，但对于隔离是必需的）
- **隔离优势**：每个上下文可以有不同的代理凭据
- **缓解**：每个标签页在第一次身份验证后禁用 Fetch

**为什么不使用 Browser.setProxyAuth？**这个 CDP 命令不存在。Fetch 是编程式身份验证的唯一机制。

**为什么对上下文使用标签页级？**CDP 的 Fetch 域不能限定到特定的 BrowserContext。由于每个上下文可以有不同的代理和不同的凭据，Pydoll 必须在标签页级别处理身份验证以尊重上下文边界。

### 端口随机化策略

随机 CDP 端口（9223-9322）防止并行运行浏览器实例时的冲突：

```python
self._connection_port = connection_port or randint(9223, 9322)
```

**为什么不从 9222 递增？**

- 多进程环境中的竞态条件（例如 pytest-xdist）
- 与用户的手动端口选择冲突

**权衡：**随机端口更难调试（无法硬编码）。解决方案：`browser._connection_port` 暴露所选端口。

### 组件分离：为什么使用管理器？

Browser 类委托给专门的管理器（ProcessManager、ProxyManager、TempDirManager、ConnectionHandler）以实现：

1. **可测试性**：管理器可以独立模拟
2. **可重用性**：ProxyManager 逻辑在 Browser 实现之间共享
3. **可维护性**：每个管理器都有单一职责
4. **跨平台**：特定于操作系统的逻辑在 ProcessManager 中隔离

**权衡：**更多的间接层次，但在规模上代码组织显著更好。

## 关键要点

1. **Browser 是一个协调器**，而不是单体。它协调管理器并处理 CDP 通信。
2. **标签页注册表确保每个目标对应唯一的 Tab 实例**，这对于事件路由和状态一致性至关重要。
3. **浏览器上下文是轻量级隔离**，共享浏览器进程但分离存储/缓存/身份验证。
4. **通过 Fetch 的代理身份验证**是一种安全权衡 - 隐藏凭据但增加延迟。
5. **事件系统有两个级别**：浏览器级和标签页特定，具有不同的 WebSocket 连接。
6. **组件分离**（管理器）改善了可测试性和跨平台支持。

## 相关文档

要深入了解相关架构组件：

- **[连接层](./connection-layer.md)**：WebSocket 通信、命令/响应流程、异步模式
- **[事件架构](./event-architecture.md)**：事件分发、回调管理、域启用
- **[标签页域](./tab-domain.md)**：标签页级操作、页面导航、元素查找
- **[CDP 深入探讨](./cdp.md)**：Chrome DevTools Protocol 基础
- **[代理架构](./proxy-architecture.md)**：网络级代理概念和实现

实际使用模式：

- **[标签页管理](../features/browser-management/tabs.md)**：多标签页自动化模式
- **[浏览器上下文](../features/browser-management/contexts.md)**：上下文隔离实践
- **[代理配置](../features/configuration/proxy.md)**：设置代理和身份验证


================================================
FILE: docs/zh/deep-dive/architecture/browser-requests-architecture.md
================================================
# 浏览器上下文请求架构

本文档探讨了 Pydoll 浏览器上下文 HTTP 请求系统的架构设计，该系统能够发起无缝继承浏览器会话状态、cookie 和身份验证的 HTTP 请求。

!!! info "实用指南"
    这是架构深入探讨。有关实际示例和用例，请参阅 [HTTP 请求指南](../features/network/http-requests.md)。

## 架构概述

浏览器上下文请求解决了混合自动化中的一个基本问题：在 UI 交互和 API 调用之间保持会话连续性。传统方法需要手动提取 cookie 和标头，在浏览器和 HTTP 客户端之间创建脆弱的耦合。

Pydoll 的架构通过在浏览器的 JavaScript 上下文**内部**执行 HTTP 请求来消除这种复杂性，同时利用 CDP 网络事件捕获 JavaScript 单独无法提供的全面元数据。

### 为什么选择这种架构？

| 传统方法 | Pydoll 架构 |
|---------------------|---------------------|
| 独立的 HTTP 客户端（requests、aiohttp） | 统一的基于浏览器的执行 |
| 手动 cookie 提取和同步 | 自动 cookie 继承 |
| 两个独立的会话状态 | 单一会话状态 |
| 有限的 CORS 处理 | 浏览器原生 CORS 强制执行 |
| 复杂的身份验证流程 | 透明的身份验证保留 |


## 组件架构

浏览器上下文请求系统由两个主要类组成，它们与 Pydoll 的事件系统协同工作：

```mermaid
classDiagram
    class Tab {
        +request: Request
        +enable_network_events()
        +disable_network_events()
        +get_network_response_body()
        +on(event_name, callback)
        +clear_callbacks()
    }
    
    class Request {
        -tab: Tab
        -_network_events_enabled: bool
        -_requests_sent: list
        -_requests_received: list
        +get(url, params, kwargs)
        +post(url, data, json, kwargs)
        +put(url, data, json, kwargs)
        +patch(url, data, json, kwargs)
        +delete(url, kwargs)
        +head(url, kwargs)
        +options(url, kwargs)
        -_execute_fetch_request()
        -_register_callbacks()
        -_extract_headers()
        -_extract_cookies()
    }
    
    class Response {
        -_status_code: int
        -_content: bytes
        -_text: str
        -_json: dict
        -_response_headers: list
        -_request_headers: list
        -_cookies: list
        -_url: str
        +ok: bool
        +status_code: int
        +text: str
        +content: bytes
        +url: str
        +headers: list
        +request_headers: list
        +cookies: list
        +json()
        +raise_for_status()
    }
    
    Tab *-- Request
    Request ..> Response : creates
    Request ..> Tab : uses events
```

### Request 类

`Request` 类作为接口层，提供类似 `requests` 的熟悉 API，同时协调 JavaScript 执行和网络事件监控之间的复杂交互。

**主要职责：**

- 将 Python 方法调用转换为 Fetch API JavaScript
- 管理临时网络事件监听器
- 在请求执行期间累积网络事件
- 从 CDP 事件中提取元数据
- 使用完整信息构造 Response 对象

### Response 类

`Response` 类提供与 `requests.Response` 兼容的接口，使从传统 HTTP 客户端迁移变得无缝。

**主要特性：**

- 多种内容访问器（文本、字节、JSON）
- 带缓存的延迟 JSON 解析
- 全面的标头信息（已发送和已接收）
- 从 Set-Cookie 标头提取 cookie
- 重定向后的最终 URL

## 执行流程

请求执行遵循六阶段管道：

```mermaid
flowchart TD
    Start([tab.request.get#40;url#41;]) --> Phase1[<b>1. 准备</b><br/>构建 URL + 选项]
    
    Phase1 --> Phase2[<b>2. 事件注册</b><br/>启用网络事件<br/>注册回调]
    
    Phase2 --> Phase3[<b>3. JavaScript 执行</b><br/>Runtime.evaluate#40;fetch#41;]
    
    Phase3 --> Phase4{<b>4. 网络活动</b>}
    Phase4 -->|请求已发送| Event1[REQUEST_WILL_BE_SENT]
    Phase4 -->|响应已接收| Event2[RESPONSE_RECEIVED]
    Phase4 -->|额外信息| Event3[*_EXTRA_INFO events]
    
    Event1 --> Collect[收集元数据]
    Event2 --> Collect
    Event3 --> Collect
    
    Collect --> Phase5[<b>5. 构造</b><br/>提取标头/cookie<br/>构建 Response 对象]
    
    Phase5 --> Phase6[<b>6. 清理</b><br/>清除回调<br/>禁用事件]
    
    Phase6 --> End([返回 Response])
```

### 阶段详情

| 阶段 | 层 | 关键操作 | 异步 |
|-------|-------|----------------|--------------|
| **1. 准备** | Request | URL 构建、选项格式化 | 否 |
| **2. 事件注册** | Tab | 启用事件、注册回调 | 是 |
| **3. JavaScript 执行** | CDP/Browser | 在浏览器上下文中执行 fetch() | 是 |
| **4. 网络活动** | Browser/CDP | HTTP 请求、发出 CDP 事件 | 是（并行） |
| **5. 构造** | Request | 解析事件、构建 Response | 否 |
| **6. 清理** | Tab | 删除回调、禁用事件 | 是 |

## 事件系统集成

浏览器上下文请求与 Pydoll 的事件系统架构紧密集成。理解这种关系至关重要。

### 临时事件生命周期

```mermaid
stateDiagram-v2
    [*] --> NoEvents: Request starts
    NoEvents --> EventsEnabled: Enable network events
    EventsEnabled --> CallbacksRegistered: Register callbacks
    CallbacksRegistered --> ExecutingRequest: Execute fetch
    ExecutingRequest --> CapturingEvents: Events fire
    CapturingEvents --> ExecutingRequest: More events
    ExecutingRequest --> CleaningUp: Fetch completes
    CleaningUp --> CallbacksRemoved: Clear callbacks
    CallbacksRemoved --> EventsDisabled: Disable if needed
    EventsDisabled --> [*]: Request complete
```

### 为什么同时使用 JavaScript 和事件？

一个常见问题：如果 JavaScript 可以执行请求，为什么要使用网络事件？

| 信息来源 | JavaScript（Fetch API） | 网络事件（CDP） |
|-------------------|------------------------|----------------------|
| 响应状态 | 可用 | 可用 |
| 响应正文 | 可用 | 不可用 |
| 响应标头 | 部分（CORS 受限） | 完整 |
| 请求标头 | 不可访问 | 完整 |
| Set-Cookie 标头 | 浏览器隐藏 | 可用 |
| 时序信息 | 有限 | 全面 |
| 重定向链 | 仅最终 URL | 完整链 |

**解决方案：** 结合两个来源以获取完整信息。

!!! tip "互补技术"
    JavaScript 提供响应正文并在浏览器上下文中触发请求（带有 cookie、身份验证）。网络事件提供 JavaScript 安全策略隐藏的元数据。

### CDP 网络事件类型

该架构使用四种 CDP 事件类型来捕获完整的元数据：

| 事件 | 目的 | 关键信息 |
|-------|---------|----------------|
| `REQUEST_WILL_BE_SENT` | 主要传出请求 | URL、方法、标准标头 |
| `REQUEST_WILL_BE_SENT_EXTRA_INFO` | 额外请求元数据 | 关联的 cookie、原始标头 |
| `RESPONSE_RECEIVED` | 主要响应已接收 | 状态、标头、MIME 类型、时序 |
| `RESPONSE_RECEIVED_EXTRA_INFO` | 额外响应元数据 | Set-Cookie 标头、安全信息 |

!!! info "事件多重性"
    单个 HTTP 请求生成多个 CDP 事件。Request 类累积所有相关事件，并在构造阶段提取非重复信息。

## 标头和 Cookie 架构

### 标头提取策略

标头存在于多个 CDP 事件中，可能存在重复。该架构使用去重策略：

```mermaid
flowchart TD
    A[Network Events] --> B{Event Type}
    B -->|REQUEST events| C[Extract Sent Headers]
    B -->|RESPONSE events| D[Extract Received Headers]
    
    C --> E[Deduplicate by name+value]
    D --> F[Deduplicate by name+value]
    
    E --> G[Request Headers List]
    F --> H[Response Headers List]
    
    G --> I[Response Object]
    H --> I
```

**去重逻辑：**

1. 按顺序处理事件
2. 每个标头由 `(name, value)` 元组标识
3. 仅保留每个元组的第一次出现
4. 结果：唯一、非冗余的标头列表

### Cookie 解析架构

Cookie 需要特殊处理，因为它们来自 `RESPONSE_RECEIVED_EXTRA_INFO` 事件中的 `Set-Cookie` 标头：

```mermaid
flowchart TD
    A[RESPONSE_RECEIVED_EXTRA_INFO] --> B[Extract Set-Cookie headers]
    B --> C{Multi-line header?}
    C -->|Yes| D[Split by newline]
    C -->|No| E[Parse single cookie]
    D --> F[Parse each line]
    F --> G[Extract name=value]
    E --> G
    G --> H{Valid name?}
    H -->|Yes| I[Create CookieParam]
    H -->|No| J[Discard]
    I --> K[Add to cookie list]
    K --> L[Deduplicate]
    L --> M[Response Object]
```

**Cookie 提取原则：**

- 只有 `EXTRA_INFO` 事件包含 `Set-Cookie` 标头
- 忽略 Cookie 属性（Path、Domain、Secure、HttpOnly）
- 浏览器在内部管理 cookie 属性
- 仅提取名称-值对以供参考

!!! warning "Cookie 范围"
    `Response.cookies` 属性仅包含来自此特定响应的**新的或更新的** cookie。现有浏览器 cookie 会自动管理，不会通过此接口公开。

## JavaScript 执行上下文

Fetch API 执行发生在浏览器的 JavaScript 上下文中，这是该架构强大功能的关键：

### Fetch API 集成

请求被转换为 JavaScript：

```javascript
// 简化表示
(async () => {
    const response = await fetch(url, {
        method: 'GET',
        headers: {'X-Custom': 'value'},
        // 浏览器自动添加：
        // - Cookie 标头
        // - 如果设置了 Authorization
        // - 标准标头（User-Agent、Accept 等）
    });
    
    return {
        status: response.status,
        url: response.url,  // 重定向后的最终 URL
        text: await response.text(),
        content: new Uint8Array(await response.arrayBuffer()),
        json: response.headers.get('Content-Type')?.includes('application/json')
            ? await response.clone().json()
            : null
    };
})()
```

### 浏览器上下文优势

在浏览器上下文中执行提供：

| 优势 | 描述 |
|---------|-------------|
| **自动 Cookie 包含** | 浏览器自动发送所有适用的 cookie |
| **身份验证状态保留** | 从浏览器会话维护身份验证标头 |
| **CORS 强制执行** | 浏览器应用与用户交互相同的 CORS 策略 |
| **TLS/SSL 处理** | 应用浏览器的证书验证和安全策略 |
| **压缩** | 自动处理 gzip、br、deflate |
| **重定向** | 浏览器透明地跟随重定向 |
| **相同安全上下文** | 请求与用户发起的请求完全相同 |

!!! info "反机器人检测"
    在浏览器上下文中执行的请求与用户发起的请求无法区分，使其对分析请求模式的反机器人系统有效。

## 性能考虑

### 事件开销

网络事件为请求执行增加了开销：

| 场景 | 开销 | 建议 |
|----------|----------|----------------|
| 单个请求 | 低 | 可接受 |
| 多个顺序请求 | 中等 | 启用一次事件 |
| 批量请求（100+） | 高 | 考虑在标签页级别启用事件 |
| 长时间运行的自动化 | 内存问题 | 完成后禁用 |

### 优化模式

```python
# 低效 - 事件反复启用/禁用
for url in urls:
    response = await tab.request.get(url)

# 高效 - 事件启用一次
await tab.enable_network_events()
for url in urls:
    response = await tab.request.get(url)
await tab.disable_network_events()
```

!!! tip "自动优化"
    Request 类检查网络事件是否已启用，并自动跳过冗余的启用/禁用操作。

### JSON 解析策略

Response JSON 解析使用带缓存的延迟评估：

1. 首次调用 `response.json()`：解析并缓存
2. 后续调用：返回缓存结果
3. 如果在构造期间预解析了 JSON：使用它

这可以防止冗余的解析开销。

## 安全架构

### CORS 策略强制执行

浏览器上下文请求遵守 CORS 策略：

```mermaid
flowchart TD
    A[tab.request.get#40;url#41;] --> B{Same Origin?}
    B -->|Yes| C[Request Allowed]
    B -->|No| D{CORS Headers Present?}
    D -->|Yes| E[Request Allowed]
    D -->|No| F[Request Blocked]
    
    C --> G[Response Returned]
    E --> G
    F --> H[CORS Error]
```

**CORS 行为：**

- 对同源的请求：始终允许
- 跨源请求：需要服务器的 CORS 标头
- 不透明响应：可能被浏览器阻止

**CORS 问题的解决方法：**

首先导航到域以建立同源上下文：

```python
await tab.go_to('https://different-domain.com')
response = await tab.request.get('https://different-domain.com/api')
```

### Cookie 安全

浏览器处理带有安全标志（`HttpOnly`、`Secure`、`SameSite`）的 Cookie：

- **HttpOnly cookie**：自动发送但不暴露给 JavaScript 或 CDP
- **Secure cookie**：仅通过 HTTPS 发送
- **SameSite cookie**：浏览器强制执行 SameSite 策略

由于这些安全限制，`Response.cookies` 属性可能不会显示所有 cookie。

### TLS/SSL 验证

浏览器验证 SSL 证书。自签名或无效证书会导致请求失败，除非：

```python
options = ChromiumOptions()
options.add_argument('--ignore-certificate-errors')
browser = Chrome(options=options)
```

!!! warning "安全权衡"
    禁用证书验证会降低安全性。仅在受控环境中使用。

## 限制和设计决策

### 请求正文大小

非常大的请求正文（文件、大型数据集）具有 JavaScript 内存约束。对于文件上传，请改用 `WebElement.set_input_files()` 或文件选择器拦截器。

### 二进制响应处理

二进制响应通过 JavaScript 的 `ArrayBuffer` 和 `Uint8Array` 转换，这会为非常大的响应（>100MB）增加一些开销。

### 重定向透明度

Fetch API 自动跟随重定向。仅捕获最终 URL。如果您需要重定向链，请单独使用网络监控。

### 事件时序

事件必须在执行 fetch **之前**注册。架构通过注册阶段确保这一点，但手动事件处理需要仔细的时序。

## 架构原则

浏览器上下文请求架构遵循以下原则：

1. **会话连续性**：永远不要破坏浏览器的会话状态
2. **零手动同步**：不需要 cookie/标头提取
3. **完整信息**：结合 JavaScript + 事件以获取完整元数据
4. **自动清理**：每个请求后释放资源
5. **熟悉的接口**：与 `requests` 兼容的 API，易于采用
6. **性能意识**：针对常见用例进行优化
7. **安全意识**：遵守浏览器安全策略

## 与其他系统的集成

### 事件系统依赖

浏览器上下文请求依赖于事件系统架构：

- 利用 `Tab.on()` 进行回调注册
- 使用 `Tab.clear_callbacks()` 进行清理
- 尊重现有的网络事件启用
- 与事件生命周期管理集成

详见[事件系统架构](event-architecture.md)。

### 类型系统集成

该架构广泛使用 Python 的类型系统：

- `HeaderEntry` TypedDict 用于标头
- `CookieParam` TypedDict 用于 cookie
- 来自 `pydoll.protocol.network.events` 的事件类型定义
- 提供 IDE 自动完成和类型安全

详见[类型系统](typing-system.md)。

## 进一步阅读

- **[HTTP 请求指南](../features/network/http-requests.md)** - 实际示例和用例
- **[事件系统架构](event-architecture.md)** - 事件系统内部设计
- **[网络监控](../features/network/monitoring.md)** - 被动网络观察
- **[请求拦截](../features/network/interception.md)** - 主动请求修改
- **[类型系统](typing-system.md)** - 类型系统集成

## 总结

Pydoll 的浏览器上下文请求架构通过结合 JavaScript Fetch API 执行和 CDP 网络事件监控来实现无缝 HTTP 通信。这种混合方法提供：

- 来自 JavaScript 和 CDP 事件的**完整元数据**
- 通过浏览器上下文执行实现**自动会话连续性**
- 与 requests 库兼容的**熟悉接口**
- 通过事件重用实现**性能优化**
- 符合浏览器策略的**安全合规性**

该架构展示了结合互补技术（JavaScript + CDP 事件）如何优雅地解决复杂问题，在不影响完整性或安全性的情况下提供强大功能和便利性。


================================================
FILE: docs/zh/deep-dive/architecture/event-architecture.md
================================================
# 事件系统架构

本文档探讨 Pydoll 事件系统的内部架构，涵盖 WebSocket 通信、事件流、回调管理和性能考虑。

!!! info "实用指南"
    有关实际示例和使用模式，请参阅 [事件系统指南](../features/advanced/event-system.md)。

## WebSocket 通信和 CDP

Pydoll 事件系统的核心是 Chrome DevTools Protocol（CDP），它提供了一种结构化的方式来通过 WebSocket 连接与浏览器活动进行交互和监控。这个双向通信通道允许你的代码向浏览器发送命令并接收事件。

```mermaid
sequenceDiagram
    participant Client as Pydoll Code
    participant Connection as ConnectionHandler
    participant WebSocket
    participant Browser
    
    Client->>Connection: Register callback for event
    Connection->>Connection: Store callback in registry
    
    Client->>Connection: Enable event domain
    Connection->>WebSocket: Send CDP command to enable domain
    WebSocket->>Browser: Forward command
    Browser-->>WebSocket: Acknowledge domain enabled
    WebSocket-->>Connection: Forward response
    Connection-->>Client: Domain enabled
    
    Browser->>WebSocket: Event occurs, sends CDP event message
    WebSocket->>Connection: Forward event message
    Connection->>Connection: Look up callbacks for this event
    Connection->>Client: Execute registered callback
```

### WebSocket 通信模型

Pydoll 和浏览器之间的 WebSocket 连接遵循以下模式：

1. **连接建立**：浏览器启动时，会创建一个 WebSocket 服务器，Pydoll 建立与其的连接
2. **双向消息传递**：Pydoll 和浏览器都可以随时发送消息
3. **消息类型**：
   - **命令**：从 Pydoll 发送到浏览器（例如导航、DOM 操作）
   - **命令响应**：浏览器响应命令发送给 Pydoll
   - **事件**：当浏览器发生某些事情时发送给 Pydoll（例如页面加载、网络活动）

### Chrome DevTools Protocol 结构

CDP 将其功能组织成域，每个域负责浏览器功能的特定区域：

| 域 | 职责 | 典型事件 |
|----|------|---------|
| Page | 页面生命周期 | 加载事件、导航、对话框 |
| Network | 网络活动 | 请求/响应监控、WebSockets |
| DOM | 文档结构 | DOM 变更、属性修改 |
| Fetch | 请求拦截 | 请求暂停、需要身份验证 |
| Runtime | JavaScript 执行 | 控制台消息、异常 |
| Browser | 浏览器管理 | 窗口创建、标签页、上下文 |

每个域必须在发出事件之前显式启用，这有助于通过仅处理实际需要的事件来管理性能。

## 域架构

### 启用/禁用模式

显式启用/禁用模式服务于几个重要的架构目的：

1. **性能优化**：通过仅启用你感兴趣的域，减少事件处理的开销
2. **资源管理**：某些事件域（如 Network 或 DOM 监控）可能产生大量消耗内存的事件
3. **协议合规**：CDP 要求在发出事件之前显式启用域
4. **受控清理**：显式禁用域确保在不再需要事件时进行适当的清理

```mermaid
stateDiagram-v2
    [*] --> Disabled: Initial State
    Disabled --> Enabled: enable_xxx_events()
    Enabled --> Disabled: disable_xxx_events()
    Enabled --> [*]: Tab Closed
    Disabled --> [*]: Tab Closed
```

!!! warning "事件泄漏防护"
    如果不再需要时未禁用事件域，可能导致内存泄漏和性能下降，特别是在长时间运行的自动化中。完成后始终禁用事件域，尤其是对于高容量事件（如网络监控）。

### 域特定的启用方法

不同的域通过适当对象上的特定方法启用：

| 域 | 启用方法 | 禁用方法 | 可用对象 |
|----|---------|---------|---------|
| Page | `enable_page_events()` | `disable_page_events()` | Tab |
| Network | `enable_network_events()` | `disable_network_events()` | Tab |
| DOM | `enable_dom_events()` | `disable_dom_events()` | Tab |
| Fetch | `enable_fetch_events()` | `disable_fetch_events()` | Tab, Browser |
| File Chooser | `enable_intercept_file_chooser_dialog()` | `disable_intercept_file_chooser_dialog()` | Tab |

!!! info "域所有权"
    事件根据其功能属于特定域。某些域仅在某些级别可用 - 例如，Page 事件在 Tab 实例上可用，但在 Browser 级别不直接可用。

## 事件注册系统

### `on()` 方法

订阅事件的核心方法是 `on()` 方法，在 Tab 和 Browser 实例上都可用：

```python
async def on(
    self, event_name: str, callback: callable, temporary: bool = False
) -> int:
    """
    注册事件监听器。

    Args:
        event_name (str): 要监听的事件名称。
        callback (callable): 事件触发时要执行的回调函数。
        temporary (bool): 如果为 True，回调将在触发一次后被删除。
            默认为 False。

    Returns:
        int: 已注册回调的 ID。
    """
```

此方法返回一个回调 ID，如果需要，可以稍后用于删除回调。

### 回调注册表

在内部，`ConnectionHandler` 维护一个回调注册表：

```python
{
    'Page.loadEventFired': [
        (callback_id_1, callback_function_1, temporary=False),
        (callback_id_2, callback_function_2, temporary=True),
    ],
    'Network.requestWillBeSent': [
        (callback_id_3, callback_function_3, temporary=False),
    ]
}
```

当事件通过 WebSocket 到达时：

1. 从消息中提取事件名称
2. 查询注册表以获取匹配的回调
3. 使用事件数据执行每个回调
4. 执行后删除临时回调

### 异步回调处理

回调可以是同步的或异步的。事件系统处理两者：

```python
async def _trigger_callbacks(self, event_name: str, event_data: dict):
    for cb_id, cb_data in self._event_callbacks.items():
        if cb_data['event'] == event_name:
            if asyncio.iscoroutinefunction(cb_data['callback']):
                await cb_data['callback'](event_data)
            else:
                cb_data['callback'](event_data)
```

异步回调按顺序等待。这意味着每个回调在下一个执行之前完成，这对以下方面很重要：

- **可预测的执行顺序**：回调按注册顺序执行
- **错误处理**：一个回调中的异常不会阻止其他回调执行
- **状态一致性**：回调可以依赖于顺序的状态更改

!!! info "顺序执行 vs 并发执行"
    回调在同一事件内顺序执行。但是，不同的事件可以并发处理，因为事件循环同时处理多个连接。

## 事件流和生命周期

事件生命周期遵循以下步骤：

```mermaid
flowchart TD
    A[Browser Activity] -->|Generates| B[CDP Event]
    B -->|Sent via WebSocket| C[ConnectionHandler]
    C -->|Filters by Event Name| D{Registered Callbacks?}
    D -->|Yes| E[Process Event]
    D -->|No| F[Discard Event]
    E -->|For Each Callback| G[Execute Callback]
    G -->|If Temporary| H[Remove Callback]
    G -->|If Permanent| I[Retain for Future Events]
```

### 详细流程

1. **浏览器活动**：浏览器中发生某些事情（页面加载、发送请求、DOM 变更）
2. **CDP 事件生成**：浏览器生成 CDP 事件消息
3. **WebSocket 传输**：消息通过 WebSocket 发送到 Pydoll
4. **事件接收**：ConnectionHandler 接收事件
5. **回调查找**：ConnectionHandler 在其注册表中检查与事件名称匹配的回调
6. **回调执行**：如果存在回调，则使用事件数据执行每个回调
7. **临时删除**：如果回调注册为临时回调，则在执行后将其删除

## 浏览器级别 vs 标签页级别事件

Pydoll 的事件系统在浏览器和标签页级别运行，具有重要的区别：

```mermaid
graph TD
    Browser[Browser Instance] -->|"Global Events (e.g., Target events)"| BrowserCallbacks[Browser-Level Callbacks]
    Browser -->|"Creates"| Tab1[Tab Instance 1]
    Browser -->|"Creates"| Tab2[Tab Instance 2]
    Tab1 -->|"Tab-Specific Events"| Tab1Callbacks[Tab 1 Callbacks]
    Tab2 -->|"Tab-Specific Events"| Tab2Callbacks[Tab 2 Callbacks]
```

### 浏览器级别事件

浏览器级别事件在所有标签页中全局操作。这些事件仅限于特定域，如：

- **Target 事件**：标签页创建、销毁、崩溃
- **Browser 事件**：窗口管理、下载协调

```python
# 浏览器级别事件注册
await browser.on('Target.targetCreated', handle_new_target)
```

浏览器级别的事件域是有限的，尝试使用标签页特定的事件将引发异常。

### 标签页级别事件

标签页级别事件特定于单个标签页：

```python
# 每个标签页都有自己的事件上下文
tab1 = await browser.start()
tab2 = await browser.new_tab()

await tab1.enable_page_events()
await tab1.on(PageEvent.LOAD_EVENT_FIRED, handle_tab1_load)

await tab2.enable_page_events()
await tab2.on(PageEvent.LOAD_EVENT_FIRED, handle_tab2_load)
```

此架构允许：

- **隔离的事件处理**：一个标签页中的事件不会影响其他标签页
- **每个标签页的配置**：不同的标签页可以监控不同的事件类型
- **资源效率**：仅在需要的标签页上启用事件

!!! info "域特定范围"
    并非所有事件域在两个级别都可用：
    
    - **Fetch 事件**：在浏览器和标签页级别都可用
    - **Page 事件**：仅在标签页级别可用
    - **Target 事件**：仅在浏览器级别可用

## 性能架构

### 事件系统开销

事件系统为浏览器自动化增加了开销，特别是对于高频事件：

| 事件域 | 典型事件量 | 性能影响 |
|--------|----------|---------|
| Page | 低 | 最小 |
| Network | 高 | 中等到高 |
| DOM | 非常高 | 高 |
| Fetch | 中等 | 中等（拦截时更高） |

### 性能优化策略

1. **选择性域启用**：仅启用你正在积极使用的事件域
2. **战略范围**：仅对真正的浏览器范围的问题使用浏览器级别事件
3. **及时禁用**：完成后始终禁用事件域
4. **早期过滤**：在回调中，尽早过滤掉无关的事件
5. **临时回调**：对一次性事件使用 `temporary=True` 标志

### 内存管理

事件系统通过几种机制管理内存：

1. **回调注册表清理**：删除回调释放其引用
2. **临时自动删除**：临时回调会自动清理
3. **域禁用**：禁用域会停止事件生成
4. **标签页关闭**：标签页关闭时，其所有回调会自动删除

!!! warning "内存泄漏防护"
    在长时间运行的自动化中，完成后始终清理回调并禁用域。高频事件（尤其是 DOM）如果保持启用状态，可能会累积大量内存。

## Connection Handler 架构

`ConnectionHandler` 是管理 WebSocket 通信和事件分发的核心组件。

### 关键职责

1. **WebSocket 管理**：建立和维护 WebSocket 连接
2. **消息路由**：区分命令响应和事件
3. **回调注册表**：维护事件名称到回调的映射
4. **事件分发**：事件到达时执行注册的回调
5. **清理**：删除回调并关闭连接

### 内部结构

```python
class ConnectionHandler:
    def __init__(self, ...):
        self._events_handler = EventsManager()
        self._websocket = None
        # ... other attributes
    
    async def register_callback(self, event_name, callback, temporary):
        return self._events_handler.register_callback(event_name, callback, temporary)

class EventsManager:
    def __init__(self):
        self._event_callbacks = {}  # Callback ID -> callback data
        self._callback_id = 0
    
    def register_callback(self, event_name, callback, temporary):
        self._callback_id += 1
        self._event_callbacks[self._callback_id] = {
            'event': event_name,
            'callback': callback,
            'temporary': temporary
        }
        return self._callback_id
    
    async def _trigger_callbacks(self, event_name, event_data):
        callbacks_to_remove = []
        
        for cb_id, cb_data in self._event_callbacks.items():
            if cb_data['event'] == event_name:
                # Execute callback (await if async, call directly if sync)
                if asyncio.iscoroutinefunction(cb_data['callback']):
                    await cb_data['callback'](event_data)
                else:
                    cb_data['callback'](event_data)
                
                # Mark temporary callbacks for removal
                if cb_data['temporary']:
                    callbacks_to_remove.append(cb_id)
        
        # Remove temporary callbacks after all callbacks executed
        for cb_id in callbacks_to_remove:
            self.remove_callback(cb_id)
```

此架构确保：

- **按名称分发**：根据事件名称在回调注册表中匹配对应的回调
- **最小开销**：仅处理已注册的事件
- **自动清理**：临时回调在执行后被删除
- **异步安全**：操作在同一事件循环内是异步安全的

## 事件消息格式

CDP 事件遵循标准化的消息格式：

```json
{
    "method": "Network.requestWillBeSent",
    "params": {
        "requestId": "1234.56",
        "loaderId": "7890.12",
        "documentURL": "https://example.com",
        "request": {
            "url": "https://api.example.com/data",
            "method": "GET",
            "headers": {...}
        },
        "timestamp": 123456.789,
        "wallTime": 1234567890.123,
        "initiator": {...},
        "type": "XHR"
    }
}
```

关键组件：

- **`method`**：`Domain.eventName` 格式的事件名称
- **`params`**：事件特定数据，因事件类型而异
- **无 `id` 字段**：与命令不同，事件没有请求 ID

事件系统提取 `method` 字段以路由到适当的回调，将整个消息传递给每个回调。

## 多标签页事件协调

Pydoll 的架构支持复杂的多标签页事件协调：

### 独立标签页上下文

每个标签页维护自己的：

- 事件域启用状态
- 回调注册表
- 事件通信通道
- 网络日志（如果启用了网络事件）

!!! info "通信架构"
    每个标签页都有自己与浏览器的事件通信通道。有关 WebSocket 连接和目标 ID 在协议级别如何工作的技术细节，请参阅 [浏览器域架构](./browser-domain.md)。

### 共享浏览器上下文

多个标签页可以共享：

- 浏览器级别事件监听器
- Cookie 存储
- 缓存
- 浏览器进程

此架构允许：

1. **并行事件处理**：多个标签页可以同时处理事件
2. **隔离的故障**：一个标签页中的问题不会影响其他标签页
3. **资源共享**：高效共享常见的浏览器功能
4. **协调操作**：浏览器级别事件可以协调跨标签页活动

## 结论

Pydoll 的事件系统架构旨在：

- **性能**：通过选择性域启用和高效回调分发实现最小开销
- **灵活性**：支持浏览器级别和标签页级别事件
- **可扩展性**：使用独立的事件上下文处理多个标签页
- **可靠性**：自动清理和内存管理

理解此架构可以帮助你：

- **优化性能**：了解哪些域具有高开销
- **调试问题**：当事情不按预期工作时理解事件流
- **设计更好的自动化**：利用架构实现高效的事件驱动工作流
- **避免陷阱**：防止内存泄漏和性能下降

有关实际使用模式和示例，请参阅 [事件系统指南](../features/advanced/event-system.md)。


================================================
FILE: docs/zh/deep-dive/architecture/find-elements-mixin.md
================================================
# FindElements Mixin 架构

FindElementsMixin 代表了 Pydoll 中的一个关键架构决策：使用**组合优于继承**在 `Tab` 和 `WebElement` 之间共享元素查找能力，而不通过公共基类耦合它们。本文档探讨 mixin 模式、其实现以及元素定位的内部机制。

!!! info "实用使用指南"
    有关实际示例和使用模式，请参阅[元素查找指南](../features/automation/element-finding.md)和[选择器指南](./selectors-guide.md)。

## Mixin 模式：设计理念

### 什么是 Mixin？

Mixin 是一个旨在**向其他类提供方法**的类，而不是传统继承层次结构中的基类。与标准继承（建模"is-a"关系）不同，mixin 建模**"can-do"能力**。

```python
# 传统继承："is-a"
class Animal:
    def breathe(self): ...

class Dog(Animal):  # Dog IS-A Animal（狗是一种动物）
    def bark(self): ...

# Mixin 模式："can-do"
class FlyableMixin:
    def fly(self): ...

class Bird(Animal, FlyableMixin):  # Bird IS-A Animal, CAN fly（鸟是动物，能飞）
    pass
```

### 为什么使用 Mixin 而不是继承？

Pydoll 面临特定的架构挑战：

- **`Tab`** 需要在**文档上下文**中查找元素
- **`WebElement`** 需要**相对于自身**查找元素（子元素）
- 两者都需要**相同的选择器逻辑**（CSS、XPath、属性构建）

**选项 1：共享基类**

```python
class ElementLocator:
    def find(...): ...

class Tab(ElementLocator):
    pass

class WebElement(ElementLocator):
    pass
```

**问题：**
- 紧耦合：`Tab` 和 `WebElement` 现在共享继承层次结构
- 违反单一职责：`Tab` 不应该从与 `WebElement` 相同的类继承
- 难以扩展：添加新功能需要修改基类

**选项 2：Mixin 模式（选定方法）**

```python
class FindElementsMixin:
    def find(...): ...
    def query(...): ...

class Tab(FindElementsMixin):
    # Tab 特定逻辑
    pass

class WebElement(FindElementsMixin):
    # WebElement 特定逻辑
    pass
```

**优点：**

- **解耦**：`Tab` 和 `WebElement` 保持独立
- **可重用性**：两个类中使用相同的元素查找逻辑
- **可组合性**：可以添加其他 mixin 而不会冲突
- **可测试性**：Mixin 可以单独测试

!!! tip "Mixin 特性"
    1. **无状态**：Mixin 不维护自己的状态（没有 `__init__`）
    2. **依赖注入**：假定使用类提供依赖项（例如 `_connection_handler`）
    3. **单一目的**：每个 mixin 提供一个内聚的能力
    4. **不可实例化**：永远不要直接创建 `FindElementsMixin()`

## Pydoll 中的 Mixin 实现

### 类结构

FindElementsMixin 使用**依赖注入**与提供 `_connection_handler` 的任何类一起工作：

```python
class FindElementsMixin:
    """
    提供元素查找能力的 Mixin。
    
    假定使用类具有：
    - _connection_handler: 用于 CDP 命令的 ConnectionHandler 实例
    - _object_id: 用于上下文相对搜索的 Optional[str]（仅 WebElement）
    """
    
    if TYPE_CHECKING:
        _connection_handler: ConnectionHandler  # 类型提示，不是实际属性
    
    async def find(self, ...):
        # 实现使用 self._connection_handler
        # 检查 self._object_id 以确定上下文
```

**关键见解：** Mixin 不定义 `_connection_handler` 或 `_object_id`。它通过鸭子类型**假定**它们存在。

### Tab 和 WebElement 如何使用 Mixin

```python
# Tab：文档级搜索
class Tab(FindElementsMixin):
    def __init__(self, browser, target_id, connection_port):
        self._connection_handler = ConnectionHandler(connection_port)
        # 没有 _object_id → 从文档根开始搜索

# WebElement：元素相对搜索
class WebElement(FindElementsMixin):
    def __init__(self, object_id, connection_handler, ...):
        self._object_id = object_id  # CDP 对象 ID
        self._connection_handler = connection_handler
        # 有 _object_id → 相对于此元素搜索
```

**关键区别：**

- **Tab**：`hasattr(self, '_object_id')` → `False` → 使用 `RuntimeCommands.evaluate()`（文档上下文）
- **WebElement**：`hasattr(self, '_object_id')` → `True` → 使用 `RuntimeCommands.call_function_on()`（元素上下文）

### 上下文检测

Mixin 动态检测搜索上下文：

```python
async def _find_element(self, by, value, raise_exc=True):
    if hasattr(self, '_object_id'):
        # 相对搜索：在此元素上调用 JavaScript 函数
        command = self._get_find_element_command(by, value, self._object_id)
    else:
        # 文档搜索：在全局上下文中评估 JavaScript
        command = self._get_find_element_command(by, value)
    
    response = await self._execute_command(command)
    # ...
```

这个单一实现处理两者：

- `tab.find(id='submit')` → 搜索整个文档
- `form_element.find(id='submit')` → 在 `form_element` 内搜索

!!! warning "Mixin 依赖耦合"
    Mixin **紧密耦合**到 CDP 的对象模型。它假定：
    
    - 元素由 `objectId` 字符串表示
    - 文档搜索使用 `Runtime.evaluate()`
    - 元素相对搜索使用 `Runtime.callFunctionOn()`
    
    这是可以接受的，因为 Pydoll 是 **CDP 特定的**。更通用的设计需要抽象层。

## 公共 API 设计

Mixin 暴露两个具有不同设计理念的高级方法：

### find()：基于属性的选择

```python
@overload
async def find(self, find_all: Literal[False], ...) -> WebElement: ...

@overload
async def find(self, find_all: Literal[True], ...) -> list[WebElement]: ...

async def find(
    self,
    id: Optional[str] = None,
    class_name: Optional[str] = None,
    name: Optional[str] = None,
    tag_name: Optional[str] = None,
    text: Optional[str] = None,
    timeout: int = 0,
    find_all: bool = False,
    raise_exc: bool = True,
    **attributes,
) -> Union[WebElement, list[WebElement], None]:
```

**设计决策：**

1. **Kwargs 优于位置 By 枚举**：
   ```python
   # Pydoll（直观）
   await tab.find(id='submit', class_name='primary')
   
   # Selenium（冗长）
   driver.find_element(By.ID, 'submit')  # 不容易组合属性
   ```

2. **自动解析为最佳选择器**：
   - 单个属性 → 使用 `By.ID`、`By.CLASS_NAME` 等（最快）
   - 多个属性 → 构建 XPath（灵活但较慢）

3. **`**attributes` 用于扩展性**：
   ```python
   await tab.find(data_testid='submit-btn', aria_label='Submit form')
   # 构建：//*[@data-testid='submit-btn' and @aria-label='Submit form']
   ```

### query()：基于表达式的选择

```python
@overload
async def query(self, expression, find_all: Literal[False], ...) -> WebElement: ...

@overload
async def query(self, expression, find_all: Literal[True], ...) -> list[WebElement]: ...

async def query(
    self, 
    expression: str, 
    timeout: int = 0, 
    find_all: bool = False, 
    raise_exc: bool = True
) -> Union[WebElement, list[WebElement], None]:
```

**设计决策：**

1. **自动检测 CSS vs XPath**：
   ```python
   # XPath 检测（以 /、./ 或 (/ 开头）
   await tab.query("//div[@id='content']")
   
   # CSS 检测（默认）
   await tab.query("div#content > p.intro")
   ```

2. **单个表达式参数**（与 `find()` 不同）：
   - 假定用户知道选择器语法
   - 没有抽象开销

3. **直接传递到浏览器**：
   - CSS 使用 `querySelector()` / `querySelectorAll()`
   - XPath 使用 `document.evaluate()`

### 类型安全的重载模式

两种方法都使用 `@overload` 提供**精确的返回类型**：

```python
# IDE 知道返回类型是 WebElement
element = await tab.find(id='submit')

# IDE 知道返回类型是 list[WebElement]
elements = await tab.find(class_name='item', find_all=True)

# IDE 知道返回类型是 Optional[WebElement]
maybe_element = await tab.find(id='optional', raise_exc=False)
```

这对于 IDE 自动完成和类型检查至关重要。有关详细信息，请参阅[类型系统深入了解](./typing-system.md)。

## 选择器解析架构

Mixin 通过解析管道将用户输入转换为 CDP 命令：

| 阶段 | 输入 | 输出 | 关键决策 |
|-------|-------|--------|-------------|
| **1. 方法选择** | `find()` kwargs 或 `query()` 表达式 | 选择器策略 | 基于属性 vs 基于表达式 |
| **2. 策略解析** | 属性或表达式 | `By` 枚举 + 值 | 单个属性 → 原生方法，多个 → XPath |
| **3. 上下文检测** | `By` + 值 + `hasattr(_object_id)` | CDP 命令类型 | 文档 vs 元素相对搜索 |
| **4. 命令生成** | CDP 命令类型 + 选择器 | JavaScript + CDP 方法 | `evaluate()` vs `callFunctionOn()` |
| **5. 执行** | CDP 命令 | `objectId` 或 `objectId` 数组 | 通过 ConnectionHandler |
| **6. WebElement 创建** | `objectId` + 属性 | `WebElement` 实例 | 工厂函数避免循环导入 |

### 关键架构决策

**1. 单个 vs 多个属性**

```python
# 单个属性 → 直接选择器（快速）
await tab.find(id='username')  # 使用 By.ID → getElementById()

# 多个属性 → XPath（灵活）
await tab.find(tag_name='input', type='password', name='pwd')
# → //input[@type='password' and @name='pwd']
```

**为什么这很重要：**
- 原生方法（`getElementById`、`getElementsByClassName`）比 XPath 快 10-50%
- 组合属性时 XPath 开销可接受（无替代方案）

**2. 选择器类型的自动检测**

```python
await tab.query("//div")       # 以 / 开头 → XPath
await tab.query("#login")      # 默认 → CSS
```

**实现：**
```python
if expression.startswith(('./', '/', '(/')):
    return By.XPATH
return By.CSS_SELECTOR
```

启发式是**明确的** - CSS 选择器不能以 `/` 开头。

**3. XPath 相对路径调整**

对于元素相对搜索，绝对 XPath 必须转换：

```python
# 用户提供：//div
# 对于 WebElement：.//div（相对于元素，而不是文档）

def _ensure_relative_xpath(xpath):
    return f'.{xpath}' if not xpath.startswith('.') else xpath
```

没有这个，`element.find()` 将从文档根开始搜索。

## CDP 命令生成

Mixin 根据搜索上下文路由到不同的 CDP 方法：

| 上下文 | 选择器类型 | CDP 方法 | JavaScript 等价 |
|---------|--------------|------------|---------------------|
| 文档 | CSS | `Runtime.evaluate` | `document.querySelector()` |
| 文档 | XPath | `Runtime.evaluate` | `document.evaluate()` |
| 元素 | CSS | `Runtime.callFunctionOn` | `this.querySelector()` |
| 元素 | XPath | `Runtime.callFunctionOn` | `document.evaluate(..., this)` |

**关键见解：** `Runtime.callFunctionOn` 需要一个 `objectId`（要调用的元素），而 `Runtime.evaluate` 在全局范围内执行。

### JavaScript 模板

Pydoll 使用预定义的模板以保持一致性和性能：

```python
# CSS 选择器
Scripts.QUERY_SELECTOR = 'document.querySelector("{selector}")'
Scripts.RELATIVE_QUERY_SELECTOR = 'this.querySelector("{selector}")'

# XPath 表达式
Scripts.FIND_XPATH_ELEMENT = '''
    document.evaluate("{escaped_value}", document, null,
                      XPathResult.FIRST_ORDERED_NODE_TYPE, null).singleNodeValue
'''
```

模板避免运行时字符串连接并集中 JavaScript 代码。

## 对象 ID 解析和 WebElement 创建

CDP 将 DOM 节点表示为 **`objectId` 字符串**。Mixin 抽象了这一点：

**单个元素流程：**
1. 执行 CDP 命令 → 从响应中提取 `objectId`
2. 调用 `DOM.describeNode(objectId)` → 获取属性、标签名
3. 创建 `WebElement(objectId, connection_handler, attributes)`

**多个元素流程：**
1. 执行 CDP 命令 → 返回**作为单个远程对象的数组**
2. 调用 `Runtime.getProperties(array_objectId)` → 枚举数组索引
3. 为每个元素提取单独的 `objectId`
4. 描述并为每个创建 `WebElement`

**为什么使用 `Runtime.getProperties`？** CDP 不直接返回数组 - 它返回对数组对象的**引用**。我们必须枚举其属性以提取单个元素。

## 架构见解和设计权衡

### 为什么使用 Kwargs 而不是 By 枚举？

**Pydoll 的选择：**
```python
await tab.find(id='submit', class_name='primary')
```

**Selenium 的方法：**
```python
driver.find_element(By.ID, 'submit')  # 不能组合属性
```

**理由：**

- **可发现性**：IDE 自动完成显示所有可用参数
- **可组合性**：可以在一次调用中组合多个属性
- **可读性**：`id='submit'` 比 `(By.ID, 'submit')` 更直观

**权衡：** Kwargs 对选择器策略不够明确。通过文档和日志记录解决。

### 为什么自动检测 CSS vs XPath？

`_get_expression_type()` 启发式消除了用户负担：

```python
await tab.query("//div")       # 自动：XPath
await tab.query("#login")      # 自动：CSS
await tab.query("div > p")     # 自动：CSS
```

**优点：**

- **易用性**：用户不需要指定选择器类型
- **正确性**：不可能误用（使用 CSS 方法的 XPath，反之亦然）

**限制：** 无法强制对模糊选择器进行 CSS 解释（罕见的边缘情况）。

### 防止循环导入：create_web_element()

Mixin 使用**工厂函数**来避免循环导入：

```python
def create_web_element(*args, **kwargs):
    """在运行时动态导入 WebElement。"""
    from pydoll.elements.web_element import WebElement  # 延迟导入
    return WebElement(*args, **kwargs)
```

**为什么需要？**

- `FindElementsMixin` → 需要创建 `WebElement`
- `WebElement` → 从 `FindElementsMixin` 继承
- 循环依赖！

**解决方案：** 工厂函数内的延迟导入。导入仅在调用函数时执行，打破循环。

### hasattr() 进行上下文检测：优雅还是 Hacky？

Mixin 使用 `hasattr(self, '_object_id')` 检测 Tab vs WebElement：

```python
if hasattr(self, '_object_id'):
    # WebElement：元素相对搜索
else:
    # Tab：文档级搜索
```

**这是"hacky"吗？**

- **不是**：这是**鸭子类型**（Pythonic 的惯用做法）
- Mixin 不需要知道类层次结构
- Tab 和 WebElement 都提供 `_connection_handler`
- WebElement 另外提供 `_object_id`

**替代方法：**

1. **类型检查**：`if isinstance(self, WebElement)` → 将 mixin 耦合到 WebElement
2. **抽象方法**：要求 Tab/WebElement 实现 `get_search_context()` → 更多样板代码
3. **依赖注入**：将上下文作为参数传递 → 破坏 API 的易用性

**结论：** `hasattr()` 是此用例的最佳解决方案。

## 关键要点

1. **Mixin 实现代码共享**，而不通过继承耦合 `Tab` 和 `WebElement`
2. **通过鸭子类型进行上下文检测**（`hasattr`）使 mixin 与类层次结构解耦
3. **自动解析优化性能**，通过对单个属性使用原生方法
4. **XPath 构建提供可组合性**用于多属性查询
5. **基于轮询的等待很简单**，但以 CPU 周期换取实现简单性
6. **CDP 对象模型复杂性**隐藏在 WebElement 抽象后面
7. **通过重载实现类型安全**为 IDE 支持提供精确的返回类型

## 相关文档

要更深入地了解相关架构组件：

- **[类型系统](./typing-system.md)**：重载模式、TypedDict、泛型类型
- **[WebElement 域](./webelement-domain.md)**：WebElement 架构和交互方法
- **[选择器指南](./selectors-guide.md)**：CSS vs XPath 语法和最佳实践
- **[Tab 域](./tab-domain.md)**：Tab 级操作和上下文管理

有关实际使用模式：

- **[元素查找指南](../features/automation/element-finding.md)**：实际示例和模式
- **[类人交互](../features/automation/human-interactions.md)**：真实的元素交互


================================================
FILE: docs/zh/deep-dive/architecture/index.md
================================================
# 内部架构

**理解设计，然后有意识地打破规则。**

大多数文档向你展示框架**做什么**。本节揭示 Pydoll **如何**以及**为什么**以这种方式构建：塑造每一行代码的设计模式、架构决策和权衡。

## 为什么架构很重要

你可以在不理解其内部架构的情况下有效地使用 Pydoll。但当你需要：

- **调试**跨多个组件的复杂问题
- **优化**大规模自动化中的性能瓶颈
- **扩展** Pydoll 的自定义功能
- **贡献**对代码库的改进
- **构建**针对不同用例的类似工具

...架构知识变得**不可或缺**。

!!! quote "架构即语言"
    **"建筑是凝固的音乐。"** - 约翰·沃尔夫冈·冯·歌德
    
    良好的架构不仅仅是让代码工作，更是让代码**可理解**、**可维护**和**可扩展**。理解 Pydoll 的架构将教会你适用于每个项目的模式。

## 六大架构域

Pydoll 的架构组织为**六个内聚域**，每个域都有明确的职责和接口：

### 1. 浏览器域
**[→ 探索浏览器架构](./browser-domain.md)**

**协调者：管理进程、上下文和全局状态。**

浏览器域位于层次结构的顶部，协调：

- **进程管理**：启动/终止浏览器可执行文件
- **浏览器上下文**：隔离环境（如隐私窗口）
- **标签页注册表**：Tab 实例的单例模式
- **代理认证**：通过 Fetch 域自动认证
- **全局操作**：下载、权限、窗口管理

**关键架构模式**：

- **抽象基类**，适用于 Chrome/Edge/其他 Chromium 浏览器
- **管理器模式**（ProcessManager、ProxyManager、TempDirManager）
- **单例注册表**用于 Tab 实例（防止重复）
- **上下文管理器协议**用于自动清理

**关键洞察**：浏览器不直接操作页面，它**协调**低级组件。这种关注点分离使多浏览器支持和并发标签操作成为可能。

---

### 2. 标签页域
**[→ 探索标签页架构](./tab-domain.md)**

**主力军：执行命令、管理状态、协调自动化。**

标签页域是 Pydoll 的主要接口，处理：

- **导航**：具有可配置等待状态的页面加载
- **元素查找**：委托给 FindElementsMixin
- **JavaScript 执行**：页面和元素上下文
- **事件协调**：特定于标签页的事件监听器
- **网络监控**：请求/响应捕获和分析
- **IFrame 处理**：嵌套上下文管理

**关键架构模式**：

- **外观模式**：简化的 CDP 复杂操作接口
- **混入组合**：FindElementsMixin 用于元素定位
- **每标签页 WebSocket**：并行的独立连接
- **状态标志**：跟踪启用的域（network_events_enabled 等）
- **延迟初始化**：首次访问时创建请求对象

**关键洞察**：每个 Tab 拥有自己的 **ConnectionHandler**，实现跨标签的真正并行操作，无需竞争或状态泄漏。

---

### 3. WebElement 域
**[→ 探索 WebElement 架构](./webelement-domain.md)**

**交互器：连接 Python 代码和 DOM 元素。**

WebElement 域表示**单个 DOM 元素**，提供：

- **交互方法**：点击、输入、滚动、选择
- **属性访问**：文本、HTML、边界、属性
- **状态查询**：可见性、启用状态、值
- **截图**：特定于元素的图像捕获
- **子元素查找**：相对元素定位（也通过 FindElementsMixin）

**关键架构模式**：

- **代理模式**：表示远程浏览器元素的 Python 对象
- **对象 ID 抽象**：CDP 的 objectId 隐藏在 Python API 后面
- **混合属性**：同步（属性）vs 异步（动态状态）
- **命令模式**：交互方法包装 CDP 命令
- **回退策略**：多种方法提高鲁棒性

**关键洞察**：WebElement 维护**缓存的属性**（从创建时）和**动态状态**（按需获取），平衡性能与新鲜度。

---

### 4. FindElements 混入
**[→ 探索 FindElements 架构](./find-elements-mixin.md)**

**定位器：将选择器转换为 DOM 查询。**

FindElementsMixin 通过**组合**而非继承为 Tab 和 WebElement 提供元素查找功能：

- **基于属性的查找**：`find(id='submit', class_name='btn')`
- **基于表达式的查询**：`query('div.container > p')`
- **策略解析**：针对单个或多个属性的最优选择器
- **等待机制**：具有可配置超时的轮询
- **上下文检测**：文档 vs 元素相对搜索

**关键架构模式**：
- **混入模式**：无需继承层次结构的共享功能
- **策略模式**：基于输入的不同选择器策略
- **模板方法**：通用流程，特定于策略的实现
- **工厂函数**：延迟导入以避免循环依赖
- **重载模式**：类型安全的返回类型（WebElement vs list）

**关键洞察**：混入使用**鸭子类型**（`hasattr(self, '_object_id')`）来检测 Tab vs WebElement，实现代码重用而不紧密耦合。

---

### 5. 事件架构
**[→ 探索事件架构](./event-architecture.md)**

**调度器：将浏览器事件路由到 Python 回调。**

事件架构通过以下方式实现响应式自动化：

- **事件注册**：`on()` 方法订阅 CDP 事件
- **回调调度**：异步执行不阻塞
- **域管理**：显式启用/禁用以提高性能
- **临时回调**：首次调用后自动删除
- **多级作用域**：浏览器范围 vs 标签页特定事件

**关键架构模式**：

- **观察者模式**：订阅/通知事件驱动代码
- **注册表模式**：事件名称 → 回调列表映射
- **包装器模式**：自动包装同步回调以进行异步执行
- **清理协议**：标签页关闭时自动删除回调
- **作用域隔离**：每个标签页独立的事件上下文

**关键洞察**：事件是**推送式**的（浏览器通知 Python），而非轮询式，实现低延迟响应式自动化，无需忙等待。

---

### 6. 浏览器请求架构
**[→ 探索请求架构](./browser-requests-architecture.md)**

**混合体：具有浏览器会话状态的 HTTP 请求。**

浏览器请求系统连接 HTTP 和浏览器自动化：

- **会话连续性**：自动包含 Cookie 和认证
- **双重数据源**：JavaScript Fetch API + CDP 网络事件
- **完整元数据**：标头、Cookie、计时信息（其中部分无法通过 JavaScript 获取）
- **类 `requests` API**：具有浏览器能力的熟悉接口

**关键架构模式**：

- **混合执行**：JavaScript 获取主体，CDP 获取元数据
- **临时事件注册**：启用/捕获/禁用模式
- **延迟属性初始化**：首次使用时创建请求对象
- **适配器模式**：与浏览器 fetch 兼容的 Requests 接口

**关键洞察**：浏览器请求结合**两个信息源**（JavaScript 和 CDP 事件）。JavaScript 提供响应主体，CDP 提供 JavaScript 安全策略隐藏的标头和 Cookie。

---

## 架构原则

这六个域遵循一致的原则：

### 1. 关注点分离
每个域都有一个**单一、明确定义的职责**：

- Browser → 进程/上下文管理
- Tab → 命令执行和状态
- WebElement → 元素交互
- FindElements → 元素定位
- Events → 响应式调度
- Requests → 浏览器上下文中的 HTTP

**优势**：一个域的更改很少需要更改其他域。

### 2. 组合优于继承
Pydoll 使用以下方式而非深层继承层次结构：

- **混入**（Tab 和 WebElement 共享 FindElementsMixin）
- **管理器**（ProcessManager、ProxyManager、TempDirManager）
- **依赖注入**（ConnectionHandler 传递给组件）

**优势**：灵活的组件重用而不紧密耦合。

### 3. 默认异步
所有 I/O 操作都是 `async def` 并且必须 `await`：

- WebSocket 通信
- CDP 命令执行
- 事件回调调度
- 网络请求

**优势**：实现多个标签页的真正并发、并行操作和非阻塞 I/O。

### 4. 类型安全
每个公共 API 都有类型注解：

- 函数参数和返回类型
- 作为 `TypedDict` 的 CDP 响应
- 回调参数的事件类型
- 多态方法的重载

**优势**：IDE 自动完成、静态类型检查、自文档化代码。

### 5. 资源管理
上下文管理器确保清理：

- `async with Browser()` → 退出时关闭浏览器
- `async with tab.expect_file_chooser()` → 禁用拦截器
- `async with tab.expect_download()` → 清理临时文件

**优势**：自动资源清理，即使在异常情况下也能防止泄漏。

## 组件交互

理解域如何交互是关键：

```mermaid
graph TB
    User[你的 Python 代码]
    
    User --> Browser[浏览器域]
    User --> Tab[标签页域]
    User --> Element[WebElement 域]
    
    Browser --> ProcessMgr[进程管理器]
    Browser --> ContextMgr[上下文管理器]
    Browser --> TabRegistry[标签页注册表]
    
    Tab --> ConnHandler[连接处理器]
    Tab --> FindMixin[FindElements 混入]
    Tab --> EventSystem[事件系统]
    Tab --> RequestSystem[请求系统]
    
    Element --> ConnHandler2[连接处理器]
    Element --> FindMixin2[FindElements 混入]
    
    ConnHandler --> WebSocket[WebSocket 到 CDP]
    ConnHandler2 --> WebSocket
    EventSystem --> ConnHandler
    RequestSystem --> ConnHandler
    RequestSystem --> EventSystem
    
    WebSocket --> Chrome[Chrome 浏览器]
```

**关键交互**：

1. **Browser 创建 Tabs** → Tabs 存储在注册表中
2. **Tab 和 WebElement 都使用 FindElementsMixin** → 共享元素定位
3. **每个 Tab 拥有一个 ConnectionHandler** → 独立的 WebSocket 连接
4. **请求系统使用事件系统** → 网络事件捕获元数据
5. **所有组件都使用 ConnectionHandler** → 集中式 CDP 通信

## 先决条件

要充分受益于本节：

- **[核心基础](../fundamentals/cdp.md)** - 理解 CDP、异步和类型
- **Python 设计模式** - 熟悉常见模式
- **OOP 概念** - 类、继承、组合、接口
- **异步 Python** - 熟悉 `async def` 和 `await`  

**如果你还没有阅读基础知识**，请先从那里开始。架构建立在这些概念之上。

## 超越架构

掌握内部架构后，你将准备好：

- **贡献代码**：了解新功能的适配位置
- **性能优化**：识别瓶颈和低效率
- **自定义扩展**：基于 Pydoll 的模式构建
- **类似工具**：将这些模式应用于其他项目

## 设计哲学

良好的架构是**不可见的**，它不应该妨碍你。Pydoll 的架构优先考虑：

1. **简单性**：每个组件做好一件事
2. **一致性**：类似的操作有类似的模式
3. **明确性**：没有魔法，没有隐藏行为
4. **类型安全**：在设计时而非运行时捕获错误
5. **性能**：默认异步，无锁并行

这些不是任意选择，它们是几十年软件工程**经过实战检验的原则**。

---

## 准备好理解设计了吗？

从**[浏览器域](./browser-domain.md)**开始，了解进程管理和上下文隔离如何工作，然后按顺序浏览各个域。

**这是从使用到精通的转变。**

---

!!! success "完成架构学习后"
    一旦你理解了这些模式，你会在软件工程的各个地方看到它们，而不仅仅是 Pydoll。这些是应用于浏览器自动化的**通用模式**：
    
    - 外观模式（Tab 简化 CDP 复杂性）
    - 观察者模式（用于响应式代码的事件系统）
    - 混入模式（FindElementsMixin 用于代码重用）
    - 注册表模式（Browser 跟踪 Tab 实例）
    - 策略模式（FindElements 解析最优选择器）
    
    良好的架构是**永恒的知识**。


================================================
FILE: docs/zh/deep-dive/architecture/shadow-dom.md
================================================
# Shadow DOM 架构

Shadow DOM 是现代 Web 自动化中最具挑战性的方面之一。Shadow 树内的元素对常规 DOM 查询不可见，这打破了传统的自动化方法。本文档解释了 Shadow DOM 在浏览器层面的工作原理，为什么传统工具无法处理封闭的 shadow root，以及 Pydoll 如何通过直接的 CDP 访问绕过这些限制。

!!! info "实用指南"
    有关使用示例和快速入门模式，请参阅 [元素查找指南 — Shadow DOM 部分](../../features/element-finding.md#shadow-dom-支持)。

## 什么是 Shadow DOM？

Shadow DOM 是一项实现 **DOM 封装** 的 Web 标准。它允许组件拥有自己的隔离 DOM 树（"shadow 树"），附加到常规 DOM 元素（"shadow 宿主"）上。Shadow 树内的元素对主文档的查询是隐藏的。

```mermaid
graph TB
    subgraph "主 DOM（Light DOM）"
        Document["document"]
        Host["div#my-component\n(shadow 宿主)"]
        Other["p.normal-content"]
    end

    subgraph "Shadow 树（封装的）"
        SR["#shadow-root (open)"]
        Style["style"]
        Button["button.internal"]
        Input["input.private"]
    end

    Document --> Host
    Document --> Other
    Host -.->|"attachShadow()"| SR
    SR --> Style
    SR --> Button
    SR --> Input
```

### Shadow Root 模式

当组件通过 `attachShadow()` 创建 shadow root 时，它指定一个 **模式**：

| 模式 | JavaScript 访问 | CDP 访问 | 常见用途 |
|------|-----------------|----------|----------|
| `open` | `element.shadowRoot` 返回根节点 | 通过 `backendNodeId` 完全访问 | 自定义 Web 组件（Lit、Stencil） |
| `closed` | `element.shadowRoot` 返回 `null` | 通过 `backendNodeId` 完全访问 | 安全敏感组件、支付表单 |
| `user-agent` | 无法通过 JS 访问 | 有限访问 | 浏览器内部 UI（输入占位符、视频控件） |

这个区别至关重要：**JavaScript 级别的访问受模式限制，但 CDP 级别的访问不受限制。**

### 为什么传统自动化会失败

传统自动化工具依赖于在页面上下文中执行 JavaScript：

```javascript
// WebDriver / Selenium 方法
document.querySelector('#my-component')        // ✓ 找到宿主
document.querySelector('#my-component button') // ✗ 无法穿越 shadow 边界
element.shadowRoot                             // ✗ 对封闭根返回 null
```

Shadow 边界由浏览器的 JavaScript 引擎强制执行。任何通过执行 JavaScript 来查找元素的自动化工具都会遇到这道墙。这包括 Selenium、Playwright 的 `page.evaluate()`，以及任何在文档级别使用 `Runtime.evaluate()` 配合 `document.querySelector()` 的工具。

## Pydoll 如何绕过 Shadow 边界

Pydoll 的方法在 **JavaScript 之下** 的层级工作：Chrome DevTools Protocol。CDP 可以直接访问浏览器的内部 DOM 表示，完全忽略 shadow 模式限制。

### CDP 优势

```mermaid
sequenceDiagram
    participant User as 用户代码
    participant SR as ShadowRoot
    participant CH as ConnectionHandler
    participant CDP as Chrome CDP
    participant DOM as 浏览器 DOM

    User->>SR: shadow_root.query('.btn')
    SR->>SR: _get_find_element_command(object_id)
    SR->>CH: execute_command(Runtime.callFunctionOn)
    CH->>CDP: WebSocket 发送
    CDP->>DOM: 在 shadow root 对象上执行 querySelector
    DOM-->>CDP: 元素结果
    CDP-->>CH: 包含 objectId 的响应
    CH-->>SR: 元素数据
    SR-->>User: WebElement 实例
```

关键洞察在于 **shadow root 对象如何获取** 以及 **查询如何对其执行**：

1. **发现**：`DOM.describeNode` 配合 `pierce=true` 返回 shadow root 节点及其 `backendNodeId`，无论模式如何
2. **解析**：`DOM.resolveNode` 将 `backendNodeId` 转换为直接引用 shadow root 的 JavaScript `objectId`
3. **查询**：`Runtime.callFunctionOn` 在 shadow root 的 `objectId` 上执行 `this.querySelector()`；这之所以有效，是因为调用是在 **shadow root 对象本身** 上进行的，而不是从文档上下文

### 逐步解析：Shadow Root 访问

```mermaid
flowchart TD
    A["WebElement\n(shadow 宿主)"]
    B["shadowRoots[]\n包含 backendNodeId"]
    C["JavaScript objectId\n用于 shadow root"]
    D["ShadowRoot 实例"]
    E["WebElement\n(shadow 内部)"]

    A -->|"DOM.describeNode\ndepth=1, pierce=true"| B
    B -->|"DOM.resolveNode\nbackendNodeId"| C
    C -->|"创建 ShadowRoot\n使用 objectId"| D
    D -->|"find() / query()\n通过 callFunctionOn"| E
```

#### 步骤 1：描述宿主节点

```python
# Pydoll 发送此 CDP 命令：
{
    "method": "DOM.describeNode",
    "params": {
        "objectId": "<host-element-object-id>",
        "depth": 1,
        "pierce": true  # ← 这是关键标志
    }
}
```

`pierce` 参数告诉 CDP 在描述节点时穿越 shadow 边界。响应包含 shadow root 信息，无论 shadow root 的模式如何：

```json
{
    "result": {
        "node": {
            "nodeName": "DIV",
            "shadowRoots": [
                {
                    "nodeId": 0,
                    "backendNodeId": 5,
                    "shadowRootType": "closed",
                    "childNodeCount": 4
                }
            ]
        }
    }
}
```

!!! warning "nodeId 与 backendNodeId"
    当 DOM 域未显式启用时（这是 Pydoll 的默认设置以最小化开销），`nodeId` 始终为 `0`。`backendNodeId` 是稳定的、始终可用的标识符。Pydoll 专门使用 `backendNodeId` 进行 shadow root 解析，这就是为什么它不需要 `DOM.enable()` 就能工作。

#### 步骤 2：解析为 JavaScript 对象

```python
# 将 backendNodeId 转换为可用的 objectId：
{
    "method": "DOM.resolveNode",
    "params": {
        "backendNodeId": 5
    }
}
```

响应提供一个 `objectId`，即 JavaScript 对象空间中 shadow root 的句柄：

```json
{
    "result": {
        "object": {
            "objectId": "-2296764575741119861.1.3"
        }
    }
}
```

#### 步骤 3：在 Shadow Root 内查询

有了 shadow root 的 `objectId`，Pydoll 利用 `FindElementsMixin` 现有的相对搜索机制：

```python
# 当调用 ShadowRoot.query('.btn') 时：
{
    "method": "Runtime.callFunctionOn",
    "params": {
        "functionDeclaration": "function() { return this.querySelector(\".btn\"); }",
        "objectId": "-2296764575741119861.1.3"
    }
}
```

函数以 `this` 绑定到 shadow root 对象运行。由于 shadow root 原生实现了 `querySelector()` 和 `querySelectorAll()` 接口，CSS 选择器在 shadow 边界内自然工作。

## ShadowRoot 架构

### 设计决策：复用 FindElementsMixin

最关键的架构决策是让 `ShadowRoot` 继承 `FindElementsMixin`：

```python
class ShadowRoot(FindElementsMixin):
    def __init__(self, object_id, connection_handler, mode, host_element):
        self._object_id = object_id               # Shadow root CDP 引用
        self._connection_handler = connection_handler  # 用于 CDP 通信
        self._mode = mode                          # ShadowRootType 枚举
        self._host_element = host_element          # 返回宿主的引用
```

**为什么这能工作**：`FindElementsMixin._find_element()` 检查 `hasattr(self, '_object_id')`。当存在时，它使用 `RELATIVE_QUERY_SELECTOR`，即在引用的对象上调用 `this.querySelector()`。由于 shadow root 原生支持 `querySelector()`，使用 CSS 选择器的 `query()` 自动工作。`ShadowRoot` 上的 `_css_only = True` 标志会禁用 `find()` 和使用 XPath 的 `query()`，调用它们会抛出 `NotImplementedError`。

```python
# FindElementsMixin 中的这一行启用了 shadow root 搜索：
elif hasattr(self, '_object_id'):
    command = self._get_find_element_command(by, value, self._object_id)
```

这意味着 `ShadowRoot` 继承了 `query()` 和 `find_or_wait_element()`。但是，`_css_only = True` 标志将使用限制为仅使用 CSS 选择器的 `query()`；`find()` 和 XPath 会抛出 `NotImplementedError`。

!!! tip "架构一致性"
    这与 `WebElement.find()` 在元素子节点内搜索的机制相同：`_object_id` 属性表示"相对于我搜索"而不是"搜索整个文档"。`ShadowRoot`、`WebElement` 和 `Tab` 通过 `FindElementsMixin` 共享同一套元素查找机制（`ShadowRoot` 仅支持 CSS 选择器）。

### 类关系

| 类 | 有 `_object_id` | 有 `_connection_handler` | 查找范围 |
|----|:-:|:-:|---|
| `Tab` | 否 | 是 | 整个文档 |
| `WebElement` | 是 | 是 | 元素子树内 |
| `ShadowRoot` | 是 | 是 | Shadow 树内 |

三者都继承自 `FindElementsMixin`。`_object_id` 的存在与否决定搜索是文档全局的还是限定在特定节点。

### 解析 Shadow Root：backendNodeId 策略

Pydoll 故意使用 `backendNodeId` 而不是 `nodeId` 进行 shadow root 解析：

| 属性 | `nodeId` | `backendNodeId` |
|------|----------|-----------------|
| 需要 `DOM.enable()` | 是 | 否 |
| 跨 describe 调用稳定 | 否（DOM 未启用时为 0） | 是 |
| 适用于 shadow root 解析 | 仅在 DOM 启用时 | 始终 |
| 性能开销 | 较高（DOM 域跟踪） | 无 |

通过依赖 `backendNodeId`，Pydoll 避免了启用 DOM 域的开销，同时保持可靠的 shadow root 访问。这是一个务实的选择：大多数自动化场景不需要 DOM 域的事件流，启用它会增加内存和处理开销来跟踪每次 DOM 变更。

## 封闭的 Shadow Root：为什么 CDP 访问有效

这是最常被问到的问题：**如果 `element.shadowRoot` 在 JavaScript 中对封闭的 shadow root 返回 `null`，CDP 怎么能访问它们？**

答案在于理解浏览器的架构：

```mermaid
graph TB
    subgraph "JavaScript 运行时"
        JS["JavaScript 代码"]
        API["Web APIs\n(shadowRoot 属性)"]
    end

    subgraph "浏览器内部"
        CDP_Layer["CDP 协议层"]
        DOM_Internal["内部 DOM 树"]
    end

    JS -->|"element.shadowRoot"| API
    API -->|"mode == 'closed'\n→ 返回 null"| JS
    CDP_Layer -->|"DOM.describeNode\npierce=true"| DOM_Internal
    DOM_Internal -->|"始终返回\n完整 shadow 树"| CDP_Layer
```

**JavaScript 访问** 经过 Web API 层，该层强制执行 shadow 模式限制。当 `mode='closed'` 时，API 返回 `null`；这是对网页代码的有意访问控制边界。

**CDP 访问** 在 Web API 层之下运行。它直接与浏览器的内部 DOM 表示通信。`closed` 模式限制是 **JavaScript 级别的策略**，不是 **DOM 级别的限制**。Shadow 树仍然存在于 DOM 中；它只是对 JavaScript 的视图隐藏了。

!!! info "安全影响"
    这是 DevTools Protocol 的设计意图。CDP 面向需要完全 DOM 访问的调试和自动化工具。`closed` 模式保护 shadow 内容免受同一页面上其他脚本（如第三方脚本）的访问，而不是来自浏览器调试接口的访问。这与浏览器 DevTools 能够在 Elements 面板中检查封闭 shadow root 的原因相同。

### 实际验证

你可以自己验证这个行为：

```python
import asyncio
from pydoll.browser.chromium import Chrome
from pydoll.protocol.dom.types import ShadowRootType

async def verify_closed_access():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('about:blank')

        # 通过 JavaScript 创建封闭的 shadow root
        await tab.execute_script("""
            const host = document.createElement('div');
            host.id = 'test-host';
            document.body.appendChild(host);
            const shadow = host.attachShadow({ mode: 'closed' });
            shadow.innerHTML = '<p class="secret">隐藏内容</p>';
        """)

        # JavaScript 无法访问：
        result = await tab.execute_script(
            "return document.getElementById('test-host').shadowRoot",
            return_by_value=True,
        )
        js_value = result['result']['result'].get('value')
        print(f"JS shadowRoot: {js_value}")  # None

        # 但 Pydoll 可以：
        host = await tab.find(id='test-host')
        shadow = await host.get_shadow_root()
        print(f"Shadow 模式: {shadow.mode}")  # ShadowRootType.CLOSED

        secret = await shadow.query('.secret')
        text = await secret.text
        print(f"内容: {text}")  # "隐藏内容"

asyncio.run(verify_closed_access())
```

## 嵌套 Shadow Root

Web 组件经常组合其他 Web 组件，创建多级 shadow 树：

```mermaid
graph TB
    subgraph "Light DOM"
        Host1["outer-component\n(shadow 宿主)"]
    end

    subgraph "外部 Shadow 树"
        SR1["#shadow-root (open)"]
        Host2["inner-component\n(shadow 宿主)"]
        P1["p.outer-text"]
    end

    subgraph "内部 Shadow 树"
        SR2["#shadow-root (closed)"]
        Button["button.deep-btn"]
        P2["p.inner-text"]
    end

    Host1 -.-> SR1
    SR1 --> P1
    SR1 --> Host2
    Host2 -.-> SR2
    SR2 --> P2
    SR2 --> Button
```

Pydoll 通过链式 `get_shadow_root()` 调用自然处理这种情况。每个 `ShadowRoot` 产生的 `WebElement` 实例本身也可以有 shadow root：

```python
outer_host = await tab.find(tag_name='outer-component')
outer_shadow = await outer_host.get_shadow_root()        # open

inner_host = await outer_shadow.query('inner-component')
inner_shadow = await inner_host.get_shadow_root()        # closed，仍然有效

deep_button = await inner_shadow.query('.deep-btn')
await deep_button.click()
```

每个层级遵循相同的 CDP 解析流程：`describeNode` → `resolveNode` → 带有 `_object_id` 的 `ShadowRoot` → 通过 `callFunctionOn` 执行 `querySelector`。

## IFrame 内的 Shadow Root

一个常见的实际场景涉及跨域 iframe 内的 shadow root——例如 Cloudflare Turnstile 验证码。这结合了两种隔离机制：iframe 边界和 shadow 边界。

```mermaid
graph TB
    subgraph "主页面"
        Host["div.widget\n(shadow 宿主)"]
    end

    subgraph "Shadow 树"
        SR1["#shadow-root"]
        IFrame["iframe\n(跨域)"]
    end

    subgraph "IFrame (OOPIF)"
        Body["body"]
    end

    subgraph "IFrame Shadow 树"
        SR2["#shadow-root"]
        Button["label.checkbox"]
    end

    Host -.-> SR1
    SR1 --> IFrame
    IFrame -.->|"独立进程"| Body
    Body -.-> SR2
    SR2 --> Button
```

Pydoll 通过 **iframe 上下文传播** 透明地处理这种情况。当创建 `ShadowRoot` 时，它从宿主元素继承 iframe 路由上下文：

```python
# 完整链：主页面 → shadow root → iframe → shadow root → 元素
shadow_host = await tab.find(id='widget-container')
first_shadow = await shadow_host.get_shadow_root()

iframe = await first_shadow.query('iframe')
body = await iframe.find(tag_name='body')
second_shadow = await body.get_shadow_root()

# click() 正确工作——鼠标事件通过 OOPIF 会话路由
button = await second_shadow.query('label.checkbox')
await button.click()
```

### 上下文传播如何工作

跨域 iframe 在浏览器的独立进程中运行（Out-of-Process IFrame，即 OOPIF）。这些 iframe 的 CDP 命令必须通过专用的 `sessionId` 路由。Pydoll 自动在整个链中传播此路由上下文：

1. **IFrame 解析其上下文**：`iframe.find()` 建立包含 `session_id` 和 `session_handler` 的 `IFrameContext`
2. **子元素继承上下文**：在 iframe 内找到的元素接收 `IFrameContext`
3. **Shadow root 从宿主继承**：`ShadowRoot` 复制其宿主元素的 `_iframe_context`
4. **Shadow 内的元素从 shadow root 继承**：通过 `shadow.query()` 找到的元素接收传播的上下文
5. **命令正确路由**：`_execute_command()` 检测继承的上下文，并通过 OOPIF 会话路由 CDP 命令（包括 `click()` 的 `Input.dispatchMouseEvent`）

这意味着来自 `DOM.getBoxModel` 的坐标（相对于 iframe 视口）与发送到同一 OOPIF 会话的鼠标事件正确配对。

## 查找 Shadow Root：find_shadow_roots()

`Tab.find_shadow_roots()` 遍历整个 DOM 树以收集页面上找到的所有 shadow root。

### 工作原理

```
Tab.find_shadow_roots()
  ├─ DOM.getDocument(depth=-1, pierce=true)
  │   └─ 返回包含 shadowRoots 数组的完整 DOM 树
  ├─ 递归树遍历：_collect_shadow_roots_from_tree()
  │   ├─ 收集包含宿主 backendNodeId 的 shadowRoots 条目
  │   ├─ 递归遍历子节点
  │   └─ 遍历 contentDocument（同源 iframe）
  ├─ 对于每个 shadow root 条目：
  │   ├─ DOM.resolveNode(backendNodeId) → objectId
  │   └─ 解析宿主元素（尽力而为）
  └─ 返回 list[ShadowRoot] 包含宿主引用
```

### 超时：等待 Shadow Root

Shadow 宿主通常是异步注入的。`Tab.find_shadow_roots()` 接受 `timeout` 参数，每 0.5 秒轮询一次，直到找到至少一个 shadow root 或超时到期（抛出 `WaitElementTimeout`）。同样，`WebElement.get_shadow_root()` 也支持 `timeout` 来等待特定元素的 shadow root：

```python
# 等待最多 10 秒让 shadow root 出现
shadow_roots = await tab.find_shadow_roots(timeout=10)

# 等待特定元素的 shadow root
shadow = await element.get_shadow_root(timeout=5)
```

### 关键细节

- `DOM.getDocument` 中的 **`pierce=True`** 使浏览器在节点描述中包含 `shadowRoots` 数组，允许发现所有 shadow root 而无需逐个导航到每个宿主。
- **同源 iframe 内容** 通过 `contentDocument` 节点包含在树中。遍历会处理这些。
- 每个返回的 `ShadowRoot` 都有对其 `host_element` 的引用（通过 `DOM.resolveNode` 尽力解析）。

### 深度遍历：跨域 IFrame（OOPIF）

默认情况下，跨域 iframe（OOPIF）**不**包含在 DOM 树中——其内容存在于浏览器的独立进程中。传入 `deep=True` 以同时发现 OOPIF 内的 shadow root：

```python
shadow_roots = await tab.find_shadow_roots(deep=True, timeout=10)
```

当设置 `deep=True` 时，该方法执行额外步骤：

```
Tab.find_shadow_roots(deep=True)
  ├─ ...（如上所述的主文档遍历）...
  └─ _collect_oopif_shadow_roots()
      ├─ 浏览器级别的 ConnectionHandler（无 page_id → 浏览器端点）
      ├─ Target.getTargets() → 过滤 type='iframe'
      └─ 对于每个 iframe 目标：
          ├─ Target.attachToTarget(targetId, flatten=True) → sessionId
          ├─ DOM.getDocument(depth=-1, pierce=True) 带 sessionId
          ├─ _collect_shadow_roots_from_tree() 在 OOPIF DOM 上执行
          └─ 对于找到的每个 shadow root：
              ├─ DOM.resolveNode(backendNodeId) 带 sessionId
              ├─ 解析宿主元素（尽力而为）带 sessionId
              ├─ 创建 IFrameContext(frame_id, session_handler, session_id)
              └─ 在宿主元素上设置 IFrameContext（或直接在 ShadowRoot 上设置）
```

返回的 `ShadowRoot` 对象携带 OOPIF 路由上下文（`IFrameContext`），因此通过 `shadow_root.query()` 找到的元素会自动通过正确的 OOPIF 会话路由 CDP 命令。这对于 Cloudflare Turnstile 验证码等场景至关重要，其中复选框位于跨域 iframe 内的封闭 shadow root 中。

## 限制和边界情况

### Shadow Root 内的选择器策略

!!! warning "在 Shadow Root 内仅使用 query() 配合 CSS"
    `ShadowRoot` 设置了 `_css_only = True`，这意味着仅支持使用 CSS 选择器的 `query()`。`find()` 和使用 XPath 的 `query()` 会抛出 `NotImplementedError`。

Shadow root 原生实现了 `querySelector()` 和 `querySelectorAll()`，使 CSS 选择器成为自然且可靠的选择：

| 方法 | Shadow Root 内 | 说明 |
|------|:--:|---|
| `query('css选择器')` | 完全支持 | 推荐方法 |
| `query('css选择器', find_all=True)` | 完全支持 | 返回元素列表 |
| `find()` | 不支持 | 抛出 `NotImplementedError` |
| `query('//xpath')` | 不支持 | 抛出 `NotImplementedError` |

```python
shadow = await host.get_shadow_root()

# ✓ 推荐：query() 配合 CSS 选择器
button = await shadow.query('button.submit')
email = await shadow.query('#email-input')
items = await shadow.query('.item', find_all=True)

# ✗ 不支持：find() 和 XPath 抛出 NotImplementedError
# shadow.find(id='email-input')        # NotImplementedError
# shadow.query('//button')             # NotImplementedError
```

### XPath 无法穿越 Shadow 边界

从文档根开始的 XPath 表达式无法穿越 shadow 边界。这是 XPath 的根本限制，因为它在 Shadow DOM 出现之前就被设计了：

```python
# 无法找到 shadow 内容：文档级 XPath 无法穿越边界
element = await tab.find(xpath='//div[@id="host"]//button')
```

### User-Agent Shadow Root

浏览器内部的 shadow root（如 `<input>` 占位符样式、`<video>` 控件）类型为 `user-agent`。它们可以通过 CDP 访问，但其内部结构因浏览器版本而异，不属于任何 Web 标准。

```python
input_element = await tab.find(tag_name='input')
try:
    ua_shadow = await input_element.get_shadow_root()
    # ua_shadow.mode == ShadowRootType.USER_AGENT
    # 内部结构是浏览器特定的
except ShadowRootNotFound:
    pass  # 并非所有 input 都有 user-agent shadow root
```

!!! warning "User-Agent Shadow Root 稳定性"
    不要构建依赖 user-agent shadow root 内部结构的自动化逻辑。它们的 DOM 结构是实现细节，可能在浏览器版本之间无通知地更改。

### 过期的 Shadow Root 引用

如果宿主元素从 DOM 中移除后重新添加（在单页应用中很常见），shadow root 的 `objectId` 将变为过期。解决方案是重新获取 shadow root：

```python
# 页面导航或 DOM 重建后：
host = await tab.find(id='my-component', timeout=5)  # 重新查找宿主
shadow = await host.get_shadow_root()                 # 新的 shadow root
```

## 关键要点

- **Shadow DOM 封装** 隐藏元素不被文档级 `querySelector()` 发现，破坏传统自动化
- **CDP 在 JavaScript API 层之下运行**，完全绕过 shadow 模式限制
- **`backendNodeId`** 是用于 shadow root 解析的稳定标识符，避免了启用 DOM 域的需要
- **`ShadowRoot` 继承 `FindElementsMixin`**，带有 `_css_only = True`，仅支持使用 CSS 选择器的 `query()`；`find()` 和 XPath 抛出 `NotImplementedError`
- **封闭的 shadow root** 完全可访问，因为 `closed` 模式是 JavaScript 级别的策略，不是 DOM 级别的限制
- **嵌套 shadow root** 通过在每个层级链式调用 `get_shadow_root()` 自然工作
- **IFrame 内的 shadow root** 通过自动 iframe 上下文传播透明地工作
- **使用 CSS 选择器**（`query()`）在 shadow root 内查找元素；`find()` 和 XPath 不受支持
- **`find_shadow_roots()`** 发现页面上的所有 shadow root；支持 `timeout` 进行轮询和 `deep=True` 用于跨域 iframe（OOPIF）
- **`get_shadow_root(timeout)`** 等待特定元素的 shadow root 出现

## 相关文档

- **[元素查找指南](../../features/element-finding.md)**：`find()`、`query()` 和 shadow root 访问的实际用法
- **[IFrame 与上下文](../fundamentals/iframes-and-contexts.md)**：Pydoll 如何解析和路由命令到 iframe，包括 OOPIF 处理
- **[FindElements Mixin 架构](./find-elements-mixin.md)**：`_object_id` 机制如何实现作用域搜索
- **[WebElement 域](./webelement-domain.md)**：元素如何与 CDP 交互
- **[连接层](../fundamentals/connection-layer.md)**：与浏览器的 WebSocket 通信


================================================
FILE: docs/zh/deep-dive/architecture/tab-domain.md
================================================
# Tab 域架构

Tab 域是 Pydoll 浏览器自动化的主要接口，充当编排层，将多个 CDP 域集成到一个内聚的 API 中。本文档探讨其内部架构、设计模式以及塑造其行为的工程决策。

!!! info "实际用法"
    有关使用示例和实际模式，请参阅 [Tab 管理指南](../features/automation/tabs.md)。

## 架构概述

`Tab` 类充当 Chrome DevTools Protocol 的**外观**，将多域协调的复杂性抽象为统一的接口。

### 组件结构

| 组件 | 关系 | 目的 |
|-----------|-------------|---------|
| **Tab** | 核心类 | 主要自动化接口 |
| ↳ **ConnectionHandler** | 组合（拥有） | 与 CDP 的 WebSocket 通信 |
| ↳ **Browser** | 引用（父级） | 访问浏览器级别的状态和配置 |
| ↳ **FindElementsMixin** | 继承 | 元素定位能力 |
| ↳ **WebElement** | 工厂（创建） | 单个 DOM 元素表示 |

### CDP 域集成

`ConnectionHandler` 将 Tab 操作路由到多个 CDP 域：

```
Tab 方法                CDP 域            目的
━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━
go_to(), refresh()     →   Page            →  导航和生命周期
execute_script()       →   Runtime         →  JavaScript 执行
find(), query()        →   Runtime/DOM     →  元素定位
get_cookies()          →   Storage         →  会话状态
enable_network_events()→   Network         →  流量监控
enable_fetch_events()  →   Fetch           →  请求拦截
```

### 核心职责

1. **CDP 命令路由**：将高级操作转换为特定域的 CDP 命令
2. **状态管理**：跟踪启用的域、活动回调和会话状态
3. **事件协调**：将 CDP 事件桥接到用户定义的回调
4. **元素工厂**：从 CDP `objectId` 字符串创建 `WebElement` 实例
5. **生命周期管理**：处理清理和资源释放

## 组合与继承：FindElementsMixin

Tab 域中的一个关键架构决策是**从 `FindElementsMixin` 继承**而不是使用组合：

```python
class Tab(FindElementsMixin):
    def __init__(self, ...):
        self._connection_handler = ConnectionHandler(...)
        # Mixin 方法现在在 Tab 上可用
```

**为什么这里使用继承？**

| 方法 | 优点 | 缺点 | Pydoll 的选择 |
|----------|------|------|-----------------|
| **继承** | 简洁的 API（`tab.find()`）、类型兼容性 | 紧密耦合 | 使用 |
| 组合 | 松散耦合、灵活 | 冗长（`tab.finder.find()`）、包装器开销 | 未使用 |

**理由：** mixin 模式是合理的，因为：

- 元素查找是 **Tab 身份的核心**（每个标签页都可以查找元素）
- mixin 是**无状态的** - 它只需要 `_connection_handler`（通过鸭子类型的依赖注入）
- API 人体工程学很重要 - `tab.find()` 比 `tab.elements.find()` 更直观

详见 [FindElements Mixin 深入探讨](./find-elements-mixin.md) 的架构细节。

## 状态管理架构

Tab 类管理**多层状态**：

### 1. 域启用标志

```python
class Tab:
    def __init__(self, ...):
        self._page_events_enabled = False
        self._network_events_enabled = False
        self._fetch_events_enabled = False
        self._dom_events_enabled = False
        self._runtime_events_enabled = False
        self._intercept_file_chooser_dialog_enabled = False
```

**为什么使用显式标志？**

- **幂等性**：两次调用 `enable_page_events()` 不会重复注册
- **状态检查**：`tab.page_events_enabled` 等属性公开当前状态
- **清理跟踪**：知道在标签页关闭时需要禁用哪些域

**替代方案（未使用）：** 每次检查时查询 CDP 以获取启用的域 → 太慢，增加延迟。

### 2. 目标标识

```python
self._target_id: str              # 唯一的 CDP 标识符
self._browser_context_id: Optional[str]  # 隔离上下文
self._connection_port: int        # WebSocket 端口
```

**设计决策：** `target_id` 是**主要标识符**，而不是 Tab 实例本身。这使得：

- **浏览器级别的 Tab 注册表**：`Browser._tabs_opened[target_id] = tab`
- **单例模式**：相同的 `target_id` 始终返回相同的 `Tab` 实例
- **连接重用**：同一标签页上的多个操作共享 WebSocket

### 3. 特定功能状态

```python
self._cloudflare_captcha_callback_id: Optional[int] = None  # 用于清理
self._request: Optional[Request] = None  # 延迟初始化
```

**延迟初始化模式：** `Request` 仅在访问 `tab.request` 时创建：

```python
@property
def request(self) -> Request:
    if self._request is None:
        self._request = Request(self)
    return self._request
```

**为什么延迟？** 大多数自动化不使用浏览器上下文 HTTP 请求。节省内存和初始化时间。


## JavaScript 执行：双上下文架构

`execute_script()` 方法实现**上下文多态性** - 相同的接口，不同的 CDP 命令：

| 上下文 | CDP 方法 | 用例 |
|---------|-----------|----------|
| 全局（无元素） | `Runtime.evaluate` | `document.title`、全局脚本 |
| 元素绑定 | `Runtime.callFunctionOn` | 元素特定操作 |

**关键架构决策：** 基于 `element` 参数的存在自动检测执行模式，消除了单独的 API（`evaluate()` 与 `call_function_on()`）。

**脚本转换管道：**

1. 替换 `argument` → `this`（Selenium 兼容性）
2. 检测脚本是否已包装在 `function() { }` 中
3. 如果需要则包装：`script` → `function() { script }`
4. 路由到适当的 CDP 命令

**为什么使用 `argument` 关键字？** 为 Selenium 用户提供迁移路径，并保持他们熟悉的 API 用法。

!!! info "实际用法"
    有关真实世界的脚本执行模式，请参阅[类人交互](../features/automation/human-interactions.md)。

## 事件系统集成

Tab 充当 ConnectionHandler 事件系统的**薄包装器**，但添加了重要的一层：**非阻塞回调执行**。

```python
async def on(self, event_name: str, callback: Callable, temporary: bool = False) -> int:
    # 包装异步回调以在后台执行
    async def callback_wrapper(event):
        asyncio.create_task(callback(event))
    
    if asyncio.iscoroutinefunction(callback):
        function_to_register = callback_wrapper  # 非阻塞包装器
    else:
        function_to_register = callback  # 同步回调直接执行
    
    # 将注册委托给 ConnectionHandler
    return await self._connection_handler.register_callback(
        event_name, function_to_register, temporary
    )
```

**架构角色：** Tab 提供具有非阻塞执行语义的标签页作用域事件注册，而 ConnectionHandler 处理 WebSocket 管道和顺序回调调用。

**关键特性：**

- 通过 `asyncio.create_task()` 为异步回调提供**后台执行**（即发即忘）
- **同步/异步回调自动检测**
- **临时回调**用于一次性处理程序
- **回调 ID** 用于显式删除

**执行模型：**

| 层 | 行为 | 目的 |
|-------|----------|---------|
| **用户回调** | 在后台任务中运行 | 永远不会阻塞其他回调或 CDP 命令 |
| **Tab 包装器** | `create_task(callback())` | 启动后台任务，立即返回 |
| **EventsManager** | `await wrapper()` | 按顺序调用同一事件的包装器 |

**为什么需要包装器？** 没有它，一个慢速异步回调会阻塞同一事件的其他回调。`create_task` 包装器确保所有回调"同时"启动（在单独的任务中），防止一个慢速回调延迟其他回调。

!!! info "详细架构"
    有关内部事件路由机制和 EventsManager 的顺序调用模式，请参阅[事件架构深入探讨](./event-architecture.md)。
    
    **实际用法：** [事件系统指南](../features/advanced/event-system.md)

## 会话状态：Cookie 管理

**架构分离：** Cookie 路由到 **Storage 域**（操作），而不是 Network 域（观察）。

```python
async def set_cookies(self, cookies: list[CookieParam]):
    return await self._execute_command(
        StorageCommands.set_cookies(cookies, self._browser_context_id)
    )
```

**上下文感知设计：** `browser_context_id` 参数确保 cookie 隔离，实现多账户自动化。

!!! info "实际 Cookie 管理"
    有关使用模式和反检测策略，请参阅 [Cookie 与会话指南](../features/browser-management/cookies-sessions.md)。

## 内容捕获：CDP 目标限制

**关键限制：** `Page.captureScreenshot` 仅适用于**顶级目标**。Iframe 标签页静默失败（响应中没有 `data` 字段）。

```python
try:
    screenshot_data = response['result']['data']
except KeyError:
    raise TopLevelTargetRequired(...)  # 引导用户使用 WebElement.take_screenshot()
```

**设计影响：** 旧版本会为 iframe 创建独立的 Tab。现在 iframe 直接作为 `WebElement` 处理，因此需要在框架内的元素上执行操作，例如 `await (await iframe_element.find(...)).take_screenshot()`。

**PDF 生成：** `Page.printToPDF` 返回 base64 编码的数据。Pydoll 抽象文件 I/O，但底层数据始终是 base64（CDP 规范）。

!!! info "实际用法"
    有关参数、格式和真实世界示例，请参阅[屏幕截图和 PDF 指南](../features/automation/screenshots-and-pdfs.md)。

## 网络监控：有状态设计

**架构原则：** 网络方法需要**启用状态** - 运行时检查防止访问不存在的数据。

**存储分离：**

- **日志**：在 `ConnectionHandler` 中缓冲（接收所有 CDP 事件）
- **Tab**：查询处理程序，无重复存储
- **响应正文**：通过 `Network.getResponseBody(requestId)` 按需检索

**关键时序约束：** 响应正文必须在响应后**约 30 秒内**获取（浏览器垃圾回收）。

!!! info "实际网络监控"
    有关全面的事件跟踪和分析模式，请参阅[网络监控指南](../features/network/monitoring.md)。
    
    **请求拦截：** [请求拦截指南](../features/network/interception.md)

## 对话框管理：事件捕获模式

**关键 CDP 行为：** JavaScript 对话框**阻塞所有 CDP 命令**直到处理。

**架构解决方案：** `ConnectionHandler` 立即捕获 `Page.javascriptDialogOpening` 事件，防止自动化挂起。

```python
# 处理程序在用户代码运行之前存储对话框事件
self._connection_handler.dialog  # 由处理程序捕获
# Tab 查询存储的事件
async def has_dialog(self) -> bool:
    return bool(self._connection_handler.dialog)
```

**为什么选择这种设计？** 事件在用户回调执行之前触发。没有立即捕获，自动化将死锁等待被阻塞的 CDP 响应。

## IFrame 架构：Tab 重用模式

**关键洞察：** IFrame 是 **CDP 的一等目标** → 表示为 `Tab` 实例。

**目标解析算法：**

1. 从 iframe 元素提取 `src` 属性
2. 通过 `Target.getTargets()` 查询所有 CDP 目标
3. 将 iframe URL 匹配到目标 `targetId`
4. 检查单例注册表（`Browser._tabs_opened`）
5. 返回现有实例或创建 + 注册新 Tab

**设计权衡：** IFrame 标签页继承所有 Tab 方法，但有些会失败（例如 `take_screenshot()`）。替代方案（专用的 `IFrame` 类）将为最小的好处复制 90% 的 API。

!!! info "使用 IFrame"
    有关实际模式、嵌套框架和常见陷阱，请参阅 [IFrame 交互指南](../features/automation/iframes.md)。

## 上下文管理器：自动资源清理

**架构模式：** 状态恢复 + 乐观资源获取。

### 关键上下文管理器

| 管理器 | 模式 | 关键特性 |
|---------|---------|-------------|
| `expect_file_chooser()` | 状态恢复 | 退出后恢复域启用 |
| `expect_download()` | 临时资源 | 自动清理临时目录 |

**文件选择器设计：**

- 启用所需的域（`Page`、文件选择器拦截）
- 注册**临时回调**（首次触发后自动删除）
- 退出时恢复原始状态（如果之前禁用了域，则再次禁用）

**下载处理设计：**

- 创建临时目录（或使用提供的路径）
- 使用 `asyncio.Future` 进行协调（`will_begin_future`、`done_future`）
- 浏览器级别配置（下载是每个上下文的，而不是每个标签页的）
- 通过 `finally` 块保证清理

!!! info "实际文件操作"
    有关上传模式、文件选择器使用和下载处理，请参阅[文件操作指南](../features/automation/file-operations.md)。

## 生命周期：Tab 关闭和失效

**Tab 关闭级联：**

1. CDP 关闭浏览器标签页（`Page.close`）
2. Tab 从 `Browser._tabs_opened` 注销
3. WebSocket 自动关闭（CDP 目标已销毁）
4. 事件回调被垃圾回收

**关闭后行为：** Tab 实例变为**无效** - 进一步的操作失败（WebSocket 已关闭）。

**设计决策：** 没有显式的 `_closed` 标志。用户管理生命周期。替代方案（状态跟踪）为边际安全好处增加了开销。

## 关键架构决策

### 每个 Tab 的 WebSocket 策略

**选择的设计：** 每个 Tab 创建自己的 ConnectionHandler，具有到 `ws://localhost:port/devtools/page/{targetId}` 的专用 WebSocket 连接。

**理由：**

CDP 支持**两种连接模型**：

1. **浏览器级别**：到 `ws://localhost:port/devtools/browser/...` 的单个连接（由 Browser 实例使用）
2. **Tab 级别**：到 `ws://localhost:port/devtools/page/{targetId}` 的每个标签页连接（由 Tab 实例使用）

Pydoll 使用**两者**：

- **Browser** 有自己的 ConnectionHandler，用于浏览器范围的操作（上下文、下载、浏览器级别事件）
- **每个 Tab** 有自己的 ConnectionHandler，用于标签页特定的操作（导航、元素查找、标签页事件）

**每个标签页 WebSocket 的好处：**

- **真正的并行性**：多个标签页可以同时执行 CDP 命令而无需等待
- **独立的事件流**：每个标签页仅接收自己的事件（无需过滤）
- **隔离的故障**：一个标签页中的连接问题不会影响其他标签页
- **简化路由**：无需按 targetId 解复用消息

**权衡：** 更多打开的连接（每个标签页一个），但 CDP 和浏览器可以有效地处理这一点。对于 10 个标签页，这总共是 11 个连接（1 个浏览器 + 10 个标签页），与标签页本身创建的 HTTP 连接相比可以忽略不计。

!!! info "浏览器与 Tab 通信"
    有关浏览器级别 ConnectionHandler 以及 Browser/Tab 协调如何工作的详细信息，请参阅 [Browser 域架构](./browser-domain.md)。

### 浏览器引用的必要性

**为什么 Tab 存储 `_browser` 引用：**
- 上下文查询（cookie 的 `browser_context_id`）
- 浏览器级别操作（下载行为、iframe 注册表）
- 配置访问（`browser.options.page_load_state`）

### API 设计选择

| 选择 | 理由 |
|--------|-----------|
| **异步属性**（`current_url`、`page_source`） | 表明数据为实时获取，且每次访问都有 CDP 调用成本 |
| **单独的 `enable`/`disable` 方法** | 显式优于隐式，匹配 CDP 命名 |
| **无 `_closed` 标志** | 用户管理生命周期，减少开销 |
| **脚本中的 `argument` 关键字** | Selenium 兼容性，迁移路径 |

## 与其他域的关系

Tab 域位于 Pydoll 架构的**中心**：

```mermaid
graph TD
    Browser[Browser Domain<br/>Lifecycle & Process] -->|creates| Tab[Tab Domain<br/>Automation Interface]
    Tab -->|uses| ConnectionHandler[ConnectionHandler<br/>CDP Communication]
    Tab -->|creates| WebElement[WebElement Domain<br/>Element Interaction]
    Tab -->|inherits| FindMixin[FindElementsMixin<br/>Locator Strategies]
    Tab -->|uses| Commands[CDP Commands<br/>Typed Protocol]
    
    ConnectionHandler -->|dispatches| Events[Event System]
    Tab -.->|references| Browser
    WebElement -.->|references| ConnectionHandler
```

**关键关系：**

1. **Browser → Tab**：父子关系。Browser 管理 Tab 生命周期和共享状态。
2. **Tab → ConnectionHandler**：组合。Tab 委托 CDP 通信。
3. **Tab → WebElement**：工厂。Tab 从 `objectId` 字符串创建元素。
4. **Tab ← FindElementsMixin**：继承。Tab 获得元素定位方法。
5. **Tab ↔ Browser**：双向引用。Tab 查询浏览器以获取上下文信息。

## 总结：设计理念

Tab 域优先考虑 **API 人体工程学**和**正确性**而不是微优化：

- **外观模式**抽象 CDP 复杂性
- 通过显式标志进行**状态管理**，防止双重启用
- 通过上下文管理器进行**资源管理**
- 具有后台执行（非阻塞）的**事件协调**

**核心权衡：**

| 决策 | 好处 | 成本 | 判定 |
|----------|---------|------|---------|
| 每个标签页的 WebSocket | 真正的并行性 | 更多连接 | 合理 |
| 继承 FindElementsMixin | 简洁的 API | 紧密耦合 | 合理 |
| 延迟 Request 初始化 | 内存效率 | 属性开销 | 合理 |

## 进一步阅读

**实用指南：**

- [Tab 管理](../features/automation/tabs.md) - 多标签页模式、生命周期、并发
- [元素查找](../features/element-finding.md) - 选择器和 DOM 遍历
- [事件系统](../features/advanced/event-system.md) - 实时浏览器监控

**架构深入探讨：**

- [事件架构](./event-architecture.md) - WebSocket 管道和事件路由
- [FindElements Mixin](./find-elements-mixin.md) - 选择器解析算法
- [Browser 域](./browser-domain.md) - 进程管理和上下文


================================================
FILE: docs/zh/deep-dive/architecture/webelement-domain.md
================================================
# WebElement 域架构

WebElement 域通过 Chrome DevTools Protocol 在高级自动化代码和低级 DOM 交互之间架起桥梁。本文档探讨其内部架构、设计模式和工程决策。

!!! info "实际用法"
    有关使用示例和交互模式，请参阅：
    
    - [元素查找指南](../features/element-finding.md)
    - [类人交互](../features/automation/human-interactions.md)
    - [文件操作](../features/automation/file-operations.md)

## 架构概述

WebElement 通过 CDP 的 `objectId` 机制表示对 DOM 元素的**远程对象引用**：

```
用户代码 → WebElement → ConnectionHandler → CDP Runtime → 浏览器 DOM
```

**关键特性：**

- **异步设计**：所有操作都遵循 Python 的 async/await 模式
- **远程引用**：维护 CDP `objectId` 以引用浏览器端元素
- **Mixin 继承**：继承 `FindElementsMixin` 以进行子元素搜索
- **混合状态**：结合缓存属性和实时 DOM 查询

### 核心状态

```python
class WebElement(FindElementsMixin):
    def __init__(self, object_id: str, connection_handler: ConnectionHandler, ...):
        self._object_id = object_id              # CDP 远程对象引用
        self._connection_handler = connection_handler  # WebSocket 通信
        self._attributes: dict[str, str] = {}    # 缓存的 HTML 属性
        self._search_method = method             # 元素如何被找到（调试）
        self._selector = selector                # 原始选择器（调试）
```

**为什么缓存属性？** 初始元素定位返回 HTML 属性。缓存提供对常见属性（`id`、`class`、`tag_name`）的快速同步访问，无需额外的 CDP 调用。

## 设计模式

### 1. 命令模式

所有元素交互都转换为 CDP 命令：

| 用户操作 | CDP 域 | 命令 |
|----------------|-----------|---------|
| `element.click()` | Input | `Input.dispatchMouseEvent` |
| `element.text` | Runtime | `Runtime.callFunctionOn` |
| `element.bounds` | DOM | `DOM.getBoxModel` |
| `element.take_screenshot()` | Page | `Page.captureScreenshot` |

### 2. 桥接模式

WebElement 抽象 CDP 协议复杂性：

```python
async def click(self, x_offset=0, y_offset=0, hold_time=0.1):
    # 高级 API
    
    # → 转换为低级 CDP 命令：
    # 1. DOM.getBoxModel（获取位置）
    # 2. Input.dispatchMouseEvent（按下）
    # 3. Input.dispatchMouseEvent（释放）
```

### 3. 用于子搜索的 Mixin 继承

**为什么继承 FindElementsMixin？** 启用元素相对搜索：

```python
form = await tab.find(id='login-form')
username = await form.find(name='username')  # 在表单内搜索
```

**设计决策：** 组合（`form.finder.find()`）会更灵活但不太符合人体工程学。为了 API 简单性选择继承。

## 混合属性系统

**架构创新：** WebElement 结合同步和异步属性访问。

### 同步属性（缓存属性）

```python
@property
def id(self) -> str:
    return self._attributes.get('id')  # 来自缓存的 HTML 属性

@property  
def class_name(self) -> str:
    return self._attributes.get('class_name')  # 'class' → 'class_name'（Python 关键字）
```

**来源：** 来自 CDP 元素定位响应的扁平列表，在 `__init__` 期间解析。

### 异步属性（实时 DOM 状态）

```python
@property
async def text(self) -> str:
    outer_html = await self.inner_html  # CDP 调用
    soup = BeautifulSoup(outer_html, 'html.parser')
    return soup.get_text(strip=True)

@property
async def bounds(self) -> dict:
    response = await self._execute_command(DomCommands.get_box_model(self._object_id))
    # 解析并返回边界
```

**理由：** 文本和边界是**动态的** - 它们随着页面更新而变化。属性是**静态的** - 在定位时捕获。

| 属性类型 | 访问 | 来源 | 用例 |
|--------------|--------|--------|----------|
| 同步 | `element.id` | 缓存属性 | 快速访问、静态数据 |
| 异步 | `await element.text` | 实时 CDP 查询 | 当前状态、动态数据 |

## 点击实现：多阶段管道

点击操作遵循复杂的管道以确保可靠性：

### 1. 特殊元素检测

```python
async def click(self, x_offset=0, y_offset=0, hold_time=0.1):
    # 阶段 1：处理特殊元素
    if self._is_option_tag():
        return await self.click_option_tag()  # <option> 需要 JavaScript 选择
```

**为什么特殊处理？** `<select>` 内的 `<option>` 元素不响应鼠标事件。需要 JavaScript `selected = true`。

### 2. 可见性检查

```python
    # 阶段 2：验证元素是否可见
    if not await self.is_visible():
        raise ElementNotVisible()
```

**为什么检查？** CDP 鼠标事件以坐标（而非元素）为目标。隐藏的元素会在错误位置接收点击或静默失败。

### 3. 位置计算

```python
    # 阶段 3：滚动到视图并获取位置
    await self.scroll_into_view()
    bounds = await self.bounds
    
    # 阶段 4：计算点击坐标
    position_to_click = (
        bounds['x'] + bounds['width'] / 2 + x_offset,
        bounds['y'] + bounds['height'] / 2 + y_offset,
    )
```

**偏移支持：** 启用各种点击位置以实现类人行为（反检测）。

### 4. 鼠标事件分发

```python
    # 阶段 5：发送 CDP 鼠标事件
    await self._execute_command(InputCommands.mouse_press(*position_to_click))
    await asyncio.sleep(hold_time)  # 可配置的保持时间（默认 0.1 秒）
    await self._execute_command(InputCommands.mouse_release(*position_to_click))
```

**为什么两个命令？** 模拟真实的鼠标行为（按下 → 保持 → 释放）。一些网站会将瞬间完成的点击判定为机器人行为。

### 点击回退：JavaScript 替代方案

```python
async def click_using_js(self):
    """无法通过鼠标事件点击的元素的回退。"""
    await self.execute_script('this.click()')
```

**何时使用：**
- 隐藏元素（例如，使用 CSS 样式的文件输入）
- 叠加层后面的元素
- 性能关键场景（跳过可见性/位置检查）

!!! info "鼠标 vs JavaScript 点击"
    请参阅[类人交互](../features/automation/human-interactions.md)了解何时使用每种方法及检测影响。

## 截图架构：裁剪区域

**关键机制：** 带有 `clip` 参数的 `Page.captureScreenshot`。

```python
async def take_screenshot(self, path: str, quality: int = 100):
    # 1. 获取元素边界（位置 + 尺寸）
    bounds = await self.get_bounds_using_js()
    
    # 2. 创建裁剪区域
    clip = Viewport(x=bounds['x'], y=bounds['y'], 
                    width=bounds['width'], height=bounds['height'], scale=1)
    
    # 3. 仅捕获裁剪区域
    screenshot = await self._execute_command(
        PageCommands.capture_screenshot(format=ScreenshotFormat.JPEG, clip=clip, quality=quality)
    )
```

**为什么使用 JavaScript 边界？** `DOM.getBoxModel` 可能对某些元素失败。JavaScript `getBoundingClientRect()` 是更可靠的回退。

**格式限制：** 元素截图始终使用 JPEG（带裁剪区域的 CDP 限制）。

!!! info "截图功能"
    请参阅[截图和 PDF](../features/automation/screenshots-and-pdfs.md)了解整页与元素截图的比较。

## JavaScript 执行上下文

**关键 CDP 功能：** `Runtime.callFunctionOn(objectId, ...)` 在元素上下文中执行 JavaScript（`this` = 元素）。

```python
async def execute_script(self, script: str, return_by_value=False):
    return await self._execute_command(
        RuntimeCommands.call_function_on(self._object_id, script, return_by_value)
    )
```

**用例：**

- 可见性检查：`await element.is_visible()` → JavaScript 检查计算样式
- 样式操作：`await element.execute_script("this.style.border = '2px solid red'")`
- 属性访问：某些属性需要 JavaScript（例如，输入的 `value`）

**替代方案（未使用）：** 使用元素选择器执行全局脚本 → 较慢，有陈旧引用风险。

## 状态验证管道

**可靠性策略：** 在交互之前预先检查元素状态以防止失败。

| 检查 | 目的 | 实现 |
|-------|---------|----------------|
| `is_visible()` | 元素在视口中，未隐藏 | JavaScript：`offsetWidth > 0 && offsetHeight > 0` |
| `is_on_top()` | 没有叠加层阻挡元素 | JavaScript：`document.elementFromPoint(x, y) === this` |
| `is_interactable()` | 可见 + 在顶部 | 结合两项检查 |

**为什么使用 JavaScript 检查可见性？** CSS `display: none`、`visibility: hidden`、`opacity: 0` 都以不同方式影响可见性。JavaScript 提供统一检查。

## 性能策略

### 1. 特定于操作的优化

**原则：** 为每种操作类型选择最快的方法。

| 操作 | 主要方法 | 理由 |
|-----------|-----------------|-----------|
| 文本提取 | BeautifulSoup 解析 | 比 JavaScript `innerText` 更准确 |
| 可见性检查 | JavaScript | 单个 CDP 调用 vs 多个 DOM 查询 |
| 点击 | CDP 鼠标事件 | 最真实，反检测所需 |
| 边界 | `DOM.getBoxModel` | 比 JavaScript 快，有 JS 回退 |

### 2. 本地计算

**最小化 CDP 往返**，尽可能在本地计算：

```python
# 好：单次边界查询，本地计算
bounds = await element.bounds
click_x = bounds['x'] + bounds['width'] / 2 + offset_x
click_y = bounds['y'] + bounds['height'] / 2 + offset_y

# 不好：为简单数学进行多次 CDP 调用
click_x = await element.execute_script('return this.offsetLeft + this.offsetWidth / 2')
click_y = await element.execute_script('return this.offsetTop + this.offsetHeight / 2')
```

### 3. 缓存属性

**设计决策：** 在创建时缓存静态属性：

```python
# 快速同步访问（无 CDP 调用）
element_id = element.id
element_class = element.class_name
```

**权衡：** 属性不会反映运行时更改。对于动态属性，使用异步：`await element.text`。

## 关键架构决策

| 决策 | 理由 |
|----------|-----------|
| **继承 FindElementsMixin** | 启用子搜索，维护 API 一致性 |
| **混合同步/异步属性** | 平衡性能（同步）与新鲜度（异步）|
| **JavaScript 回退** | 关键操作的可靠性优于性能 |
| **特殊元素检测** | `<option>`、`<input type="file">` 需要独特处理 |
| **点击前可见性检查** | 清晰错误的快速失败 vs 静默失败 |

## 总结

WebElement 域通过以下方式在 Python 自动化代码和浏览器 DOM 之间架起桥梁：

- **远程对象引用**通过 CDP `objectId`
- **混合属性系统**平衡同步属性和异步状态
- **多阶段交互管道**确保可靠性
- **专门处理**不同类型的元素

**核心权衡：**

| 决策 | 收益 | 成本 | 结论 |
|----------|---------|------|---------|
| Mixin 继承 | 干净的 API | 紧耦合 | 合理 |
| 缓存属性 | 快速同步访问 | 陈旧数据风险 | 合理 |
| JavaScript 回退 | 可靠性 | 性能损失 | 合理 |
| 可见性预检查 | 清晰错误 | 额外的 CDP 调用 | 合理 |

## 进一步阅读

**实用指南：**

- [元素查找](../features/element-finding.md) - 定位元素、选择器
- [类人交互](../features/automation/human-interactions.md) - 点击、输入、真实性
- [文件操作](../features/automation/file-operations.md) - 文件上传和下载

**架构深入了解：**

- [FindElements Mixin](./find-elements-mixin.md) - 选择器解析管道
- [Tab 域](./tab-domain.md) - Tab 作为元素工厂
- [连接层](../fundamentals/connection-layer.md) - WebSocket 通信


================================================
FILE: docs/zh/deep-dive/fingerprinting/behavioral-fingerprinting.md
================================================
# 行为 Fingerprinting

行为 fingerprinting 分析的是用户与 Web 应用的交互方式，而非他们使用的工具。虽然网络和浏览器指纹可以通过设置正确的值来伪造，但人类行为遵循生物力学模式，难以令人信服地复制。检测系统收集鼠标移动、击键时间、滚动行为和交互序列，然后使用统计模型来区分人类和自动化。

本文档涵盖检测技术、背后的科学原理，以及 Pydoll 的人性化功能如何应对各个检测向量。

!!! info "模块导航"
    - [网络 Fingerprinting](./network-fingerprinting.md)：TCP/IP、TLS、HTTP/2 协议 fingerprinting
    - [浏览器 Fingerprinting](./browser-fingerprinting.md)：Canvas、WebGL、navigator 属性
    - [规避技术](./evasion-techniques.md)：实用对策

## 鼠标移动分析

鼠标移动是最强大的行为指标之一，因为人类的运动控制遵循生物力学定律，简单的自动化无法复制。检测系统收集 `mousemove` 事件（每个事件包含 x、y 坐标和时间戳），并分析轨迹的属性，以区分有机移动和程序化光标瞬移。

### Fitts's Law

Fitts's Law 描述将指针移动到目标所需的时间。Shannon 公式（MacKenzie, 1992）是使用最广泛的版本，表述如下：

```
T = a + b * log2(D/W + 1)
```

其中 `T` 是移动时间，`a` 是代表反应/启动时间的常数，`b` 是代表输入设备固有速度的常数，`D` 是到目标的距离，`W` 是目标的宽度（大小）。对数关系意味着距离加倍会增加固定的时间量，而目标大小减半也会增加相同的固定时间量。

这对机器人检测具有重要意义。人类到达小而远的目标需要更长时间，而到达大而近的目标则很快。他们在移动开始时加速，大约在路径中点达到峰值速度，并在接近目标时减速。如果机器人无论距离和目标大小如何都以恒定时间移动光标，就违反了 Fitts's Law，很容易被检测到。

检测系统测量每次点击事件的移动时间，根据距离和目标大小计算预期时间，并标记那些明显快于 Fitts's Law 预测或在距离/大小与移动时间之间没有相关性的移动。

### 轨迹形状

两点之间的人类手部移动不是直线。Abend、Bizzi 和 Morasso（1982）的研究表明，由于手臂关节和肌肉的生物力学约束，手部路径通常是弯曲的。Flash 和 Hogan（1985）证明，人类到达运动遵循最小 jerk 轨迹，即轨迹在移动持续时间内最小化 jerk（加速度的导数）的积分。由此产生的速度曲线呈钟形，其位置轨迹由五次（5 阶）多项式描述：

```
x(t) = x0 + (xf - x0) * (10t^3 - 15t^4 + 6t^5)
```

其中 `t` 是从 0 到 1 的归一化时间，`x0`/`xf` 是起始和终止位置。这会产生从静止开始的平滑加速、大约在路径中点的峰值速度，以及回到静止的平滑减速。

检测系统分析轨迹曲率、速度曲线和加速度模式。它们寻找的具体信号包括：

**直线检测。** 两点之间完全笔直的路径（每个采样点曲率为零）是最明显的机器人信号。由于手臂旋转关节的存在，人类路径总是有一定的曲率。

**恒定速度。** 人类表现出钟形速度曲线（加速、达到峰值、减速）。整个移动过程中恒定的速度表明是线性插值，这是大多数自动化工具的默认行为。

**缺少子移动。** 长距离移动由多个重叠的子移动组成（Meyer 等，1988），每个子移动都有自己的速度峰值。覆盖 500+ 像素但只有一个平滑速度峰值的移动是可疑的；该距离的真实移动通常会显示 2-4 个速度峰值。

**无 overshoot。** 人类经常会略微超过目标（5-15 像素），然后做一个小的校正回来。每次都精确命中目标的完美移动在统计上是不可能的。

### 移动熵

在这个语境中，熵衡量鼠标路径的不可预测性。检测系统将轨迹分成段，测量每个点的方向变化，并计算方向变化分布上的 Shannon 熵。直线的熵为零（每段指向相同方向）。随机游走的熵最大。人类移动具有中等到高的熵，反映了有意方向和非自主变异性的结合。

在一个会话中多次鼠标移动都表现出低熵是一个强烈的机器人信号，即使个别移动具有合理的曲率。

### Pydoll 的鼠标 humanize 功能

Pydoll 通过点击操作上的 `humanize=True` 参数实现了全面的鼠标人性化。启用后，鼠标模块会生成针对上述每个检测向量的移动：

路径遵循带有随机控制点的三次 Bezier 曲线，产生自然曲率而非直线。沿路径的速度遵循最小 jerk 曲线（`10t^3 - 15t^4 + 6t^5`），产生最小 jerk 模型所预测的钟形速度曲线。移动持续时间使用 Fitts's Law 和可配置常数（默认 `a=0.070`，`b=0.150`）计算。

通过向光标位置添加高斯噪声来模拟生理震颤，振幅与速度成反比（当手移动缓慢时震颤更明显，这与真实生理学一致）。overshoot 以 70% 的概率发生，超过目标总距离的 3-12%，然后进行校正移动。微停顿（15-40ms）以 3% 的概率在移动过程中发生，模拟短暂的犹豫。

```python
# 基本的 humanize 点击
await element.click(humanize=True)

# 也可以直接使用 Mouse 类获得更多控制
from pydoll.interactions.mouse import Mouse

mouse = Mouse(connection_handler)
await mouse.click(500, 300, humanize=True)
```

!!! note "Pydoll 目前未实现的功能"
    Pydoll 的鼠标人性化目前不会对非常长的距离建模子移动（路径是单个 Bezier 段）。对于大多数 Web 交互（距离在 500 像素以内），这已经足够了。极长的移动（全屏对角线穿越）可能会受益于未来的多段支持。

## 击键动态

击键动态分析键盘输入的时间模式。该技术可以追溯到 1850 年代的电报操作员，他们可以通过各自的莫尔斯电码"拳头"（特征性时间模式）来识别彼此。现代系统通过 `keydown` 和 `keyup` 事件以毫秒精度测量时间。

### 时间特征

两个基本测量是停留时间（单个按键 `keydown` 和 `keyup` 之间的持续时间，人类通常为 50-200ms）和飞行时间（释放一个键到按下下一个键之间的持续时间，通常为 80-400ms）。连续按键对的停留时间和飞行时间的组合称为二元组（digraph）延迟。

二元组延迟并不均匀。它们取决于键入的特定按键对（bigram），因为打字是一种运动技能，常见序列存储为程序记忆。关键的生物力学因素包括：

**双手交替。** 用双手交替输入的 bigram（如 "th"，在 QWERTY 键盘上 "t" 是左手，"h" 是右手）通常比同一只手输入的 bigram（如 "de"，两个键都在左手）更快。交替手可以在第一只手完成击键时就开始移动。

**手指距离。** 主行到主行的过渡最快。到达顶行或底行会增加与手指必须移动的物理距离成比例的时间。

**手指独立性。** 同一只手上的无名指和小指组合比食指和中指组合更慢，因为无名指和小指共享肌腱，独立运动控制能力较弱。

**频率效应。** 经常输入的 bigram（如英语中的 "th"、"er"、"in"）由于运动记忆而执行更快，与其物理布局无关。

### 检测信号

检测系统寻找几种将人类打字与自动化区分开的信号：

**零或恒定停留时间。** 许多自动化工具在 `keydown` 和 `keyup` 事件之间以零或接近零的延迟（低于 5ms）发送。真实的按键具有可测量的停留时间。所有按键的停留时间恒定同样可疑。

**均匀飞行时间。** 设置固定的击键间隔（如 `type_text("hello", interval=0.1)`）会产生完全规律的时间，非常容易被检测。人类的飞行时间因 bigram、疲劳和认知负荷而变化。

**无打字错误。** 在较长的文本输入（50+ 个字符）中，完全没有退格键或删除键的按下是不寻常的。人类的错误率大约为 1-5%，取决于打字熟练度和文本复杂度。

**超人速度。** 持续超过 150 WPM 的打字速度超出了除精英竞技打字员以外所有人的能力。比这更快发送字符的自动化工具会立即被标记。

### Pydoll 的键盘 humanize 功能

Pydoll 的 `type_text(humanize=True)` 通过可配置参数应对每个检测向量：

击键延迟从均匀分布中抽取（默认 30-120ms），而不是固定间隔。标点字符（`.!?;:,`）接收额外延迟（80-180ms），模拟打字者考虑句子结构时的停顿。思考停顿（300-700ms）以 2% 的概率发生，模拟短暂的思考时刻。分心停顿（500-1200ms）以 0.5% 的概率发生，模拟打字者看向别处或被短暂打断。

逼真的打字错误以大约每字符 2% 的概率发生，包含五种按其真实世界频率加权的不同错误类型：相邻键错误（55%，按下 QWERTY 键盘上的相邻键）、换位（20%，交换两个连续字符）、重复按键（12%，连续按两次键）、跳过字符（8%，在正确输入前犹豫）和遗漏空格（5%，忘记单词之间的空格）。每种错误类型包含逼真的恢复序列（停顿、退格、校正）和适当的时间。

```python
# Humanize 打字
await element.type_text("Hello, world!", humanize=True)

# 使用自定义时间配置
from pydoll.interactions.keyboard import Keyboard, TimingConfig, TypoConfig

config = TimingConfig(
    keystroke_min=0.04,
    keystroke_max=0.15,
    thinking_probability=0.03,
)
keyboard = Keyboard(connection_handler, timing_config=config)
await keyboard.type_text("Custom timing example", humanize=True)
```

!!! note "Pydoll 目前未实现的功能"
    Pydoll 的键盘人性化使用均匀随机延迟，而非基于 bigram 的时间。它不会建模每个按键的停留时间变化或双手交替速度差异。对于大多数自动化场景（表单填写、搜索查询），均匀变化足以通过行为检测。需要认证级别击键生物识别规避的应用需要自定义时间模型。

## 滚动行为分析

滚动 fingerprinting 分析用户如何在页面内容中进行垂直（和水平）导航。人类滚动和自动滚动之间的区别非常明显：程序化的 `window.scrollTo()` 调用产生即时的离散跳跃，而通过鼠标滚轮、触控板或触摸屏进行的人类滚动则产生一连串带有惯性和减速效果的小增量事件。

### 物理滚动特征

鼠标滚轮滚动产生带有一致 delta 值的离散 `wheel` 事件（通常每个凹槽 100 或 120 像素，取决于操作系统和浏览器）。事件以不规则的间隔到达，反映用户转动滚轮的速度。触控板滚动产生许多小事件，delta 值递减，模拟物理惯性。触摸滚动类似于触控板，但初始 delta 更大，减速尾部更长。

检测系统分析 delta 分布、事件间时间和减速曲线。`scrollTo(0, 5000)` 调用产生单次跳跃且没有中间事件，这与人类滚动产生的数百个增量事件根本不同。

### 检测信号

**即时滚动。** 使用 `window.scrollTo()` 或 `window.scrollBy()` 配合大值会产生零中间滚动事件。监听 `scroll` 事件的检测系统会看到滚动位置在单帧内发生变化。

**均匀 delta。** 以恒定 delta 值（例如始终 100 像素）发送 wheel 事件的程序化滚动模拟，缺少人类滚动中的自然变化：人类滚动的 delta 值由于手指压力不一致会波动 10-30%。

**无减速。** 人类滚动，尤其是在触控板上，有一个惯性阶段，在用户抬起手指后滚动继续，速度呈指数递减。突然停止的自动滚动缺少这个减速尾部。

**缺少方向变化。** 人类经常过度滚动然后略微回滚，或在页面中途暂停阅读内容。以恒定速度沿一个方向移动而没有暂停或反转的自动滚动是可疑的。

### Pydoll 的滚动 humanize 功能

Pydoll 的滚动模块通过 `scroll.by(position, distance, humanize=True)` 实现人性化滚动：

滚动遵循三次 Bezier 缓动曲线（默认控制点 `0.645, 0.045, 0.355, 1.0`），产生自然的加速和减速。每帧 ±3 像素的 jitter 为 delta 值添加变化。微停顿（20-50ms）以 5% 的概率发生，模拟短暂的阅读停顿。overshoot 以 15% 的概率发生，滚过目标 2-8% 然后校正回来。对于长距离，滚动被分解为多个"轻弹"手势（每次 100-1200 像素），模拟真实用户通过重复滑动而非单次连续动作来滚动长页面的方式。

```python
from pydoll.interactions.scroll import Scroll, ScrollPosition

scroll = Scroll(connection_handler)

# Humanize 向下滚动 800 像素
await scroll.by(ScrollPosition.Y, 800, humanize=True)

# 滚动到顶部/底部使用多次类人轻弹
await scroll.to_bottom(humanize=True)
```

## 其他检测向量

除了鼠标、键盘和滚动分析之外，复杂的检测系统还监控其他几种行为信号。

### 焦点和可见性

Page Visibility API（`document.visibilityState`）和焦点事件（`window.onfocus`、`window.onblur`）揭示用户是否在主动查看页面。真实用户的会话包括标签页切换、窗口最小化和不活动期。一个连续保持焦点数小时而没有一个 blur 事件的自动化脚本在行为上是异常的。同样，`document.hasFocus()` 在较长时间内持续返回 `true` 也是不寻常的。

### 空闲模式

真实用户有自然的空闲期：阅读内容、在行动前思考、被分心。检测系统测量交互之间空闲时间的分布。如果一个会话中每个动作都在前一个动作的 100-500ms 内发生，没有更长的停顿，这种模式在统计上与人类浏览有明显区别——人类浏览中动作之间 2-30 秒的空闲期是正常的。

### 事件序列完整性

浏览器为用户交互生成特定的事件序列。一次鼠标点击产生 `pointerdown`、`mousedown`、`pointerup`、`mouseup`、`click`，按此顺序，之前还有 `pointermove`/`mousemove` 事件显示光标正在接近点击目标。发送裸 `click` 事件而没有前置移动和指针事件的自动化工具可以通过事件序列分析被检测到。

Pydoll 基于 CDP 的事件发送生成完整的事件序列，因为它使用 Chrome 的输入模拟，产生与真实用户输入相同的事件链。

## 机器学习检测

现代反机器人系统（DataDome、Akamai Bot Manager、Cloudflare Bot Management、PerimeterX/HUMAN Security）不使用简单的阈值规则。它们在数百万真实用户会话和数百万已知机器人会话上训练机器学习模型，学习基于 50+ 个特征同时区分人类和自动化。

这些模型捕获难以列举为单独规则的统计属性：移动速度和曲率的联合分布、打字速度和错误率之间的相关性、滚动深度和阅读时间之间的关系，以及浏览会话的整体"节奏"。一个通过每项单独检查但在特征之间存在微妙错误相关性的系统，仍然可以被训练良好的模型标记。

实际意义在于，行为规避必须在所有交互类型之间保持一致，而不仅仅是单独看起来合理。Pydoll 的 `humanize=True` 参数提供了跨鼠标、键盘和滚动交互的连贯人性化层，但开发者仍然需要负责更高层面的行为合理性：在页面加载之间添加阅读延迟、变化多页工作流的节奏，以及包含自然的空闲期。

## 参考文献

- Fitts, P. M. (1954). The Information Capacity of the Human Motor System in Controlling the Amplitude of Movement. Journal of Experimental Psychology.
- MacKenzie, I. S. (1992). Fitts' Law as a Research and Design Tool in Human-Computer Interaction. Human-Computer Interaction.
- Flash, T., & Hogan, N. (1985). The Coordination of Arm Movements: An Experimentally Confirmed Mathematical Model. Journal of Neuroscience.
- Abend, W., Bizzi, E., & Morasso, P. (1982). Human Arm Trajectory Formation. Brain.
- Meyer, D. E., Abrams, R. A., Kornblum, S., Wright, C. E., & Smith, J. E. K. (1988). Optimality in Human Motor Performance. Psychological Review.
- Ahmed, A. A. E., & Traore, I. (2007). A New Biometric Technology Based on Mouse Dynamics. IEEE TDSC.


================================================
FILE: docs/zh/deep-dive/fingerprinting/browser-fingerprinting.md
================================================
# 浏览器 Fingerprinting

浏览器 fingerprinting 通过分析 JavaScript API、HTTP 标头和渲染引擎暴露的属性来识别客户端。与网络 fingerprinting 检查操作系统内核和 TLS 库的协议级信号不同，浏览器 fingerprinting 针对的是应用层：具体的浏览器、版本、配置以及运行它的硬件。这些信号可以通过标准 Web API 被任何网站访问，而足够多属性的组合往往能在数百万访客中创建出唯一的指纹。

!!! info "模块导航"
    - [网络 Fingerprinting](./network-fingerprinting.md): TCP/IP、TLS、HTTP/2 协议 fingerprinting
    - [行为 Fingerprinting](./behavioral-fingerprinting.md): 鼠标、键盘、滚动分析
    - [规避技术](./evasion-techniques.md): 实用对策

## JavaScript Navigator 属性

`navigator` 对象是浏览器 fingerprinting 数据最丰富的单一来源。它暴露了数十个属性，揭示了浏览器、其功能以及运行它的系统。检测系统会收集这些属性，将它们相互交叉比对并与 HTTP 标头进行对照，标记出不一致之处。

以下 JavaScript 收集了 fingerprinting 系统通常检查的核心属性集：

```javascript
const fingerprint = {
    // Identity
    userAgent: navigator.userAgent,
    platform: navigator.platform,
    vendor: navigator.vendor,

    // Language and locale
    language: navigator.language,
    languages: navigator.languages,

    // Hardware
    hardwareConcurrency: navigator.hardwareConcurrency,
    deviceMemory: navigator.deviceMemory,
    maxTouchPoints: navigator.maxTouchPoints,

    // Features
    cookieEnabled: navigator.cookieEnabled,
    doNotTrack: navigator.doNotTrack,
    webdriver: navigator.webdriver,

    // Screen
    screenWidth: screen.width,
    screenHeight: screen.height,
    colorDepth: screen.colorDepth,
    devicePixelRatio: window.devicePixelRatio,

    // Window chrome (toolbar, scrollbar dimensions)
    chromeHeight: window.outerHeight - window.innerHeight,
    chromeWidth: window.outerWidth - window.innerWidth,

    // Timezone
    timezone: Intl.DateTimeFormat().resolvedOptions().timeZone,
    timezoneOffset: new Date().getTimezoneOffset(),
};
```

其中一些属性值得单独关注，因为它们在 fingerprinting 中权重更高，或者更容易被自动化工具错误配置。

### 平台与 User-Agent 一致性

`navigator.platform` 属性返回一个字符串，如 `Win32`、`MacIntel` 或 `Linux x86_64`。检测系统会将其与 User-Agent 标头进行比较。如果 HTTP User-Agent 声称是 `Windows NT 10.0`，但 `navigator.platform` 返回 `Linux x86_64`，这种不匹配就是一个强烈的信号。这是自动化中最常见的错误之一：通过 `--user-agent=` 设置了自定义 User-Agent，却没有同时覆盖 platform。

### 硬件属性

`navigator.hardwareConcurrency` 返回逻辑 CPU 核心数。值为 1 或 2 通常意味着是最小化的虚拟机或容器，而非真实用户的机器。`navigator.deviceMemory` 以 GB 为单位报告大致的 RAM 容量（0.25、0.5、1、2、4、8）。此属性仅在 Chromium 浏览器中可用；Firefox 和 Safari 返回 `undefined`。这两个值应与声称的设备一致：User-Agent 声称是现代桌面设备，却报告 1 个核心和 0.5 GB RAM，这是可疑的。

### WebDriver 属性

当浏览器被基于 WebDriver 的自动化工具（Selenium、以 WebDriver 模式运行的 Playwright）控制时，`navigator.webdriver` 属性为 `true`。这是最明显的自动化指标。Pydoll 直接使用 CDP（Chrome DevTools Protocol），不会设置此标志。在 Pydoll 控制的浏览器中，`navigator.webdriver` 为 `undefined`，与正常用户会话的行为一致。

### 插件

`navigator.plugins` 属性在历史上是一个强力的 fingerprinting 向量，因为不同的浏览器和操作系统配置会暴露不同的插件列表。现代 Chromium 浏览器（Chrome 90+）无论实际插件状态如何，都返回固定的五个 PDF 相关插件：

```javascript
// Modern Chrome always returns these 5 plugins:
// 1. PDF Viewer
// 2. Chrome PDF Viewer
// 3. Chromium PDF Viewer
// 4. Microsoft Edge PDF Viewer
// 5. WebKit built-in PDF
console.log(navigator.plugins.length); // 5
```

一个常见的误解认为现代浏览器会为 `navigator.plugins` 返回空数组。这是不正确的。返回空数组本身就是一个检测信号，表明可能是 headless 模式或非浏览器 HTTP 客户端。

### 屏幕和窗口尺寸

`window.outerWidth`/`outerHeight` 与 `window.innerWidth`/`innerHeight` 之间的差异代表浏览器 chrome（工具栏、滚动条、窗口边框）。Headless 浏览器通常报告零差异，因为它们没有可见的 UI。检测系统会将 `outerWidth` 等于 `innerWidth` 的客户端标记为可能的 headless。同样，`screen.width` 与 `innerWidth` 完全匹配表明这是一个最大化的 headless 窗口，而非正常的桌面会话。

`devicePixelRatio` 因显示器而异：标准显示器报告 `1.0`，MacBook Retina 显示屏报告 `2.0`，智能手机报告 `2.0` 到 `3.0`。此值应与 User-Agent 中声称的设备一致。

## User-Agent Client Hints

现代 Chromium 浏览器（Chrome、Edge、Opera）通过 Client Hints 标头补充传统的 User-Agent 字符串：`Sec-CH-UA`、`Sec-CH-UA-Platform`、`Sec-CH-UA-Mobile`，以及（按需提供的）更高熵值如 `Sec-CH-UA-Full-Version-List`、`Sec-CH-UA-Arch` 和 `Sec-CH-UA-Bitness`。

```http
Sec-CH-UA: "Chromium";v="120", "Google Chrome";v="120", "Not:A-Brand";v="99"
Sec-CH-UA-Mobile: ?0
Sec-CH-UA-Platform: "Windows"
```

Client Hints 提供结构化的、机器可读的数据，更难被不一致地伪造。服务器可以将 `Sec-CH-UA-Platform` 标头与 `navigator.platform`、User-Agent 字符串以及 TCP/IP 指纹进行比较。这些层之间的任何不一致都是检测信号。

JavaScript 端的等价物是 `navigator.userAgentData`，它将 `brands`、`mobile` 和 `platform` 作为低熵值暴露，并通过 `getHighEntropyValues()` 提供详细的版本、架构和位宽信息：

```javascript
// Low-entropy (always available, no permission needed)
console.log(navigator.userAgentData.brands);
// [{brand: "Chromium", version: "120"}, {brand: "Google Chrome", version: "120"}, ...]
console.log(navigator.userAgentData.platform); // "Windows"
console.log(navigator.userAgentData.mobile);   // false

// High-entropy (requires promise, may require permission)
const highEntropy = await navigator.userAgentData.getHighEntropyValues([
    'architecture', 'bitness', 'platformVersion', 'uaFullVersion'
]);
// {architecture: "x86", bitness: "64", platformVersion: "15.0.0", ...}
```

!!! warning "浏览器支持"
    Client Hints 是 Chromium 独有的功能。Firefox 和 Safari 不会发送 `Sec-CH-UA` 标头，也不会暴露 `navigator.userAgentData`。如果 User-Agent 声称是 Firefox，但服务器收到了 Client Hints 标头，那么该客户端不是 Firefox。

## Canvas Fingerprinting

Canvas fingerprinting 利用了 HTML5 Canvas API 在不同 GPU、图形驱动、操作系统和浏览器组合下产生微妙不同像素输出的特性。这种差异来自字体光栅化（亚像素渲染、字体微调、抗锯齿）、GPU 特定的着色器执行、图形管线中的浮点精度，以及操作系统级别的文本渲染库（Windows 上的 DirectWrite、macOS 上的 Core Text、Linux 上的 FreeType）。

该技术在隐藏的 canvas 上绘制文本、形状和渐变，提取像素数据，然后进行哈希处理：

```javascript
function generateCanvasFingerprint() {
    const canvas = document.createElement('canvas');
    canvas.width = 220;
    canvas.height = 30;
    const ctx = canvas.getContext('2d');

    // Colored rectangle (exposes blending differences)
    ctx.fillStyle = '#f60';
    ctx.fillRect(125, 1, 62, 20);

    // Text with emoji (maximizes rendering variation)
    ctx.font = '14px Arial';
    ctx.textBaseline = 'alphabetic';
    ctx.fillStyle = '#069';
    ctx.fillText('Cwm fjordbank glyphs vext quiz, 😃', 2, 15);

    // Semi-transparent overlay (exposes alpha compositing differences)
    ctx.fillStyle = 'rgba(102, 204, 0, 0.7)';
    ctx.fillText('Cwm fjordbank glyphs vext quiz, 😃', 4, 17);

    return canvas.toDataURL();
}
```

全字母句 "Cwm fjordbank glyphs vext quiz" 之所以被选用，是因为它使用了不常见的字符组合，能够充分测试字体渲染。表情符号增加了另一个维度，因为表情符号渲染在不同操作系统之间差异显著。半透明叠加测试了 alpha 合成，这在不同 GPU 实现之间也有所不同。

Canvas fingerprinting 能有效区分大类设备，但其唯一性有时被夸大了。Laperdrix 等人（2016）的研究发现，仅靠 canvas 指纹只能提供中等程度的区分能力，其真正价值在于与其他信号（WebGL、navigator 属性、时区）结合使用以实现高唯一性。

!!! note "Canvas 噪声注入"
    一些隐私工具会向 canvas 输出注入随机噪声以干扰 fingerprinting。检测系统通过在同一会话中多次请求 canvas 指纹来应对。如果哈希值在请求之间发生变化，则说明存在噪声注入，而这本身就是一个检测信号。因此，随机化 canvas 输出适得其反：它既不能防止识别，又暴露了反 fingerprinting 工具的使用。

由于 Pydoll 控制的是一个具有真实 GPU 渲染的 Chrome 实例，canvas 指纹是真实的，并且在多次读取之间保持一致。无需注入或伪造。

## WebGL Fingerprinting

WebGL fingerprinting 将 canvas fingerprinting 扩展到 3D 渲染管线。它更为强大，因为它直接暴露了难以伪造的硬件标识符。

最具辨识度的数据来自 `WEBGL_debug_renderer_info` 扩展，它揭示了 GPU 供应商和型号：

```javascript
function getWebGLFingerprint() {
    const canvas = document.createElement('canvas');
    const gl = canvas.getContext('webgl');
    if (!gl) return null;

    // GPU identification (most distinctive)
    const debugInfo = gl.getExtension('WEBGL_debug_renderer_info');
    const vendor = debugInfo
        ? gl.getParameter(debugInfo.UNMASKED_VENDOR_WEBGL)
        : gl.getParameter(gl.VENDOR);
    const renderer = debugInfo
        ? gl.getParameter(debugInfo.UNMASKED_RENDERER_WEBGL)
        : gl.getParameter(gl.RENDERER);

    return {
        vendor,    // e.g. "Google Inc. (NVIDIA)"
        renderer,  // e.g. "ANGLE (NVIDIA, NVIDIA GeForce RTX 3080 Direct3D11 vs_5_0 ps_5_0)"
        version: gl.getParameter(gl.VERSION),
        shadingLanguageVersion: gl.getParameter(gl.SHADING_LANGUAGE_VERSION),
        maxTextureSize: gl.getParameter(gl.MAX_TEXTURE_SIZE),
        extensions: gl.getSupportedExtensions(),
    };
}
```

renderer 字符串直接标明了 GPU 硬件。声称是移动设备的客户端却报告了桌面 GPU，这显然是不一致的。虚拟机通常报告软件渲染器如 "SwiftShader" 或 "llvmpipe"，这在真实用户中几乎不会出现。

除了元数据之外，WebGL 还可以渲染一个 3D 场景（例如一个渐变三角形）并对像素输出进行哈希，产生类似于 canvas fingerprinting 的渲染指纹，但针对的是 3D 管线。GPU 标识符、支持的扩展、参数限制（`MAX_TEXTURE_SIZE`、`MAX_VIEWPORT_DIMS`）和着色器精度格式的组合，创建了图形栈的详细指纹。

## AudioContext Fingerprinting

Web Audio API 通过处理音频并测量输出来生成指纹。标准技术是创建一个 `OscillatorNode`，将其路由通过一个 `DynamicsCompressorNode`，然后从 `AnalyserNode` 或 `OfflineAudioContext` 读取生成的音频采样。不同浏览器和操作系统音频栈在音频处理实现上的差异会产生不同的输出。

```javascript
function getAudioFingerprint() {
    const ctx = new OfflineAudioContext(1, 44100, 44100);
    const oscillator = ctx.createOscillator();
    oscillator.type = 'triangle';
    oscillator.frequency.setValueAtTime(10000, ctx.currentTime);

    const compressor = ctx.createDynamicsCompressor();
    compressor.threshold.setValueAtTime(-50, ctx.currentTime);
    compressor.knee.setValueAtTime(40, ctx.currentTime);
    compressor.ratio.setValueAtTime(12, ctx.currentTime);
    compressor.attack.setValueAtTime(0, ctx.currentTime);
    compressor.release.setValueAtTime(0.25, ctx.currentTime);

    oscillator.connect(compressor);
    compressor.connect(ctx.destination);
    oscillator.start(0);

    return ctx.startRendering().then(buffer => {
        const data = buffer.getChannelData(0);
        // Hash a subset of the audio samples
        let hash = 0;
        for (let i = 4500; i < 5000; i++) {
            hash += Math.abs(data[i]);
        }
        return hash;
    });
}
```

AudioContext fingerprinting 的部署范围不如 canvas 或 WebGL fingerprinting 广泛，但它为整体指纹增加了另一个维度。该信号对于区分同一操作系统上的不同浏览器特别有用，因为音频处理在不同浏览器引擎之间的差异比在不同操作系统版本之间更大。

## Battery Status API

Battery Status API（`navigator.getBattery()`）暴露了设备的电池电量、充电状态以及预估的充电/放电时间。这些值在会话持续期间创建了一个短暂但唯一的指纹。

此 API 仅在 Chromium 浏览器中可用。Firefox 在版本 52（2017 年）中出于隐私考虑将其移除，Safari 从未实现过。如果检测系统从声称是 Firefox 或 Safari 的客户端看到 Battery API 结果，就知道该客户端伪造了身份。

## HTTP 标头 Fingerprinting

除了 JavaScript API 之外，HTTP 标头提供了服务器在任何 JavaScript 执行之前就可见的 fingerprinting 信号。

### 标头顺序

浏览器以一致的、特定于版本的顺序发送 HTTP 标头。Chrome 将 `Sec-CH-UA` 标头放在较前的位置，位于 `User-Agent` 之前。Firefox 以 `User-Agent` 开头，随后是 `Accept` 和 `Accept-Language`。自动化 HTTP 库如 Python 的 `requests` 或 `httpx` 以另一种顺序发送标头，通常以 `Host` 和 `Connection` 开头。

检测系统记录前 10-15 个标头的顺序，并与已知的浏览器签名进行比较。即使所有单独的标头值都正确，以错误的顺序发送也会暴露该请求不是由所声称的浏览器生成的。由于 Pydoll 控制的是真实的 Chrome 实例，标头顺序是真实的。

### Accept-Encoding

现代浏览器除了 `gzip` 和 `deflate` 之外还支持 Brotli 压缩（`br`）。Chrome 还支持 `zstd`。现代 Chrome 的 `Accept-Encoding` 类似于 `gzip, deflate, br, zstd`。声称是 Chrome 但缺少 Brotli 的客户端要么是过时的，要么是自动化的。

### Accept-Language 一致性

`Accept-Language` 标头应与 `navigator.language`、`navigator.languages`、时区以及 IP 地理位置保持一致。来自东京 IP、时区为 `Asia/Tokyo` 的请求带有 `Accept-Language: en-US`，对于旅行者来说是合理的，但与其他信号结合时就显得可疑。来自中国数据中心 IP、带有 `Accept-Language: zh-CN` 和时区 `America/New_York` 的请求则是强烈的代理指标。

## 对 Pydoll 的影响

由于 Pydoll 通过 CDP 驱动真实的 Chromium 浏览器，所有浏览器级别的指纹默认都是真实的。Canvas、WebGL 和 AudioContext 指纹来自实际的 GPU 和音频硬件。Navigator 属性、插件和屏幕尺寸反映了真实的浏览器状态。HTTP 标头（包括其顺序）由 Chrome 的网络栈生成。

自动化中的主要风险是各层之间的不一致。设置自定义 User-Agent 而不同步相关属性会创建容易被检测到的不匹配。Pydoll 会自动处理这个问题：当它检测到浏览器参数中的 `--user-agent=` 时，会使用 `Emulation.setUserAgentOverride` 在所有层同步 User-Agent 字符串、平台和完整的 Client Hints 元数据。它还通过 `Page.addScriptToEvaluateOnNewDocument` 注入 `navigator.vendor` 和 `navigator.appVersion` 覆盖，以确保新打开的标签页中的一致性。

对于时区和地理位置一致性（以匹配代理 IP 的位置），JavaScript 覆盖可以设置 `Intl.DateTimeFormat().resolvedOptions().timeZone` 和 `Date.prototype.getTimezoneOffset`。`--lang` 标志和 `set_accept_languages()` 配置语言标头。`webrtc_leak_protection` 选项可防止 WebRTC 暴露代理背后的真实 IP。

总体原则是，Pydoll 提供真实的浏览器指纹作为基线，开发者只需确保可配置的层（User-Agent、时区、语言、地理位置）彼此一致，并与代理的特征相匹配。

## 参考文献

- Laperdrix, P., Rudametkin, W., & Baudry, B. (2016). Beauty and the Beast: Diverting Modern Web Browsers to Build Unique Browser Fingerprints. IEEE S&P.
- Mowery, K., & Shacham, H. (2012). Pixel Perfect: Fingerprinting Canvas in HTML5. USENIX Security.
- Eckersley, P. (2010). How Unique Is Your Web Browser? Privacy Enhancing Technologies Symposium.
- W3C Client Hints Infrastructure: https://wicg.github.io/client-hints-infrastructure/
- BrowserLeaks: https://browserleaks.com/
- CreepJS: https://abrahamjuliot.github.io/creepjs/


================================================
FILE: docs/zh/deep-dive/fingerprinting/evasion-techniques.md
================================================
# 规避技术

本文档介绍使用 Pydoll 规避 fingerprinting 检测的实用技术。前面几节分别描述了各层检测的工作原理：[网络 fingerprinting](./network-fingerprinting.md)（TCP/IP、TLS、HTTP/2）、[浏览器 fingerprinting](./browser-fingerprinting.md)（Canvas、WebGL、navigator 属性）以及[行为 fingerprinting](./behavioral-fingerprinting.md)（鼠标、键盘、滚动）。本节聚焦于反制措施。

核心原则是各层之间的一致性。通过了某一检测层却在另一层失败，仍然会被标记。住宅 IP 搭配不匹配的 TCP 指纹，或完美的浏览器指纹搭配机器人式的鼠标移动，都会被任何关联信号的系统捕获。

!!! info "模块导航"
    - [网络 Fingerprinting](./network-fingerprinting.md)：协议级识别
    - [浏览器 Fingerprinting](./browser-fingerprinting.md)：应用层检测
    - [行为 Fingerprinting](./behavioral-fingerprinting.md)：人类行为分析

## Pydoll 默认提供的能力

在配置任何东西之前，了解 Pydoll 通过 CDP 使用真实 Chrome 实例默认提供了什么非常有帮助。

**真实的网络指纹。** Chrome 的 TCP/IP 协议栈、TLS 实现（BoringSSL）和 HTTP/2 协议栈会产生真实的指纹。TLS ClientHello、HTTP/2 SETTINGS 帧、伪标头顺序和流优先级都与真实 Chrome 浏览器一致。以编程方式构造 HTTP 请求的工具（requests、httpx、curl）在这些层会产生非浏览器指纹。使用 Pydoll，这些默认就是真实的。

**真实的浏览器指纹。** Canvas、WebGL 和 AudioContext 指纹来自真实的 GPU 和音频硬件。Navigator 属性、插件（标准的 5 个 PDF 插件）和 MIME 类型反映真实的浏览器状态。这里无需任何配置。

**没有 `navigator.webdriver`。** Selenium、Playwright 和 Puppeteer 会将 `navigator.webdriver` 设置为 `true`。Pydoll 直接使用 CDP，不会设置此标志。该属性为 `undefined`，与正常用户会话一致。

**完整的事件序列。** 当 Pydoll 通过 CDP 的 Input 域分发输入事件时，Chrome 会生成完整的事件链（pointermove、pointerdown、mousedown、pointerup、mouseup、click），与真实用户输入完全一致。

## User-Agent 一致性

自动化中最常见的 fingerprinting 不一致是 HTTP `User-Agent` 标头、JavaScript 中的 `navigator.userAgent`、`navigator.platform` 以及 Client Hints 标头（`Sec-CH-UA`、`Sec-CH-UA-Platform`）之间的不匹配。仅将 `--user-agent=` 作为 Chrome 标志设置只会更改 User-Agent 字符串本身（HTTP 标头和 `navigator.userAgent`），而 `navigator.platform` 等其他 JavaScript 属性和 Client Hints 保持不变。

Pydoll 自动解决此问题。当它在浏览器参数中检测到 `--user-agent=` 时，会：

1. 解析 UA 字符串以提取浏览器名称、版本和操作系统。
2. 通过 CDP 调用 `Emulation.setUserAgentOverride`，包含完整的 `userAgent`、正确的 `platform` 值（例如 Windows 对应 `Win32`）以及完整的 `userAgentMetadata`（Client Hints 数据，包括 `Sec-CH-UA`、`Sec-CH-UA-Platform`、`Sec-CH-UA-Full-Version-List`）。
3. 通过 `Page.addScriptToEvaluateOnNewDocument` 注入 `navigator.vendor` 和 `navigator.appVersion` 覆盖，确保在新打开的标签页中也保持一致。

```python
from pydoll.browser.chromium import Chrome
from pydoll.browser.options import ChromiumOptions

options = ChromiumOptions()
options.add_argument(
    '--user-agent=Mozilla/5.0 (Windows NT 10.0; Win64; x64) '
    'AppleWebKit/537.36 (KHTML, like Gecko) '
    'Chrome/120.0.6099.109 Safari/537.36'
)

async with Chrome(options=options) as browser:
    tab = await browser.start()
    # 现在所有层都保持一致：
    # - HTTP User-Agent 标头
    # - navigator.userAgent / navigator.platform / navigator.appVersion
    # - Sec-CH-UA / Sec-CH-UA-Platform / Sec-CH-UA-Full-Version-List
    # - navigator.userAgentData.brands / .platform
    await tab.go_to('https://example.com')
```

此覆盖会自动应用于初始标签页、通过 `browser.new_tab()` 创建的新标签页，以及通过 `browser.get_opened_tabs()` 发现的所有标签页。

!!! note "支持的平台"
    UA 解析器支持 Chrome、Edge、Windows（NT 6.1 到 10.0）、macOS、Linux、Android、iOS 和 Chrome OS。它按照 Chromium 规范生成正确的 GREASE 品牌值。

## Timezone 和 Locale 一致性

使用 proxy 时，浏览器的 timezone 和语言应与 proxy IP 的地理位置匹配。一个定位到东京的 IP 配合 `America/New_York` 的浏览器 timezone 和 `Accept-Language: en-US` 是可被检测的不一致。

### 语言配置

语言通过 Chrome 标志和 Pydoll 的选项 API 配置：

```python
options = ChromiumOptions()
options.add_argument('--lang=ja-JP')
options.set_accept_languages('ja-JP,ja;q=0.9,en;q=0.8')
```

这会同时设置 `Accept-Language` HTTP 标头以及 `navigator.language` / `navigator.languages`。

### Timezone 覆盖

Pydoll 目前没有封装 CDP 的 `Emulation.setTimezoneOverride` 命令，因此 timezone 覆盖需要 JavaScript 注入。需要覆盖的关键 API 是 `Intl.DateTimeFormat().resolvedOptions().timeZone` 和 `Date.prototype.getTimezoneOffset()`：

```python
async def set_timezone(tab, timezone_id: str, offset_minutes: int):
    """
    通过 JavaScript 覆盖 timezone。

    Args:
        timezone_id: IANA timezone 名称（例如 'Asia/Tokyo'）
        offset_minutes: UTC 偏移量，以分钟为单位（例如 JST 为 -540）
    """
    script = f'''
        const _origDTF = Intl.DateTimeFormat;
        Intl.DateTimeFormat = function(...args) {{
            const opts = args[1] || {{}};
            opts.timeZone = '{timezone_id}';
            return new _origDTF(args[0], opts);
        }};
        Object.defineProperty(Intl.DateTimeFormat, 'prototype', {{
            value: _origDTF.prototype
        }});
        Date.prototype.getTimezoneOffset = function() {{ return {offset_minutes}; }};
    '''
    await tab.execute_script(script)
```

!!! warning "`execute_script` 与 `addScriptToEvaluateOnNewDocument`"
    `tab.execute_script()` 在当前页面上下文中运行 JavaScript。如果页面导航，覆盖就会丢失。对于需要在导航间持久保持的覆盖，请使用 CDP 的 `Page.addScriptToEvaluateOnNewDocument`，它会在每次新文档加载时、在任何页面 JavaScript 运行之前注入脚本。Pydoll 内部对 User-Agent 覆盖就使用了此方法。对于 timezone，你可以直接发送 CDP 命令：

    ```python
    await tab._connection_handler.execute_command(
        'Page.addScriptToEvaluateOnNewDocument',
        {'source': script}
    )
    ```

### Geolocation 覆盖

对于请求地理位置权限的网站，可以通过 JavaScript 覆盖 Geolocation API：

```python
async def set_geolocation(tab, latitude: float, longitude: float):
    script = f'''
        navigator.geolocation.getCurrentPosition = function(success) {{
            success({{
                coords: {{
                    latitude: {latitude}, longitude: {longitude},
                    accuracy: 1, altitude: null, altitudeAccuracy: null,
                    heading: null, speed: null
                }},
                timestamp: Date.now()
            }});
        }};
        navigator.geolocation.watchPosition = function(success) {{
            return navigator.geolocation.getCurrentPosition(success);
        }};
    '''
    await tab.execute_script(script)
```

## WebRTC 泄露防护

WebRTC 可以通过绕过 proxy 隧道的 STUN/TURN 服务器请求，暴露客户端的真实 IP 地址，即使使用了 proxy。Pydoll 提供了内置选项来防止这种情况：

```python
options = ChromiumOptions()
options.webrtc_leak_protection = True
# 添加：--force-webrtc-ip-handling-policy=disable_non_proxied_udp
```

这会强制 Chrome 将所有 WebRTC 流量通过 proxy 路由，防止 IP 泄露。在使用 proxy 进行隐蔽自动化时应始终启用此选项。

## 行为 humanize

Pydoll 通过 `humanize=True` 参数为鼠标、键盘和滚动实现了 humanize 交互。这些不是未来功能或手动变通方案，而是框架内置的功能。

### 鼠标

```python
# humanize 点击：贝塞尔曲线路径、Fitts 定律计时、
# 最小加加速度速度曲线、颤动、过冲 + 修正
await element.click(humanize=True)
```

当 `humanize=True` 传递给 WebElement 的 `click()` 时，Pydoll 会生成一条从当前光标位置到元素的完整鼠标移动路径，使用带有随机控制点的三次贝塞尔曲线。速度遵循最小加加速度曲线。会添加生理性颤动、过冲（70% 概率）和微暂停。移动持续时间根据 Fitts 定律基于距离和目标大小计算。详细参数描述请参见[行为 Fingerprinting](./behavioral-fingerprinting.md#pydolls-mouse-humanization)。

### 键盘

```python
# humanize 打字：可变延迟、逼真的错别字（约 2%）、
# 标点停顿、思考停顿、分心停顿
await element.type_text("Hello, world!", humanize=True)
```

humanize 打字使用可变的按键间延迟（30-120ms 均匀分布）、标点停顿、思考停顿（2% 概率）、分心停顿（0.5% 概率），以及具有五种不同错误类型和自然修正序列的逼真错别字。完整参数说明请参见[行为 Fingerprinting](./behavioral-fingerprinting.md#pydolls-keyboard-humanization)。

### 滚动

```python
from pydoll.interactions.scroll import Scroll, ScrollPosition

scroll = Scroll(connection_handler)
# humanize 滚动：贝塞尔缓动、抖动、微暂停、过冲
await scroll.by(ScrollPosition.Y, 800, humanize=True)
```

humanize 滚动使用贝塞尔缓动曲线、逐帧抖动（±3px）、微暂停（5% 概率）和过冲修正（15% 概率）。大距离会被拆分为多个"轻弹"手势。详情请参见[行为 Fingerprinting](./behavioral-fingerprinting.md#pydolls-scroll-humanization)。

## 请求拦截

Pydoll 通过 CDP 的 Fetch 域支持请求拦截，允许你在请求到达服务器之前修改标头、阻止请求或提供自定义响应：

```python
from pydoll.protocol.fetch.events import FetchEvent

async def handle_request(event):
    request_id = event['params']['requestId']
    request = event['params']['request']
    headers = request.get('headers', {})

    # 示例：确保声明了 Brotli 支持
    if 'Accept-Encoding' in headers and 'br' not in headers['Accept-Encoding']:
        headers['Accept-Encoding'] = 'gzip, deflate, br, zstd'

    header_list = [{'name': k, 'value': v} for k, v in headers.items()]
    await tab.continue_request(request_id=request_id, headers=header_list)

await tab.enable_fetch_events()
await tab.on(FetchEvent.REQUEST_PAUSED, handle_request)
```

实际上，使用 Pydoll 很少需要修改标头，因为 Chrome 本身就会生成正确的标头。请求拦截更适用于阻止追踪脚本、修改响应内容或调试。

## 浏览器偏好设置增强真实性

Chrome 存储的用户偏好设置可以被 fingerprinting 系统检查。一个全新的浏览器配置文件——没有历史记录、没有保存的偏好设置、一切都是默认值——看起来与已使用数周的配置文件不同。Pydoll 的 `browser_preferences` 选项允许你预填充这些设置：

```python
import time

options = ChromiumOptions()
options.browser_preferences = {
    'profile': {
        'created_by_version': '120.0.6099.130',
        'creation_time': str(time.time() - 90 * 86400),  # 90 天前
        'exit_type': 'Normal',
    },
    'profile.default_content_setting_values': {
        'cookies': 1,
        'images': 1,
        'javascript': 1,
        'notifications': 2,  # "询问"（真实的默认值）
    },
}
```

## 常见错误

### 随机化一切

从头生成随机指纹（随机 hardwareConcurrency、随机 deviceMemory、随机屏幕尺寸）会产生不可能的组合。真实设备有受约束的配置：4 核、8 GB RAM、1920x1080 屏幕、Windows 10 是一个合理的配置。17 核、0.5 GB RAM、3840x2160 屏幕、`navigator.platform: Linux armv7l` 则不是。请使用从真实浏览器捕获的配置文件，而不是随机生成。

### Canvas 噪声注入

向 Canvas 输出添加随机噪声来防止 fingerprinting 会适得其反。检测系统会多次请求指纹。如果哈希值在请求之间发生变化，噪声注入就会被检测到，这本身就是一个强烈的自动化信号。使用 Pydoll，Canvas 指纹是真实且一致的。不要去动它。

### 过时的 User-Agent

使用 6 个月以上的浏览器版本的 User-Agent 是可被检测的，因为该版本缺少当前发行版应有的功能和 Client Hints 值。User-Agent 字符串应保持在最近 2-3 个 Chrome 主要版本之内。

### 忽略会话级行为

即使有完美的指纹和 humanize 的交互，会话级行为仍然很重要。在 60 秒内加载 100 个页面、从不滚动、只点击按钮（从不点击链接）、以及在没有任何标签页切换或空闲期的情况下保持数小时的持续焦点，这些都是行为异常。在导航之间添加阅读延迟，变化多页面工作流的节奏，并包含自然的空闲期。

## 验证

在大规模部署自动化之前，使用以下工具验证你的指纹：

| 工具 | URL | 测试内容 |
|------|-----|----------|
| BrowserLeaks | https://browserleaks.com/ | Canvas、WebGL、字体、IP、WebRTC、HTTP/2 |
| CreepJS | https://abrahamjuliot.github.io/creepjs/ | 欺骗检测、一致性检查 |
| Fingerprint.com | https://fingerprint.com/demo/ | 商业级识别 |
| PixelScan | https://pixelscan.net/ | 机器人检测分析 |
| IPLeak | https://ipleak.net/ | WebRTC、DNS、IP 泄露 |

使用 Pydoll 的基本验证脚本：

```python
async def verify_fingerprint(tab):
    result = await tab.execute_script('''
        return {
            userAgent: navigator.userAgent,
            platform: navigator.platform,
            webdriver: navigator.webdriver,
            languages: navigator.languages,
            plugins: navigator.plugins.length,
            timezone: Intl.DateTimeFormat().resolvedOptions().timeZone,
            colorDepth: screen.colorDepth,
            deviceMemory: navigator.deviceMemory,
            hardwareConcurrency: navigator.hardwareConcurrency,
        };
    ''')
    fp = result['result']['result']['value']

    # 检查明显问题
    assert fp['webdriver'] is None, 'navigator.webdriver should be undefined'
    assert fp['plugins'] == 5, f'Expected 5 plugins, got {fp["plugins"]}'
    assert 'HeadlessChrome' not in fp['userAgent'], 'Headless detected in UA'
```

## 参考资料

- Chrome DevTools Protocol, Emulation Domain: https://chromedevtools.github.io/devtools-protocol/tot/Emulation/
- Chrome DevTools Protocol, Fetch Domain: https://chromedevtools.github.io/devtools-protocol/tot/Fetch/
- Chromium Source, Inspector Emulation Agent: https://source.chromium.org/chromium/chromium/src/+/main:third_party/blink/renderer/core/inspector/inspector_emulation_agent.cc


================================================
FILE: docs/zh/deep-dive/fingerprinting/index.md
================================================
# 浏览器与网络指纹

本模块涵盖浏览器和网络指纹，这是现代 Web 自动化和检测系统的关键方面。

指纹技术处于网络协议、密码学、浏览器内部原理和行为分析的交叉点。它包含了用于在会话间识别和跟踪设备、浏览器和用户，而不依赖于 Cookie 或 IP 地址等传统标识符的技术。

## 为何如此重要

浏览器与网站的每一次连接都会暴露多种特征，从网络数据包中 TCP 选项的精确顺序，到特定 GPU 的 canvas 渲染，再到 JavaScript 执行计时模式。单独来看，这些特征可能显得无害。但结合起来，它们会创建一个能够唯一识别设备或浏览器实例的指纹。

对于自动化工程师、机器人开发者和注重隐私的用户来说，理解指纹对于构建有效的检测规避系统和在技术层面理解跟踪机制的运作至关重要。

!!! danger "多层检测系统"
    现代反机器人系统跨越多个层面进行综合分析：
    
    - **网络层面**：TCP/IP 协议栈行为、TLS 握手模式、HTTP/2 设置
    - **浏览器层面**：Canvas 渲染、WebGL 供应商字符串、JavaScript 属性枚举
    - **行为层面**：鼠标移动熵、按键计时、滚动模式
    
    一个单一的不一致（例如 Chrome User-Agent 却带有 Firefox 的 TLS 指纹）就可能触发立即阻止。

## 模块范围与方法论

指纹技术的文档分散在多个来源中，其可访问性和可靠性各不相同：

- 学术论文（通常有付费墙且偏于理论）
- 浏览器源代码（数百万行代码需要分析）
- 安全研究人员的博客（技术性强但零散）
- 反机器人供应商的白皮书（以营销为中心，省略细节）
- 地下论坛（实用但不可靠）

本模块将这些知识集中、验证并组织成一个有凝聚力的技术指南。这里描述的每一种技术都经过了：

- **验证**：对照浏览器源代码和 RFCs
- **测试**：在真实的自动化场景中
- **引用**：附有权威参考资料
- **解释**：从基本原理到实现

## 模块结构

本模块分为四个渐进的部分，从网络基础到实用的规避技术：

### 1. 网络级指纹
**[网络指纹](./network-fingerprinting.md)**

涵盖在浏览器渲染开始之前，通过传输层和会话层的网络行为进行设备识别。

- **TCP/IP 指纹**：TTL、窗口大小、选项顺序
- **TLS 指纹**：JA3/JA4、密码套件、ALPN 协商
- **HTTP/2 指纹**：SETTINGS 帧、优先级模式
- **工具与技术**：p0f、Nmap、Scapy、tshark 分析

**技术意义**：网络指纹是最难伪造的，因为它们需要操作系统级别的修改。在 JavaScript 执行开始之前，这一层的不一致就会被检测到。

### 2. 浏览器级指纹
**[浏览器指纹](./browser-fingerprinting.md)**

在应用层检查通过 JavaScript API、渲染引擎和插件生态系统进行的浏览器识别。

- **Canvas & WebGL 指纹**：特定 GPU 的渲染伪影
- **音频指纹**：音频 API 输出的细微差异
- **字体枚举**：已安装字体揭示操作系统和区域设置
- **JavaScript 属性**：Navigator 对象、屏幕尺寸、时区
- **标头分析**：Accept-Language、User-Agent 一致性

**技术意义**：这一层占了大多数检测事件。即使网络级指纹正确，暴露的自动化属性（例如 `navigator.webdriver`）也会触发阻止。

### 3. 行为指纹
**[行为指纹](./behavioral-fingerprinting.md)**

分析用户交互模式，以区分人类行为和自动化系统。

- **鼠标移动分析**：轨迹曲率、速度分布、菲茨定律合规性
- **按键动力学**：打字节奏、停留时间、飞行时间、二元组模式
- **滚动模式**：动量、惯性、减速曲线
- **事件序列**：自然的交互顺序 (mousemove → click)、计时分析
- **机器学习**：在数十亿行为信号上训练的 ML 模型

**技术意义**：即使网络和浏览器指纹被正确伪造，行为分析也能检测到自动化。这一层尤其具有挑战性，因为它需要复制生物力学的人类行为模式。

### 4. 规避技术
**[规避技术](./evasion-techniques.md)**

使用 Pydoll 的 CDP 集成、JavaScript 覆盖和架构特性，实际实现指纹规避。

- **基于 CDP 的伪造**：时区、地理位置、设备指标
- **JavaScript 属性覆盖**：重新定义 navigator 对象、canvas 投毒
- **请求拦截**：强制标头一致性
- **行为模拟**：类人计时、熵注入
- **检测测试**：用于验证您的规避设置的工具

**技术意义**：本节演示了将指纹概念实际应用于真实自动化场景，整合了前面所有层次的技术。

## 谁应该阅读本文

### **如果您符合以下情况，您必须阅读本文：**
- 正在构建与受反机器人保护的网站进行交互的自动化
- 正在大规模开发抓取基础设施
- 正在实施保护隐私的浏览器自动化
- 正在出于攻击或防御目的研究机器人检测

### **如果您符合以下情况，这是高级材料：**
- 刚接触网络协议（从 [网络基础](../network/network-fundamentals.md) 开始）
- 不熟悉 CDP（请先阅读 [Chrome 开发者工具协议](../fundamentals/cdp.md)）
- 刚开始学习 Python 类型（请参阅 [类型系统](../fundamentals/typing-system.md)）

### **本文不是：**
- “银弹” 般的反检测解决方案（不存在这种东西）
- 关于网络抓取的法律建议（请咨询 [法律与道德](../network/proxy-legal.md)）
- 替代遵守 robots.txt 和速率限制的方案

## 技术理念

指纹防御 **不是要变得隐形**——而是要变得 **与合法流量无法区分**。这意味着：

1.  **一致性优于完美性**：一个配置完美的 Firefox 指纹胜过一个“完美”但不一致的 Chrome 指纹
2.  **整体方法**：您必须统一网络、浏览器和行为层面
3.  **持续适应**：指纹技术每月都在演变；这是一份动态文档

!!! tip "黄金法则"
    **每一层都必须讲述同一个故事。** 如果您的 TLS 指纹显示“Chrome 120”，您的 HTTP/2 设置必须匹配 Chrome 120，您的 User-Agent 必须显示 Chrome 120，并且您的 canvas 渲染必须产生 Chrome 120 的伪影。一个不匹配 = 被检测。

## 伦理考量

指纹知识是 **双重用途技术**：

- **防御性**：保护您的隐私免受侵入性跟踪
- **攻击性**：规避检测系统以实现自动化

我们相信您会 **负责任地、合乎道德地** 使用这些知识：

**推荐实践：**
- 尊重网站的服务条款
- 实施速率限制和友好的爬行模式
- 评估自动化是否必要
- 在适当的时候保持透明

**禁止用途：**
- 欺诈、账户滥用或非法活动
- 以侵略性的抓取压垮服务器
- 在不了解后果的情况下将这些知识武器化

## 准备好深入探索了吗？

指纹是一个复杂且技术性强的领域，需要系统性学习。在有检测系统的环境中，理解这些技术对于有效的 Web 自动化至关重要。

从 **[网络指纹](./network-fingerprinting.md)** 开始建立基础知识，继续学习 **[浏览器指纹](./browser-fingerprinting.md)** 以理解应用层，再通过 **[行为指纹](./behavioral-fingerprinting.md)** 了解交互模式分析，最后以 **[规避技术](./evasion-techniques.md)** 结束以进行实际部署。

---

!!! info "文档状态"
    本模块代表了结合学术论文、浏览器源代码、真实世界测试和社区知识的 **广泛研究**。每一项声明都经过引用和验证。如果您发现不准确之处或有更新，欢迎贡献。

## 进一步阅读

在深入之前，请考虑以下补充主题：

- **[代理架构](../network/http-proxies.md)**：网络级匿名基础
- **[浏览器偏好设置](../../features/configuration/browser-preferences.md)**：实用的指纹配置
- **[行为验证码绕过](../../features/advanced/behavioral-captcha-bypass.md)**：行为分析与规避

================================================
FILE: docs/zh/deep-dive/fingerprinting/network-fingerprinting.md
================================================
# Network Fingerprinting

Network fingerprinting 通过分析 TCP/IP 协议栈、TLS 握手和 HTTP/2 连接的特征来识别客户端。这些信号由操作系统内核和 TLS 库设定，而非浏览器的 JavaScript 环境，因此比浏览器层面的指纹更难伪造。代理或 VPN 可以更改你的 IP 地址，但无法改变你的 TCP 窗口大小、TLS cipher suite 列表或 HTTP/2 SETTINGS 帧。检测系统正是利用了这一差异。

!!! info "模块导航"
    - [Browser Fingerprinting](./browser-fingerprinting.md)：Canvas、WebGL、AudioContext
    - [Evasion Techniques](./evasion-techniques.md)：多层对抗措施

    有关协议基础知识，请参阅 [Network Fundamentals](../network/network-fundamentals.md)。有关代理检测的背景知识，请参阅 [Proxy Detection](../network/proxy-detection.md)。

## TCP/IP Fingerprinting

每个操作系统对 TCP/IP 协议栈的实现方式各不相同。发起 TCP 连接的 SYN 数据包携带了足够的信息来高置信度地识别操作系统：初始 TTL、TCP 窗口大小、最大报文段长度（MSS）以及 TCP 选项的顺序和选择。这些值均不受浏览器控制，它们全部来自内核。

### TTL (Time To Live)

初始 TTL 是最简单的操作系统标识符之一。Linux 和 macOS 将其设为 64，Windows 设为 128，网络设备（路由器、防火墙）通常使用 255。每经过一个路由器跳点，TTL 递减 1，因此一个到达时 TTL 为 118 的数据包很可能起始于 128（Windows），经过了 10 个跳点。

TTL 的 fingerprinting 价值在于将其与 User-Agent 进行交叉验证。如果浏览器声称是 Windows 上的 Chrome，但数据包到达时的 TTL 接近 64，那么该连接要么是通过 Linux 服务器代理的，要么 User-Agent 被伪造了。检测系统会将观察到的 TTL 向上取整到最近的已知初始值（64、128、255），然后与声称的操作系统进行比对。

当流量经过代理时，TTL 会被重置，因为代理的内核会生成一个新的 TCP 连接到目标。目标看到的是代理的 TTL，而不是你的。这就是为什么 TTL 不匹配是代理检测信号：User-Agent 声称是 Windows（TTL 128），但 TCP 指纹显示的是 Linux（TTL 64）。

### TCP 窗口大小和缩放

SYN 数据包中的初始 TCP 窗口大小因操作系统和内核版本而异。现代 Linux 内核（3.x 及更高版本）通常发送 29200 字节的初始窗口，即 `20 * MSS`（标准以太网的 MSS 为 1460）。某些较新的内核（5.x、6.x）根据配置和 `initcwnd` 设置可能使用 64240。Windows 10 和 11 通常发送 65535 并启用窗口缩放，但确切值取决于自动调优配置和补丁级别。macOS 也默认为 65535。

窗口缩放因子（一个 TCP 选项）将 16 位窗口大小字段进行乘法运算以支持更大的接收窗口。Linux 通常使用缩放因子 7（允许最大 8MB 的窗口），而 Windows 通常使用 8。结合基础窗口大小，缩放因子创建出比单独任何一个值都更精细的指纹。

### TCP 选项顺序

SYN 数据包中 TCP 选项的选择和排列顺序具有高度辨识度。每个操作系统按固定的、版本特定的顺序排列选项，且内核不将其作为可配置参数暴露。Linux 发送 `MSS, SACK_PERM, TIMESTAMP, NOP, WSCALE`。Windows 发送 `MSS, NOP, WSCALE, NOP, NOP, SACK_PERM`，并且在默认配置中明显省略了 TIMESTAMP 选项。macOS 发送 `MSS, NOP, WSCALE, NOP, NOP, TIMESTAMP, SACK_PERM`。

特定选项的有无与顺序同样重要。Windows 历史上省略了 TCP 时间戳，而 Linux 和 macOS 默认包含它。所有现代系统都支持 SACK（选择性确认），但某些旧版或嵌入式系统可能不会通告它。哪些选项出现以及它们的顺序组合起来形成一个签名，p0f 等工具会将其与已知操作系统指纹数据库进行匹配。

### p0f

[p0f](https://lcamtuf.coredump.cx/p0f3/) 是被动 TCP/IP fingerprinting 的标准工具。它在不生成任何数据包的情况下观察流量，分析 SYN 和 SYN+ACK 数据包并与签名数据库进行比对。其签名格式编码了关键的 fingerprinting 字段：

```
version:ittl:olen:mss:wsize,scale:olayout:quirks:pclass
```

`ittl` 是推断的初始 TTL，`mss` 是最大报文段长度，`wsize,scale` 是窗口大小（可以是绝对值，也可以是相对于 MSS 的值，如 `mss*20`），`olayout` 是使用简写名称（`mss`、`nop`、`ws`、`sok`、`sack`、`ts`、`eol+N`）表示的 TCP 选项布局。`quirks` 字段捕获异常行为，如 Don't Fragment 标志（`df`）或 DF 数据包上的非零 IP ID（`id+`）。

典型的 Linux 4.x+ 签名在 p0f 中看起来像 `4:64:0:*:mss*20,7:mss,sok,ts,nop,ws:df,id+:0`。Windows 10 的签名可能看起来像 `4:128:0:*:65535,8:mss,nop,ws,nop,nop,sok:df,id+:0`。反机器人服务在内部维护类似的数据库，将传入连接与已知操作系统配置文件进行匹配，并标记与声明的 User-Agent 不一致的情况。

## TLS Fingerprinting

TLS ClientHello 消息在加密建立之前传输，因此对网络路径上的任何观察者都是可见的。它包含 TLS 版本、支持的 cipher suites、TLS 扩展、支持的椭圆曲线（命名组）和 EC 点格式。每个浏览器和 TLS 库都会产生这些字段的特征组合。

### JA3

JA3 由 Salesforce 的 John Althouse、Jeff Atkinson 和 Josh Atkins 开发，是第一个被广泛采用的 TLS fingerprinting 方法。它将 ClientHello 中的五个字段（TLS 版本、cipher suites、扩展、椭圆曲线、EC 点格式）连接起来，每个字段内的值用连字符连接，五个字段之间用逗号分隔，然后对结果字符串取 MD5 哈希。

```
JA3 string: 771,4865-4866-4867-49195-49199-49196-49200-52393-52392,0-23-65281-10-11-35-16-5-13-18-51-45-43-27-17513,29-23-24,0
JA3 hash:   cd08e31494b9531f560d64c695473da9
```

有一个细微之处：JA3 中的"TLS 版本"字段使用的是 `ClientHello.legacy_version`，而不是 `supported_versions` 扩展。由于 TLS 1.3（RFC 8446）要求客户端为了向后兼容将 `legacy_version` 设为 `0x0303`（TLS 1.2），因此对于现代客户端，JA3 的版本字段几乎总是 `771`，即使它们支持 TLS 1.3。实际的 TLS 1.3 协商通过扩展 43（`supported_versions`）进行，但 JA3 使用的是头部字段。

JA3 在哈希之前必须过滤 GREASE 值。GREASE（RFC 8701）是一种机制，浏览器会将随机选择的保留值插入 cipher suites、扩展和其他字段中，以防止协议僵化。有效的 GREASE 值为 `0x0a0a`、`0x1a1a`、`0x2a2a`，以此类推直到 `0xfafa`。每个值都由两个相同的字节组成，且每个字节的低半字节（低 4 位）为 `0xA`。正确的 GREASE 过滤器需要检查两个条件：

```python
def is_grease(value: int) -> bool:
    return (value & 0x0f0f) == 0x0a0a and (value >> 8) == (value & 0xff)
```

!!! warning "JA3 在现代浏览器中的局限性"
    自 Chrome 110（2023 年 1 月）和 Firefox 114 起，浏览器会在每次连接时随机化 TLS 扩展的顺序。这意味着同一个浏览器在每次连接时会产生不同的 JA3 哈希，使得 JA3 对于识别现代浏览器实际上已经失效。JA3 对于 fingerprinting 非浏览器客户端（Python `requests`、`curl`、自定义机器人）仍然有用，因为这些客户端不实现扩展随机化。

### JA4

JA4 是 JA3 的继任者，由同一位主要作者（John Althouse）在 FoxIO 开发。它专门设计用于应对 TLS 扩展随机化，通过在哈希之前对扩展和 cipher suites 进行排序来实现。其格式由三个部分组成，以下划线分隔：`a_b_c`。

`a` 部分是人类可读的元数据字符串：协议（`t` 代表 TCP，`q` 代表 QUIC），TLS 版本（`12` 或 `13`），是否存在 SNI（`d` 代表域名，`i` 代表 IP），cipher suites 的数量（两位数），扩展的数量（两位数），以及第一个 ALPN 值的首尾字符（`h2` 代表 HTTP/2，`00` 代表无）。例如，`t13d1516h2` 表示 TCP TLS 1.3 带 SNI，15 个 cipher suites，16 个扩展，以及 HTTP/2 ALPN。

`b` 部分是排序后的 cipher suites 的截断 SHA-256 哈希。`c` 部分是排序后的扩展与签名算法连接后的截断 SHA-256 哈希。因为两个列表在哈希之前都经过排序，所以扩展随机化不会影响输出。

Cloudflare、AWS 和其他主要平台已采用 JA4。完整的 JA4+ 套件还包括 JA4S（服务器 fingerprinting）、JA4H（HTTP 客户端 fingerprinting）、JA4X（X.509 证书 fingerprinting）和 JA4SSH（SSH fingerprinting）。规范和工具可在 [github.com/FoxIO-LLC/ja4](https://github.com/FoxIO-LLC/ja4) 获取。

### JA3S（服务器 Fingerprinting）

JA3S 将相同的概念应用于 ServerHello 消息，但格式更简单，因为服务器选择的是单个 cipher suite 而非提供一个列表。JA3S 字符串为 `version,cipher,extensions`，其 MD5 哈希标识了服务器的 TLS 实现。将 JA3（或 JA4）与 JA3S 配对可以创建双向指纹：特定客户端与特定服务器通信会产生可预测的 JA3+JA3S 对，这比单独任何一个指纹都更具辨识度。

### 代理如何影响 TLS 指纹

代理的类型决定了 TLS 指纹是否被保留。SOCKS5 代理和 HTTP CONNECT 隧道在不终止 TLS 的情况下中继 TCP 流，因此目标服务器看到的是原始客户端的 TLS 指纹，不会发生任何变化。这是这些代理类型在保持指纹一致性方面的主要优势。

MITM 代理（终止 TLS 并与目标重新建立新连接）会用自身的 TLS 指纹替换客户端的指纹。目标看到的是代理软件的 cipher suites 和扩展，而不是浏览器的。如果代理使用标准 TLS 库（如 OpenSSL 或 BoringSSL）的默认设置，指纹将不匹配任何已知浏览器，这本身就是一个检测信号。

这就是为什么在进行隐蔽自动化时，Pydoll 使用 `--proxy-server`（创建 CONNECT 隧道，保留浏览器的 TLS 指纹）的方式优于外部 MITM 代理设置。

## HTTP/2 Fingerprinting

HTTP/2 连接暴露了一组与 TLS 不同的独立 fingerprinting 信号。客户端发送的第一个帧是 SETTINGS 帧，包含 `HEADER_TABLE_SIZE`、`ENABLE_PUSH`、`MAX_CONCURRENT_STREAMS`、`INITIAL_WINDOW_SIZE`、`MAX_FRAME_SIZE` 和 `MAX_HEADER_LIST_SIZE` 等参数。每个浏览器使用不同的默认值，并包含这些参数的不同子集。

除了 SETTINGS 之外，WINDOW_UPDATE 帧大小、初始流的优先级/权重以及 HTTP/2 伪头部（`:method`、`:authority`、`:scheme`、`:path`）的顺序在不同实现之间也各不相同。Chrome、Firefox 和 Safari 各自产生独特的这些值的组合。

Akamai 在 2017 年欧洲 Black Hat 大会上发表了关于 HTTP/2 fingerprinting 的基础性研究。他们的指纹格式连接了 SETTINGS 值、WINDOW_UPDATE 大小、PRIORITY 帧和伪头部顺序。JA4+ 套件中的 `JA4H` 用于 HTTP 层 fingerprinting，涵盖了头部顺序和值。

HTTP/2 fingerprinting 对自动化工具特别有效，因为许多机器人框架和 HTTP 库实现了自己的 HTTP/2 协议栈，其默认参数与任何真实浏览器都不匹配。即使工具正确伪造了 TLS 指纹（使用 curl-impersonate 或类似工具），其 HTTP/2 SETTINGS 帧也可能暴露它。

你可以在 [browserleaks.com/http2](https://browserleaks.com/http2) 检查你的 HTTP/2 指纹。因为 Pydoll 通过 CDP 控制真实的 Chrome 实例，HTTP/2 指纹始终是真实的——这是相对于以编程方式构建 HTTP 请求的工具的固有优势。

## 对浏览器自动化的影响

使用 Pydoll 进行自动化时的实际要点是：network fingerprinting 正是控制真实浏览器能带来显著优势的领域。Chrome 的 TCP/IP 协议栈、TLS 实现（BoringSSL）和 HTTP/2 协议栈默认产生真实的指纹。主要风险在于环境不匹配：在 Linux 服务器上运行 Chrome 而 User-Agent 声称是 Windows，会导致 TCP/IP 指纹不一致（TTL 为 64 而非 128，Linux TCP 选项顺序而非 Windows 的）。

对于基于代理的设置，指纹流程是：你的机器的 TCP/IP 协议栈生成到代理的连接（代理的运营商可以看到但目标无法看到），代理的 TCP/IP 协议栈生成到目标的连接。目标看到的是代理服务器的 TTL 和 TCP 选项。如果代理运行 Linux（大多数都是），无论 User-Agent 如何，TCP 指纹都将显示 Linux。这是一个众所周知的检测信号，住宅代理可以部分缓解（代理端点是真实用户的机器，因此其 TCP 指纹是合理的），但数据中心代理无法做到。

另一方面，TLS 和 HTTP/2 指纹通过 SOCKS5 和 CONNECT 隧道不做修改地传递。这些是浏览器的指纹，不是代理的。因此，通过 CONNECT 隧道使用 Pydoll 时，目标看到的是真实的 Chrome TLS 和 HTTP/2 指纹，配合代理的 TCP/IP 指纹。这种组合与真实用户通过 VPN 或企业代理浏览是一致的，这是一种常见且合理的模式。

## 参考资料

- Salesforce Engineering: TLS Fingerprinting with JA3 and JA3S - https://engineering.salesforce.com/tls-fingerprinting-with-ja3-and-ja3s-247362855967/
- FoxIO JA4+ Network Fingerprinting - https://github.com/FoxIO-LLC/ja4
- Cloudflare: JA4 Signals - https://blog.cloudflare.com/ja4-signals/
- Akamai: Passive Fingerprinting of HTTP/2 Clients (Black Hat EU 2017) - https://blackhat.com/docs/eu-17/materials/eu-17-Shuster-Passive-Fingerprinting-Of-HTTP2-Clients-wp.pdf
- p0f v3: Passive OS Fingerprinting - https://lcamtuf.coredump.cx/p0f3/
- RFC 8446: TLS 1.3 - https://datatracker.ietf.org/doc/html/rfc8446
- RFC 8701: GREASE for TLS - https://datatracker.ietf.org/doc/html/rfc8701
- RFC 6528: Defending against Sequence Number Attacks - https://datatracker.ietf.org/doc/html/rfc6528
- BrowserLeaks HTTP/2 Fingerprint - https://browserleaks.com/http2
- Stamus Networks: JA3 Fingerprints Fade as Browsers Embrace Extension Randomization - https://www.stamus-networks.com/blog/ja3-fingerprints-fade-browsers-embrace-tls-extension-randomization


================================================
FILE: docs/zh/deep-dive/fundamentals/cdp.md
================================================
# Chrome 开发者工具协议 (CDP)

Chrome 开发者工具协议 (CDP) 是 Pydoll 能够在没有传统 webdriver 的情况下控制浏览器的基础。理解 CDP 的工作原理有助于深入了解 Pydoll 的功能和内部架构。


## 什么是 CDP？

Chrome 开发者工具协议是 Chromium 团队开发的一个强大接口，允许通过编程方式与基于 Chromium 的浏览器进行交互。它与您检查网页时 Chrome 开发者工具所使用的协议相同，但它作为可编程 API 暴露出来，可供自动化工具利用。

CDP 的核心是提供了一套全面的方法和事件，用于与浏览器内部进行交互。这使得我们可以精细控制浏览器的各个方面，从页面导航到操作 DOM、拦截网络请求和监控性能指标。

!!! info "CDP 的演进"
    自推出以来，Chrome 开发者工具协议一直在不断发展。Google 随着每个 Chrome 版本的发布都会维护和更新该协议，定期添加新功能并改进现有特性。
    
    虽然该协议最初是为 Chrome 的开发者工具设计的，但其全面的功能已使其成为下一代浏览器自动化工具（如 Puppeteer、Playwright，当然还有 Pydoll）的基础。

## WebSocket 通信

CDP 在架构上的一个关键决策是使用 WebSocket 进行通信。当基于 Chromium 的浏览器以启用远程调试标志启动时，它会在指定端口上打开一个 WebSocket 服务器：

```
chrome --remote-debugging-port=9222
```

Pydoll 连接到此 WebSocket 端点，以与浏览器建立双向通信通道。该连接：

1.  在整个自动化会话期间 **保持持久性**
2.  使浏览器能够将 **实时事件** 推送给客户端
3.  允许向浏览器 **发送命令**
4.  **支持二进制数据**，以高效传输屏幕截图、PDF 和其他资产

WebSocket 协议特别适用于浏览器自动化，因为它提供：

- **低延迟通信** - 响应式自动化所必需
- **双向消息传递** - 事件驱动架构的基础
- **持久连接** - 消除了每个操作的连接设置开销

以下是 Pydoll 与浏览器通信方式的简化视图：

```mermaid
sequenceDiagram
    participant App as Pydoll 应用程序
    participant WS as WebSocket 连接
    participant Browser as Chrome 浏览器

    App ->> WS: 命令：导航到 URL
    WS ->> Browser: 执行导航

    Browser -->> WS: 发送页面加载事件
    WS -->> App: 接收页面加载事件
```

!!! info "WebSocket vs HTTP"
    早期的浏览器自动化协议通常依赖 HTTP 端点进行通信。CDP 转向 WebSocket 代表了一项重大的架构改进，可实现响应更灵敏的自动化和实时事件监控。
    
    基于 HTTP 的协议需要持续轮询以检测变化，这会产生开销和延迟。WebSocket 允许浏览器在事件发生时立即将通知推送给您的自动化脚本，延迟极小。

## 关键 CDP 域

CDP 被组织成逻辑域，每个域负责浏览器功能的特定方面。一些最重要的域包括：


| 域 (Domain) | 职责 | 示例用例 |
|---|---|---|
| **Browser** | 控制浏览器应用程序本身 | 窗口管理、浏览器上下文创建 |
| **Page** | 与页面生命周期交互 | 导航、JavaScript 执行、框架管理 |
| **DOM** | 访问页面结构 | 查询选择器、属性修改、事件监听器 |
| **Network** | 网络流量监控和控制 | 请求拦截、响应检查、缓存 |
| **Runtime** | JavaScript 执行环境 | 评估表达式、调用函数、处理异常 |
| **Input** | 模拟用户交互 | 鼠标移动、键盘输入、触摸事件 |
| **Target** | 管理浏览器上下文和目标 | 创建标签页、访问 iframe、处理弹出窗口 |
| **Fetch** | 底层网络拦截 | 修改请求、模拟响应、身份验证 |

Pydoll 将这些 CDP 域映射到更直观的 API 结构中，同时保留了底层协议的全部功能。

## 事件驱动架构

CDP 最强大的功能之一是其事件系统。该协议允许客户端订阅浏览器在正常操作期间发出的各种事件。这些事件几乎涵盖了浏览器行为的各个方面：

- **生命周期事件**：页面加载、框架导航、目标创建
- **DOM 事件**：元素变化、属性修改
- **网络事件**：请求/响应周期、WebSocket 消息
- **执行事件**：JavaScript 异常、控制台消息
- **性能事件**：渲染、脚本和更多指标


当您在 Pydoll 中启用事件监控时（例如，使用 `page.enable_network_events()`），库会与浏览器设置必要的订阅，并为您的代码提供钩子以对这些事件做出反应。

```python
from pydoll.events.network import NetworkEvents
from functools import partial

async def on_request(page, event):
    url = event['params']['request']['url']
    print(f"Request to: {url}")

# 订阅网络请求事件
await page.enable_network_events()
await page.on(NetworkEvents.REQUEST_WILL_BE_SENT, partial(on_request, page))
```

这种事件驱动的方法允许自动化脚本立即对浏览器状态变化做出反应，而无需依赖低效的轮询或任意延迟。

## 直接 CDP 集成的性能优势

像 Pydoll 那样直接使用 CDP，与传统的基于 webdriver 的自动化相比，具有多种性能优势：

### 1. 消除协议转换层

传统的基于 webdriver 的工具（如 Selenium）使用多层方法：

```mermaid
graph LR
    AS[自动化脚本] --> WC[WebDriver 客户端]
    WC --> WS[WebDriver 服务器]
    WS --> B[浏览器]
```

每一层都会增加开销，尤其是 WebDriver 服务器，它充当 WebDriver 协议和浏览器本机 API 之间的转换层。

Pydoll 的方法将其简化为：

```mermaid
graph LR
    AS[自动化脚本] --> P[Pydoll]
    P --> B[通过 CDP 连接浏览器]
```

这种直接通信消除了中间服务器的计算和网络开销，从而加快了操作速度。

### 2. 高效的命令批处理

CDP 允许在单个消息中批处理多个命令，减少了复杂操作所需的往返次数。这对于需要多个步骤的操作（例如查找元素然后与其交互）特别有价值。

### 3. 异步操作

CDP 基于 WebSocket、事件驱动的架构与 Python 的 asyncio 框架完美契合，可实现真正的异步操作。这使得 Pydoll 能够：

- 并发执行多个操作
- 在事件发生时处理它们
- 在 I/O 操作期间避免阻塞主线程

```mermaid
graph TD
    subgraph "Pydoll 异步架构"
        EL[事件循环]
        
        subgraph "并发任务"
            T1[任务 1: 导航]
            T2[任务 2: 等待元素]
            T3[任务 3: 处理网络事件]
        end
        
        EL --> T1
        EL --> T2
        EL --> T3
        
        T1 --> WS[WebSocket 连接]
        T2 --> WS
        T3 --> WS
        
        WS --> B[浏览器]
    end
```

!!! info "异步性能提升"
    asyncio 和 CDP 的结合对性能产生了倍增效应。在基准测试中，Pydoll 的异步方法可以以接近线性的扩展性并行处理多个页面，而传统的同步工具在并发性增加时收益递减。
    
    例如，使用同步工具抓取 10 个各需 2 秒加载的页面可能需要超过 20 秒，但使用 Pydoll 的异步架构（加上一些最小的开销）仅需 2 秒多一点。

### 4. 精细的控制

CDP 提供了比 WebDriver 协议更精细的浏览器行为控制。这使得 Pydoll 能够为常见操作实施优化策略：

- 更精确的等待条件（而非任意超时）
- 直接访问浏览器缓存和存储
- 在特定上下文中定向执行 JavaScript
- 详细的网络控制以优化请求


## 结论

Chrome 开发者工具协议构成了 Pydoll 零 webdriver 浏览器自动化方法的基础。通过利用 CDP 的 WebSocket 通信、全面的域覆盖、事件驱动架构和直接的浏览器集成，Pydoll 实现了优于传统自动化工具的性能和可靠性。

在接下来的部分中，我们将更深入地探讨 Pydoll 如何实现特定的 CDP 域，并将低级协议转换为直观、对开发人员友好的 API。


================================================
FILE: docs/zh/deep-dive/fundamentals/connection-layer.md
================================================
# Connection Handler (连接处理器)

Connection Handler 是 Pydoll 架构的基础层，充当 Python 代码与浏览器 Chrome DevTools Protocol (CDP) 之间的桥梁。该组件管理与浏览器的 WebSocket 连接，处理命令执行，并以非阻塞、异步的方式处理事件。

```mermaid
graph TD
    A[Python 代码] --> B[Connection Handler]
    B <--> C[WebSocket]
    C <--> D[浏览器 CDP 端点]

    subgraph "Connection Handler"
        E[命令管理器]
        F[事件处理器]
        G[WebSocket 客户端]
    end

    B --> E
    B --> F
    B --> G
```

## 异步编程模型

Pydoll 构建于 Python 的 `asyncio` 框架之上，该框架支持非阻塞 I/O 操作。这种设计选择对于高性能的浏览器自动化至关重要，因为它允许多个操作并发执行，而无需等待每个操作完成。

### 理解 Async/Await


为了理解 async/await 在实践中如何工作，让我们看一个包含两个并发操作的示例：

```python
import asyncio
from pydoll.browser.chrome import Chrome

async def fetch_page_data(url):
    print(f"开始抓取 {url}")
    browser = Chrome()
    await browser.start()
    page = await browser.get_page()
    
    # 导航需要时间 - 这是我们让出控制权的地方
    await page.go_to(url)
    
    # 获取页面标题
    title = await page.execute_script("return document.title")
    
    # 提取一些数据
    description = await page.execute_script(
        "return document.querySelector('meta[name=\"description\"]')?.content || ''"
    )
    
    await browser.stop()
    print(f"完成抓取 {url}")
    return {"url": url, "title": title, "description": description}

async def main():
    # 并发启动两个页面操作
    task1 = asyncio.create_task(fetch_page_data("https://example.com"))
    task2 = asyncio.create_task(fetch_page_data("https://github.com"))
    
    # 等待两者完成并获取结果
    result1 = await task1
    result2 = await task2
    
    return [result1, result2]

# 运行异步函数
results = asyncio.run(main())
```

此示例演示了我们如何并发地从两个不同的网站获取数据，与顺序执行相比，这可能将总执行时间缩短近一半。

#### 异步执行流程图

以下是执行上述代码时事件循环中发生的情况：

```mermaid
sequenceDiagram
    participant A as 主代码
    participant B as 任务 1<br/> (example.com)
    participant C as 任务 2<br/> (github.com)
    participant D as 事件循环
    
    A->>B: 创建任务 1
    B->>D: 在循环中注册
    A->>C: 创建任务 2
    C->>D: 在循环中注册
    D->>B: 执行直到 browser.start()
    D->>C: 执行直到 browser.start()
    D-->>B: WebSocket 连接后恢复
    D-->>C: WebSocket 连接后恢复
    D->>B: 执行直到 page.go_to()
    D->>C: 执行直到 page.go_to()
    D-->>B: 页面加载后恢复
    D-->>C: 页面加载后恢复
    B-->>A: 返回结果
    C-->>A: 返回结果
```

此序列图说明了 Python 的 asyncio 如何管理我们示例代码中的两个并发任务：

1.  主函数创建两个任务，用于从不同网站获取数据
2.  两个任务都在事件循环中注册
3.  事件循环执行每个任务，直到遇到 `await` 语句（如 `browser.start()`）
4.  当异步操作完成时（如 WebSocket 连接建立），任务恢复执行
5.  循环在每个 `await` 点继续在任务之间切换
6.  当每个任务完成时，它将其结果返回给主函数

在 `fetch_page_data` 示例中，这允许两个浏览器实例并发工作 - 当一个实例等待页面加载时，另一个实例可以取得进展。这比顺序处理每个网站要高效得多，因为 I/O 等待时间不会阻塞其他任务的执行。

!!! info "协作式多任务"
    Asyncio 使用协作式多任务，其中任务在 `await` 点自愿让出控制权。这不同于抢占式多任务（线程），后者中任务可能在任何时候被中断。协作式多任务可以为 I/O 密集型操作提供更好的性能，但需要仔细编码以避免阻塞事件循环。

## Connection Handler 实现

`ConnectionHandler` 类旨在管理命令执行和事件处理，为 CDP WebSocket 连接提供了一个健壮的接口。

### 类初始化

```python
def __init__(
    self,
    connection_port: int,
    page_id: str = 'browser',
    ws_address_resolver: Callable[[int], str] = get_browser_ws_address,
    ws_connector: Callable = websockets.connect,
):
    # 初始化组件...
```

ConnectionHandler 接受几个参数：

| 参数 | 类型 | 描述 |
|---|---|---|
| `connection_port` | `int` | 浏览器 CDP 端点正在监听的端口号 |
| `page_id` | `str` | 特定页面/目标的标识符（浏览器级别的连接使用 'browser'） |
| `ws_address_resolver` | `Callable` | 从端口号解析 WebSocket URL 的函数 |
| `ws_connector` | `Callable` | 建立 WebSocket 连接的函数 |

### 内部组件

ConnectionHandler 协调三个主要组件：

1.  **WebSocket 连接**：管理与浏览器的实际 WebSocket 通信
2.  **命令管理器**：处理发送命令和接收响应
3.  **事件处理器**：处理来自浏览器的事件并触发适当的回调

```mermaid
classDiagram
    class ConnectionHandler {
        -_connection_port: int
        -_page_id: str
        -_ws_connection
        -_command_manager: CommandManager
        -_events_handler: EventsHandler
        +execute_command(command, timeout) async
        +register_callback(event_name, callback) async
        +remove_callback(callback_id) async
        +ping() async
        +close() async
        -_receive_events() async
    }

    class CommandManager {
        -_pending_commands: dict
        +create_command_future(command)
        +resolve_command(id, response)
        +remove_pending_command(id)
    }

    class EventsHandler {
        -_callbacks: dict
        -_network_logs: list
        -_dialog: dict
        +register_callback(event_name, callback, temporary)
        +remove_callback(callback_id)
        +clear_callbacks()
        +process_event(event) async
    }

    ConnectionHandler *-- CommandManager
    ConnectionHandler *-- EventsHandler
```

## 命令执行流程

通过 CDP 执行命令时，ConnectionHandler 遵循特定模式：

1.  确保存在活动的 WebSocket 连接
2.  创建一个 Future 对象来表示挂起的响应
3.  通过 WebSocket 发送命令
4.  等待 Future 被响应解析
5.  将响应返回给调用者

```python
async def execute_command(self, command: dict, timeout: int = 10) -> dict:
    # 验证命令
    if not isinstance(command, dict):
        logger.error('Command must be a dictionary.')
        raise exceptions.InvalidCommand('Command must be a dictionary')

    # 确保连接处于活动状态
    await self._ensure_active_connection()
    
    # 为此命令创建 future
    future = self._command_manager.create_command_future(command)
    command_str = json.dumps(command)

    # 发送命令并等待响应
    try:
        await self._ws_connection.send(command_str)
        response: str = await asyncio.wait_for(future, timeout)
        return json.loads(response)
    except asyncio.TimeoutError as exc:
        self._command_manager.remove_pending_command(command['id'])
        raise exc
    except websockets.ConnectionClosed as exc:
        await self._handle_connection_loss()
        raise exc
```

!!! warning "命令超时"
    未在指定超时期限内收到响应的命令将引发 `TimeoutError`。这可以防止自动化脚本因缺少响应而无限期挂起。默认超时为 10 秒，但可以根据复杂操作的预期响应时间进行调整。

## 事件处理系统

事件系统是启用 Pydoll 中反应式编程模式的关键架构组件。它允许您为特定浏览器事件注册回调，并在这些事件发生时自动执行它们。

### 事件流

事件处理流程遵循以下步骤：

1.  `_receive_events` 方法作为后台任务运行，持续从 WebSocket 接收消息
2.  每条消息被解析并分类为命令响应或事件
3.  事件被传递给 EventsHandler 进行处理
4.  EventsHandler 识别该事件已注册的回调并调用它们

```mermaid
flowchart TD
    A[WebSocket 消息] --> B{是命令响应吗？}
    B -->|是| C[解析命令 Future]
    B -->|否| D[作为事件处理]
    D --> E[查找匹配的回调]
    E --> F[执行回调]
    F --> G{是临时的吗？}
    G -->|是| H[移除回调]
    G -->|否| I[保留回调]
```

### 回调注册

ConnectionHandler 提供了注册、移除和管理事件回调的方法：

```python
# 为特定事件注册回调
callback_id = await connection.register_callback(
    'Page.loadEventFired', 
    handle_page_load
)

# 移除特定回调
await connection.remove_callback(callback_id)

# 移除所有回调
await connection.clear_callbacks()
```

!!! tip "临时回调"
    您可以将回调注册为临时的，这意味着它在触发一次后将自动移除。这对于一次性事件（如处理对话框）很有用：
    
    ```python
    await connection.register_callback(
        'Page.javascriptDialogOpening',
        handle_dialog,
        temporary=True
    )
    ```

### 异步回调执行

回调可以是同步函数或异步协程。EventsHandler（由 ConnectionHandler 管理）可以正确处理这两种类型：

```python
# 同步回调
def synchronous_callback(event):
    print(f"Event received: {event['method']}")

# 异步回调
async def asynchronous_callback(event):
    await asyncio.sleep(0.1)  # 执行一些异步操作
    print(f"Event processed asynchronously: {event['method']}")

# 两者都可以用相同的方式注册
await connection.register_callback('Network.requestWillBeSent', synchronous_callback)
await connection.register_callback('Network.responseReceived', asynchronous_callback)
```

**顺序执行模型：**

异步回调由 EventsManager **顺序等待 (await)**。这确保了对于单个事件，回调按照它们注册的顺序执行，防止了多个回调修改共享状态时出现竞争条件。

```python
# 在 EventsManager.process_event() 内部
for callback_data in callbacks:
    if asyncio.iscoroutinefunction(callback_data['callback']):
        await callback_data['callback'](event_data)  # 顺序 await
    else:
        callback_data['callback'](event_data)  # 同步执行
```

**非阻塞执行**（用于不应阻塞其他操作的 UI 回调）是在 **更高层** 实现的，例如在 `Tab.on()` 方法中，它在注册用户回调之前将其包装在 `asyncio.create_task()` 中。这种架构提供了：

- **底层** (ConnectionHandler/EventsManager)：保证顺序执行和可预测的顺序
- **高层** (Tab.on())：在需要时提供非阻塞语义

!!! info "事件架构详情"
    有关多层事件系统和顺序回调执行原理的完整详细信息，请参阅 [事件架构深入探讨](../architecture/event-architecture.md)。

## 连接管理

ConnectionHandler 实现了多种策略以确保连接的健壮性：

### 延迟连接建立

仅在需要时才建立连接，通常是在执行第一个命令时或明确请求时。这种延迟初始化方法可以节省资源，并允许更灵活的连接管理。

### 自动重新连接

如果 WebSocket 连接意外丢失或关闭，ConnectionHandler 将在执行下一个命令时尝试自动重新建立连接。这提供了对瞬态网络问题的弹性。

```python
async def _ensure_active_connection(self):
    """
    保证在继续之前存在活动连接。
    """
    if self._ws_connection is None or self._ws_connection.closed:
        await self._establish_new_connection()
```

### 资源清理

ConnectionHandler 实现了显式清理方法和 Python 的异步上下文管理器协议（`__aenter__` 和 `__aexit__`），确保在不再需要资源时正确释放它们：

```python
async def close(self):
    """
    关闭 WebSocket 连接并清除所有回调。
    """
    await self.clear_callbacks()
    if self._ws_connection is not None:
        try:
            await self._ws_connection.close()
        except websockets.ConnectionClosed as e:
            logger.info(f'WebSocket connection has closed: {e}')
        logger.info('WebSocket connection closed.')
```

!!! info "上下文管理器用法"
    将 ConnectionHandler 用作上下文管理器是确保正确清理资源的推荐模式：
    
    ```python
    async with ConnectionHandler(9222, 'browser') as connection:
        # 使用连接...
        await connection.execute_command(...)
    # 退出上下文时自动关闭连接
    ```

## 消息处理管道

ConnectionHandler 实现了一个复杂的消息处理管道，用于处理来自 WebSocket 连接的连续消息流：

```mermaid
sequenceDiagram
    participant WS as WebSocket
    participant RCV as _receive_events
    participant MSG as _process_single_message
    participant PARSE as _parse_message
    participant CMD as _handle_command_message
    participant EVT as _handle_event_message
    
    loop 当连接时
        WS->>RCV: 消息
        RCV->>MSG: 原始消息
        MSG->>PARSE: 原始消息
        PARSE-->>MSG: 解析后的 JSON 或 None
        
        alt 是命令响应
            MSG->>CMD: 消息
            CMD->>CMD: 解析命令 future
        else 是事件通知
            MSG->>EVT: 消息
            EVT->>EVT: 处理事件并触发回调
        end
    end
```

该管道确保了命令响应和异步事件的高效处理，使 Pydoll 即使在大量消息的情况下也能保持响应灵敏的操作。

## 高级用法

ConnectionHandler 通常通过 Browser 和 Page 类间接使用，但也可以直接用于高级场景：

### 直接事件监控

对于特殊用例，您可能希望绕过更高级别的 API，直接监控特定的 CDP 事件：

```python
from pydoll.connection.connection import ConnectionHandler

async def monitor_network():
    connection = ConnectionHandler(9222)
    
    async def log_request(event):
        url = event['params']['request']['url']
        print(f"Request: {url}")
    
    await connection.register_callback(
        'Network.requestWillBeSent', 
        log_request
    )
    
    # 通过 CDP 命令启用网络事件
    await connection.execute_command({
        "id": 1,
        "method": "Network.enable"
    })
    
    # 持续运行直到被中断
    try:
        while True:
            await asyncio.sleep(1)
    finally:
        await connection.close()
```

### 自定义命令执行

您可以直接执行任意 CDP 命令：

```python
async def custom_cdp_command(connection, method, params=None):
    command = {
        "id": random.randint(1, 10000),
        "method": method,
        "params": params or {}
    }
    return await connection.execute_command(command)

# 示例：不使用 Page 类获取文档 HTML
async def get_html(connection):
    result = await custom_cdp_command(
        connection,
        "Runtime.evaluate",
        {"expression": "document.documentElement.outerHTML"}
    )
    return result['result']['result']['value']
```

!!! warning "高级接口"
    直接使用 ConnectionHandler 需要深入了解 Chrome DevTools 协议。对于大多数用例，更高级别的 Browser 和 Page API 提供了更直观、更安全的接口。


## 高级并发模式

ConnectionHandler 的异步设计支持复杂的并发模式：

### 并行命令执行

并发执行多个命令并等待所有结果：

```python
async def get_page_metrics(connection):
    commands = [
        {"id": 1, "method": "Performance.getMetrics"},
        {"id": 2, "method": "Network.getResponseBody", "params": {"requestId": "..."}},
        {"id": 3, "method": "DOM.getDocument"}
    ]
    
    results = await asyncio.gather(
        *(connection.execute_command(cmd) for cmd in commands)
    )
    
    return results
```

## 结论

ConnectionHandler 是 Pydoll 架构的基础，为 Chrome DevTools 协议提供了健壮、高效的接口。通过利用 Python 的 asyncio 框架和 WebSocket 通信，它支持高性能的浏览器自动化，并具有优雅的、事件驱动的编程模式。

理解 ConnectionHandler 的设计和操作，有助于深入了解 Pydoll 的内部工作原理，并为在特殊场景下进行高级定制和优化提供了机会。

对于大多数用例，您将通过更高级别的 Browser 和 Page API 间接与 ConnectionHandler 交互，这些 API 提供了更直观的接口，同时利用了 ConnectionHandler 的强大功能。

================================================
FILE: docs/zh/deep-dive/fundamentals/iframes-and-contexts.md
================================================
# Iframes、OOPIF 和执行上下文（深度解析）

理解浏览器自动化如何处理 iframe 对于构建健壮的自动化工具至关重要。本综合指南探讨了 Pydoll 中 iframe 处理的技术基础，涵盖了文档对象模型 (DOM)、Chrome DevTools 协议 (CDP) 机制、执行上下文、隔离世界 (isolated worlds) 以及使 iframe 交互变得无缝的复杂解析管道。

!!! info "实用用法优先"
    如果您只需要在自动化脚本中使用 iframe，请从功能指南开始：**功能 → 自动化 → IFrames**。
    本深度解析解释了架构决策、协议的细微差别以及内部实现细节。

---

## 目录

1. [基础：文档对象模型 (DOM)](#基础文档对象模型-dom)
2. [什么是 Iframes 及其重要性](#什么是-iframes-及其重要性)
3. [挑战：跨进程 Iframes (OOPIFs)](#挑战跨进程-iframes-oopifs)
4. [Chrome DevTools 协议和 Frame 管理](#chrome-devtools-协议和-frame-管理)
5. [执行上下文和隔离世界](#执行上下文和隔离世界)
6. [CDP 标识符参考](#cdp-标识符参考)
7. [Pydoll 的解析管道](#pydoll-的解析管道)
8. [会话路由和扁平化模式](#会话路由和扁平化模式)
9. [实现深度解析](#实现深度解析)
10. [性能考量](#性能考量)
11. [失败模式和调试](#失败模式和调试)

---

## 基础：文档对象模型 (DOM)

在深入研究 iframe 之前，我们必须了解 DOM——在内存中表示 HTML 文档的树形结构。

### 什么是 DOM？

**文档对象模型** (Document Object Model) 是 HTML 和 XML 文档的编程接口。它将页面结构表示为一个节点树，其中每个节点对应文档的一部分：

- **元素节点**：HTML 标签，如 `<div>`、`<iframe>`、`<button>`
- **文本节点**：实际的文本内容
- **属性节点**：元素属性，如 `id`、`class`、`src`
- **文档节点**：树的根节点

```mermaid
graph TD
    Document[文档] --> HTML[html 元素]
    HTML --> Head[head 元素]
    HTML --> Body[body 元素]
    Body --> Div1[div 元素]
    Body --> Div2[div 元素]
    Div1 --> Text1[文本节点: 'Hello']
    Div2 --> Iframe[iframe 元素]
    Iframe --> IframeDoc[iframe 的文档]
    IframeDoc --> IframeBody[iframe body]
    IframeBody --> IframeContent[iframe 内容...]
```

### DOM 树属性

1. **层级结构**：每个节点都有一个父节点（Document 除外），并且可以有子节点
2. **节点标识**：节点可以通过以下方式标识：
   - `nodeId`：文档上下文（DOM 域）内的内部标识符
   - `backendNodeId`：可以跨不同文档引用节点的稳定标识符
3. **实时表示**：对 DOM 的更改会立即反映在树中

### 为什么这对 Iframes 很重要

每个 `<iframe>` 元素都会创建一个**新的、独立的 DOM 树**。 iframe 元素本身存在于父级的 DOM 中，但加载到 iframe 中的内容拥有自己完整的 Document 节点和树结构。这种分离是所有 iframe 复杂性的基础。

---

## 什么是 Iframes 及其重要性

### 定义

**iframe**（内联框架）是一个 HTML 元素（`<iframe>`），它在当前页面中嵌入另一个 HTML 文档。被嵌入的文档保持其自己的上下文，包括：

- 独立的 HTML 结构和 DOM 树
- 独立的 JavaScript 执行环境
- 自己的 CSS 样式（除非明确共享）
- 不同的导航历史

```html
<body>
  <h1>父页面</h1>
  <iframe src="https://example.com/embedded.html" id="content-frame"></iframe>
  <p>更多父页面内容</p>
</body>
```

### 常见用例

| 用例 | 描述 | 示例 |
|----------|-------------|---------|
| **第三方小部件** | 安全地嵌入外部内容 | 支付表单、社交媒体 feeds、聊天窗口 |
| **内容隔离** | 沙盒化不受信任的内容 | 用户生成的 HTML、广告 |
| **模块化架构** | 可重用组件 | 仪表盘小部件、插件系统 |
| **跨域内容** | 从不同域加载资源 | 地图、视频播放器、分析仪表盘 |

### 安全模型：同源策略 (Same-Origin Policy)

浏览器对 iframes 强制执行**同源策略**：

- **同源 iframes**：父级可以通过 JavaScript 访问 iframe 的 DOM (`iframe.contentDocument`)
- **跨域 iframes**：父级不能直接访问 iframe 的 DOM（安全限制）

这个安全边界就是为什么自动化工具需要特殊机制（如 CDP）来与 iframe 内容交互。

!!! warning "对自动化很重要"
    由于浏览器安全限制，传统的基于 JavaScript 的自动化（如 Selenium 的早期方法）无法直接访问跨域 iframe 的内容。CDP 在更底层运行，出于调试目的绕过了这个限制。

---

## 挑战：跨进程 Iframes (OOPIFs)

### 什么是 OOPIFs？

现代 Chromium 使用**站点隔离 (site isolation)** 来提高安全性和稳定性。这意味着不同的源 (origin) 可能会在单独的操作系统进程中渲染。来自不同源的 iframe 会成为**跨进程 Iframe (OOPIF)**。

```mermaid
graph LR
    subgraph "进程 1: example.com"
        MainPage[主页面 DOM]
    end
    
    subgraph "进程 2: widget.com"
        IframeDOM[Iframe DOM]
    end
    
    MainPage -.进程边界.-> IframeDOM
```

### 为什么 OOPIFs 使自动化复杂化

| 方面 | 进程内 Iframe | 跨进程 Iframe (OOPIF) |
|--------|-------------------|-------------------------------|
| **DOM 访问** | 内存中共享的文档树 | 拥有自己文档的独立目标 (target) |
| **命令路由** | 单个连接 | 需要目标附加 (target attachment) 和会话路由 (session routing) |
| **Frame 树** | 所有 frames 在一棵树中 | 根 frame + OOPIFs 的独立目标 |
| **JavaScript 上下文** | 相同的执行上下文 | 每个进程有不同的执行上下文 |
| **CDP 通信** | 直接命令 | 命令必须包含 `sessionId` |

### 传统方法（手动切换上下文）

如果没有完善的处理机制，自动化 OOPIF 需要如下的手动操作：

```python
# 其他工具的传统（手动）方法
main_page = browser.get_page()
iframe_element = main_page.find_element_by_id("iframe-id")

# 必须手动切换上下文
driver.switch_to.frame(iframe_element)

# 现在命令指向 iframe
button = driver.find_element_by_id("button-in-iframe")
button.click()

# 必须手动切换回来
driver.switch_to.default_content()
```

**这种方法的问题：**

1. **开发者负担**：每个 iframe 都需要显式的上下文管理
2. **嵌套 iframes**：每一层都需要再次切换
3. **OOPIF 检测**：很难知道何时需要手动附加
4. **容易出错**：忘记切换回来 → 后续命令失败
5. **不可组合**：辅助函数必须知道它们所处的 iframe 上下文

### Pydoll 的解决方案：透明的上下文解析

Pydoll 通过自动解析 iframe 上下文来消除手动上下文切换：

```python
# Pydoll 方法（无手动切换）
iframe = await tab.find(id="iframe-id")
button = await iframe.find(id="button-in-iframe")
await button.click()

# 嵌套 iframes？同样的模式
outer = await tab.find(id="outer-iframe")
inner = await outer.find(tag_name="iframe")
button = await inner.find(text="Submit")
await button.click()
```

复杂性在内部处理。让我们来探究一下是如何做到的。

---

## Chrome DevTools 协议和 Frame 管理

正如在 [深度解析 → 基础 → Chrome DevTools 协议](./cdp.md) 中讨论的，CDP 通过 WebSocket 通信提供全面的浏览器控制。Frame 管理分散在多个 CDP 域中。

### 相关的 CDP 域

#### 1. **Page 域**

管理页面生命周期、frames 和导航。

**关键方法：**

- `Page.getFrameTree()`：返回页面中所有 frames 的层级结构
  ```json
  {
    "frameTree": {
      "frame": {
        "id": "main-frame-id",
        "url": "https://example.com",
        "securityOrigin": "https://example.com",
        "mimeType": "text/html"
      },
      "childFrames": [
        {
          "frame": {
            "id": "child-frame-id",
            "parentId": "main-frame-id",
            "url": "https://widget.com/embed"
          }
        }
      ]
    }
  }
  ```

- `Page.createIsolatedWorld(frameId, worldName)`：在特定 frame 中创建一个新的 JavaScript 执行上下文
  ```json
  {
    "executionContextId": 42
  }
  ```

**Pydoll 用法：**

```python
# 源自 pydoll/elements/web_element.py
@staticmethod
async def _get_frame_tree_for(
    handler: ConnectionHandler, session_id: Optional[str]
) -> FrameTree:
    """获取给定连接/目标的 Page frame 树。"""
    command = PageCommands.get_frame_tree()
    if session_id:
        command['sessionId'] = session_id
    response: GetFrameTreeResponse = await handler.execute_command(command)
    return response['result']['frameTree']
```

#### 2. **DOM 域**

提供对 DOM 结构的访问。

**关键方法：**

- `DOM.describeNode(objectId)`：返回有关 DOM 节点的详细信息
  ```json
  {
    "node": {
      "nodeId": 123,
      "backendNodeId": 456,
      "nodeName": "IFRAME",
      "frameId": "parent-frame-id",
      "contentDocument": {
        "frameId": "iframe-frame-id",
        "documentURL": "https://embedded.com/page.html"
      }
    }
  }
  ```

- `DOM.getFrameOwner(frameId)`：返回拥有某个 frame 的 `<iframe>` 元素的 `backendNodeId`
  ```json
  {
    "backendNodeId": 456
  }
  ```

**Pydoll 用法：**

```python
# 源自 pydoll/elements/web_element.py
@staticmethod
async def _owner_backend_for(
    handler: ConnectionHandler, session_id: Optional[str], frame_id: str
) -> Optional[int]:
    """获取拥有给定 frame 的 DOM 元素的 backendNodeId。"""
    command = DomCommands.get_frame_owner(frame_id=frame_id)
    if session_id:
        command['sessionId'] = session_id
    response: GetFrameOwnerResponse = await handler.execute_command(command)
    return response.get('result', {}).get('backendNodeId')
```

#### 3. **Target 域**

管理浏览器目标（页面、iframes、workers 等）。

**关键方法：**

- `Target.getTargets()`：列出所有可用的目标
  ```json
  {
    "targetInfos": [
      {
        "targetId": "page-target-id",
        "type": "page",
        "title": "Main Page",
        "url": "https://example.com"
      },
      {
        "targetId": "iframe-target-id",
        "type": "iframe",
        "title": "",
        "url": "https://widget.com/embed",
        "parentFrameId": "main-frame-id"
      }
    ]
  }
  ```

- `Target.attachToTarget(targetId, flatten)`：附加到一个目标以进行调试
  - 当 `flatten=true` 时：返回一个 `sessionId` 用于在扁平化模式下路由命令
  - 所有通信都通过同一个 WebSocket 进行，通过 `sessionId` 区分

**Pydoll 用法：**

```python
# 源自 pydoll/interactions/iframe.py (简化版)
async def _resolve_oopif_by_parent(self, content_frame_id: str, ...):
    """使用 content frame id 解析 OOPIF。"""
    browser_handler = ConnectionHandler(...)
    targets_response: GetTargetsResponse = await browser_handler.execute_command(
        TargetCommands.get_targets()
    )
    target_infos = targets_response.get('result', {}).get('targetInfos', [])

    # 查找 parentFrameId 匹配的目标
    direct_children = [
        target_info for target_info in target_infos
        if target_info.get('parentFrameId') == content_frame_id
    ]
    
    if direct_children:
        attach_response: AttachToTargetResponse = await browser_handler.execute_command(
            TargetCommands.attach_to_target(
                target_id=direct_children[0]['targetId'], 
                flatten=True
            )
        )
        attached_session_id = attach_response.get('result', {}).get('sessionId')
        # ... 对后续命令使用 session_id
```

#### 4. **Runtime 域**

执行 JavaScript 并管理执行上下文。

**关键方法：**

- `Runtime.evaluate(expression, contextId)`：在指定的执行上下文中对 JavaScript 表达式求值
- `Runtime.callFunctionOn(functionDeclaration, objectId)`：调用一个函数，并将 `objectId` 所指向的对象绑定为该函数的 `this`

**Pydoll 用于 iframe 文档访问的用法：**

```python
# 源自 pydoll/elements/web_element.py
async def _set_iframe_document_object_id(self, execution_context_id: int):
    """在 iframe 上下文中评估 document.documentElement 并缓存其 object id。"""
    evaluate_command = RuntimeCommands.evaluate(
        expression='document.documentElement',
        context_id=execution_context_id,
    )
    if self._iframe_context and self._iframe_context.session_id:
        evaluate_command['sessionId'] = self._iframe_context.session_id
    
    evaluate_response: EvaluateResponse = await (
        (self._iframe_context.session_handler if self._iframe_context else None)
        or self._connection_handler
    ).execute_command(evaluate_command)
    
    document_object_id = evaluate_response.get('result', {}).get('result', {}).get('objectId')
    if self._iframe_context:
        self._iframe_context.document_object_id = document_object_id
```

---

## 执行上下文和隔离世界

### 什么是执行上下文？

**执行上下文** (execution context) 是执行 JavaScript 代码的环境。浏览器中的每个 frame 至少有一个执行上下文。该上下文包括：

- **全局对象**（在浏览器中是 `window`）
- **作用域链**：如何解析变量
- **This 绑定**：`this` 指向什么
- **变量环境**：所有声明的变量和函数

### 每个 Frame 的多个上下文

单个 frame 可以有多个执行上下文：

1. **主世界 (main world)（默认上下文）**：页面自己的 JavaScript 运行的地方
2. **隔离世界 (isolated worlds)**：共享相同 DOM 但具有不同 JavaScript 全局作用域的独立上下文

```mermaid
graph TB
    Frame[Frame: example.com/page]
    Frame --> MainWorld[主世界<br/>页面的 JavaScript]
    Frame --> IsolatedWorld1[隔离世界 1<br/>扩展的内容脚本]
    Frame --> IsolatedWorld2[隔离世界 2<br/>Pydoll 自动化]
    
    DOM[共享的 DOM 树]
    MainWorld -.可以访问.-> DOM
    IsolatedWorld1 -.可以访问.-> DOM
    IsolatedWorld2 -.可以访问.-> DOM
    
    MainWorld -.无法访问.-> IsolatedWorld1
    MainWorld -.无法访问.-> IsolatedWorld2
```

### 什么是隔离世界？

**隔离世界** (isolated world) 是一个独立的 JavaScript 执行上下文，它：

- **共享相同的 DOM**：可以读取/修改 DOM 元素
- **拥有独立的全局对象**：变量/函数不会在世界之间泄漏
- **防止干扰**：页面脚本无法检测或干扰隔离世界中的脚本

**起源**：隔离世界是为浏览器扩展创建的。内容脚本 (Content scripts) 运行在隔离世界中，因此它们可以与页面 DOM 交互，而不会：

- 被页面脚本覆盖其变量
- 被防篡改代码检测到
- 与页面的 JavaScript 冲突

### 为什么 Pydoll 对 Iframes 使用隔离世界

当 Pydoll 与 iframe 内容交互时，它会在该 iframe 的上下文中创建一个隔离世界。这提供了：

1. **干净的 JavaScript 环境**：与 iframe 自己的脚本没有冲突
2. **一致的行为**：无论 iframe 运行什么 JavaScript，自动化脚本都能工作
3. **反检测**：iframe 的 JavaScript 无法轻易检测到 Pydoll 的存在
4. **安全的评估**：自动化代码不会意外触发页面逻辑

**实现：**

```python
# 源自 pydoll/elements/web_element.py
@staticmethod
async def _create_isolated_world_for_frame(
    frame_id: str,
    handler: ConnectionHandler,
    session_id: Optional[str],
) -> int:
    """为给定的 frame 创建一个隔离世界 (Page.createIsolatedWorld)。"""
    create_command = PageCommands.create_isolated_world(
        frame_id=frame_id,
        world_name=f'pydoll::iframe::{frame_id}',
        grant_universal_access=True,
    )
    if session_id:
        create_command['sessionId'] = session_id
    
    create_response: CreateIsolatedWorldResponse = await handler.execute_command(
        create_command
    )
    execution_context_id = create_response.get('result', {}).get('executionContextId')
    if not execution_context_id:
        raise InvalidIFrame('无法为 iframe 创建隔离世界')
    return execution_context_id
```

`grant_universal_access=True` 参数允许隔离世界：

- 访问跨域 frames（通常被同源策略阻止）
- 执行自动化所需的特权操作

!!! tip "实践中的隔离世界"
    每当您使用 `await iframe.find(...)` 时，Pydoll 都会在专门为该 iframe 创建的隔离世界中评估选择器查询。这确保您的自动化逻辑永远不会与 iframe 自己的 JavaScript 冲突，并且 iframe 无法检测或阻止您的自动化。

---

## CDP 标识符参考

理解 CDP 标识符对于处理 iframe 至关重要。这是一个全面的参考：

| 标识符 | 域 | 范围 | 目的 | 在 Pydoll 中的用例 |
|------------|--------|-------|---------|----------------------|
| **`nodeId`** | DOM | 文档局部 | 在特定文档上下文中标识一个 DOM 节点 | 内部 CDP 操作；在导航中不稳定 |
| **`backendNodeId`** | DOM | 跨文档稳定 | DOM 节点的稳定标识符；可以将 frames 映射到所有者元素 | 用于通过 `DOM.getFrameOwner` 将 iframe 元素与 frame IDs 匹配 |
| **`frameId`** | Page | Frame | 标识页面 frame 树中的一个 frame | 用于为 `Page.createIsolatedWorld` 和 frame 树遍历指定哪个 frame |
| **`targetId`** | Target | 全局 | 标识一个调试目标（页面、iframe、worker 等） | 用于 `Target.attachToTarget` 以连接到 OOPIFs |
| **`sessionId`** | Target | 目标特定 | 在扁平化模式下将命令路由到特定目标 | 注入到命令中，将它们路由到正确的 OOPIF |
| **`executionContextId`** | Runtime | Frame + 世界 | 标识一个 JavaScript 执行上下文（包括隔离世界） | 由 `Page.createIsolatedWorld` 返回；用于 `Runtime.evaluate` |
| **`objectId`** | Runtime | 执行上下文 | 远程对象引用（例如 DOM 元素、函数、对象） | 对 iframe 的 `document.documentElement` 的引用，用于相对查询 |

### 标识符关系

以下是 iframe 解析期间标识符之间的关系：

```
┌─────────────────────────────────────────────────────────────────────────┐
│                         解析流程                                        │
└─────────────────────────────────────────────────────────────────────────┘

1. 开始: <iframe> 元素
   └─ backendNodeId: 789
   
2. 查找 Frame ──────────────[DOM.getFrameOwner]──────────────┐
   └─ frameId: abc-123                                       │
                                                             │
3. OOPIF? 检查源 ───────────────[检测到不同源]───────────────┤
   └─ targetId: xyz-456                                      │
                                                             │
4. 附加到目标 ────────────[Target.attachToTarget]────────────┤
   └─ sessionId: session-789                                 │
                                                             │
5. 创建隔离世界 ─────────[Page.createIsolatedWorld]──────────┤
   └─ executionContextId: 42                                 │
                                                             │
6. 获取文档 ───────────────[Runtime.evaluate]────────────────┘
   └─ objectId: obj-999
```

**关键转换点：**

| 从 | 方法 | 到 | 目的 |
|------|--------|-----|---------|
| `backendNodeId` | `DOM.getFrameOwner` | `frameId` | 对候选 frame 逐个调用并比对返回的 `backendNodeId`，找到由该 iframe 元素承载的 frame |
| `targetId` | `Target.attachToTarget(flatten=true)` | `sessionId` | 连接到 OOPIF 以进行命令路由 |
| `frameId` | `Page.createIsolatedWorld` | `executionContextId` | 创建安全的 JavaScript 环境 |
| `executionContextId` | `Runtime.evaluate('document.documentElement')` | `objectId` | 获取对 iframe 文档的引用 |

### Pydoll 中的代码表示

```python
# 源自 pydoll/elements/web_element.py
@dataclass
class _IFrameContext:
    """封装 iframe 的所有标识符和路由信息。"""
    frame_id: str                                   # frameId: 标识 frame
    document_url: Optional[str] = None              # frame 加载的 URL
    execution_context_id: Optional[int] = None      # executionContextId: 隔离世界
    document_object_id: Optional[str] = None        # objectId: document.documentElement
    session_handler: Optional[ConnectionHandler] = None  # 用于 OOPIF 目标
    session_id: Optional[str] = None                # sessionId: 将命令路由到 OOPIF
```

这个 dataclass 被缓存在代表 iframe 的每个 `WebElement` 上，实现了所有后续操作的自动路由。

---

## Pydoll 的解析管道

当您在 Pydoll 中访问 iframe（例如，`await iframe.find(...)`）时，一个精密的解析管道会在幕后执行。本节分解了每一步。

### 高级流程

```mermaid
sequenceDiagram
    participant 用户
    participant WebElement
    participant Pipeline as 解析管道
    participant CDP
    
    用户->>WebElement: iframe.find(id='button')
    WebElement->>WebElement: 检查 iframe 上下文是否已缓存
    alt 上下文未缓存
        WebElement->>Pipeline: _ensure_iframe_context()
        Pipeline->>CDP: DOM.describeNode(iframe)
        CDP-->>Pipeline: 节点信息 (frameId?, backendNodeId, 等)
        
        alt 节点信息中没有 frameId
            Pipeline->>Pipeline: _resolve_frame_by_owner()
            Pipeline->>CDP: Page.getFrameTree()
            CDP-->>Pipeline: Frame 树
            Pipeline->>CDP: DOM.getFrameOwner(每个 frame)
            CDP-->>Pipeline: backendNodeId
            Pipeline->>Pipeline: 匹配 backendNodeId 以查找 frameId
        end
        
        alt frameId 仍然缺失 (OOPIF)
            Pipeline->>Pipeline: _resolve_oopif_by_parent()
            Pipeline->>CDP: Target.getTargets()
            CDP-->>Pipeline: 目标列表
            Pipeline->>CDP: Target.attachToTarget(targetId, flatten=true)
            CDP-->>Pipeline: sessionId
            Pipeline->>CDP: Page.getFrameTree(sessionId)
            CDP-->>Pipeline: OOPIF frame 树
        end
        
        Pipeline->>CDP: Page.createIsolatedWorld(frameId)
        CDP-->>Pipeline: executionContextId
        
        Pipeline->>CDP: Runtime.evaluate('document.documentElement', contextId)
        CDP-->>Pipeline: objectId (文档引用)
        
        Pipeline->>WebElement: 缓存 _IFrameContext
    end
    
    WebElement->>WebElement: 使用缓存的上下文进行 find()
    WebElement-->>用户: 按钮元素 (带上下文)
```

### 步骤深度解析

#### **步骤 1：描述 Iframe 元素**

**目标**：从 `<iframe>` DOM 元素中提取元数据。

**方法**：`DOM.describeNode(objectId=iframe_object_id)`

**我们得到什么**：

- `backendNodeId`：iframe 元素的稳定标识符
- `frameId`（来自 `contentDocument`）：如果 iframe 的内容已加载并在进程内
- `documentURL`：iframe 中加载的 URL
- `parentFrameId`（来自节点上的 `frameId` 字段）：包含此 iframe 元素的 frame

**代码**：

```python
# 源自 pydoll/interactions/iframe.py
async def resolve(self) -> IFrameContext:
    """解析并返回 iframe 上下文。"""
    base_handler, base_session_id = self._get_base_session()
    node_info = await self._describe_element_node(base_handler, base_session_id)
    frame_id, document_url, content_frame_id, backend_node_id = self._extract_frame_metadata(
        node_info
    )
    # ... 继续解析
```

**辅助方法**：

```python
@staticmethod
def _extract_frame_metadata(
    node_info: Node,
) -> tuple[Optional[str], Optional[str], Optional[str], Optional[int]]:
    """从 DOM.describeNode 节点中提取 iframe 相关的元数据。"""
    content_document = node_info.get('contentDocument') or {}
    content_frame_id = node_info.get('frameId')
    backend_node_id = node_info.get('backendNodeId')
    frame_id = content_document.get('frameId')
    document_url = (
        content_document.get('documentURL')
        or content_document.get('baseURL')
        or node_info.get('documentURL')
        or node_info.get('baseURL')
    )
    return frame_id, document_url, content_frame_id, backend_node_id
```

**结果**：

- **如果 `frame_id` 存在**：很好！iframe 在进程内；进入步骤 4。
- **如果 `frame_id` 缺失**：iframe 可能是 OOPIF 或未完全加载；进入步骤 2。

---

#### **步骤 2：通过所有者解析 Frame（backendNodeId 匹配）**

**目标**：通过将 iframe 元素的 `backendNodeId` 与 frame 树中的 frame 所有者匹配，来找到 `frameId`。

**策略**：

1. 获取页面的 frame 树 (`Page.getFrameTree`)
2. 对树中的每个 frame，调用 `DOM.getFrameOwner(frameId)` 来获取所属 iframe 元素的 `backendNodeId`
3. 与我们的 iframe 的 `backendNodeId` 进行比较
4. 当它们匹配时，我们就找到了正确的 `frameId`

**代码**：

```python
# 源自 pydoll/elements/web_element.py
async def _resolve_frame_by_owner(
    self,
    base_handler: ConnectionHandler,
    base_session_id: Optional[str],
    backend_node_id: int,
    current_document_url: Optional[str],
) -> tuple[Optional[str], Optional[str]]:
    """通过匹配所有者的 backend_node_id 来解析 frame id 和 URL。"""
    owner_frame_id, owner_url = await self._find_frame_by_owner(
        base_handler, base_session_id, backend_node_id
    )
    if not owner_frame_id:
        return None, current_document_url
    return owner_frame_id, owner_url or current_document_url

async def _find_frame_by_owner(
    self, handler: ConnectionHandler, session_id: Optional[str], backend_node_id: int
) -> tuple[Optional[str], Optional[str]]:
    """通过匹配 <iframe> 元素的所有者 backend_node_id 来查找 frame。"""
    frame_tree = await self._get_frame_tree_for(handler, session_id)
    for frame_node in WebElement._walk_frames(frame_tree):
        candidate_frame_id = frame_node.get('id', '')
        if not candidate_frame_id:
            continue
        owner_backend_id = await self._owner_backend_for(
            handler, session_id, candidate_frame_id
        )
        if owner_backend_id == backend_node_id:
            return candidate_frame_id, frame_node.get('url')
    return None, None
```

**为什么这是必要的**：

- 对于跨域或延迟加载的 iframes，`DOM.describeNode` 有时不包含 `contentDocument.frameId`
- frame 树总是包含所有 frames（甚至是 OOPIFs），所以我们可以间接找到它

**结果**：

- **如果找到 `frameId`**：进入步骤 4。
- **如果仍然找不到**：iframe 很可能是一个在独立目标中的 OOPIF；进入步骤 3。

---

#### **步骤 3：通过父 Frame 解析 OOPIF**

**目标**：对于跨进程 Iframes，找到正确的目标，附加到它，并从该目标的 frame 树中获取 `frameId`（以及必要时用于路由的 `sessionId`）。

**何时会进入此步骤**：

- 已经有 `frameId` 且**没有** `backendNodeId` 的同源 / 进程内 iframe 会跳过此步骤（直接使用 `frameId`）。
- 具有 `backendNodeId` 的跨域 / OOPIF iframe，或在步骤 2 中仍无法解析 `frameId` 的 iframe，会进入此步骤。

**策略**：

**3a. 直接子目标查找（快速路径）**：

1. 调用 `Target.getTargets()` 列出所有调试目标。
2. 筛选 `type` 为 `"iframe"` 或 `"page"` 且 `parentFrameId` 与我们的父 frame 匹配的目标。
3. 如果只有**一个**匹配的子目标且**没有 `backendNodeId`**，则直接使用 `Target.attachToTarget(targetId, flatten=true)` 附加到该目标。
4. 为该目标获取 `Page.getFrameTree(sessionId)`；此树的根 frame 就是我们 iframe 的 frame。

当存在**多个**直接子目标或我们有 `backendNodeId`（典型 OOPIF 情况）时，Pydoll 会对每个子目标执行以下流程：

1. 使用 `Target.attachToTarget(flatten=true)` 附加。
2. 获取 `Page.getFrameTree(sessionId)` 并读取根 `frame.id`。
3. 在**主连接**上调用 `DOM.getFrameOwner(frameId=root_id)`。
4. 将返回的 `backendNodeId` 与 iframe 元素自身的 `backendNodeId` 比较。
5. 根所有者匹配的那个子目标被选为正确的 OOPIF 目标。

**3b. 备用方案：扫描所有目标（根所有者 + 子节点查找）**：

如果没有找到合适的直接子目标（或 `parentFrameId` 信息不完整），Pydoll 会退回到扫描**所有** iframe/page 目标：

1. 遍历所有 iframe/page 目标。
2. 附加到每个目标并获取其 frame 树。
3. 先尝试通过 `DOM.getFrameOwner(root_frame_id)` 将**根 frame 的所有者**与 iframe 的 `backendNodeId` 进行匹配。
4. 如果仍不匹配，则查找 `parentId` 等于我们的 `content_frame_id` 的**子 frame**（覆盖 OOPIF 由中间 frame 间接承载的情况）。

**代码**：

```python
# 源自 pydoll/interactions/iframe.py
async def _resolve_oopif_by_parent(
    self,
    content_frame_id: str,
    backend_node_id: Optional[int],
    base_handler: Optional[ConnectionHandler] = None,
    base_session_id: Optional[str] = None,
) -> tuple[Optional[ConnectionHandler], Optional[str], Optional[str], Optional[str]]:
    """使用 content frame id 解析 OOPIF。"""
    browser_handler = ConnectionHandler(
        connection_port=self._element._connection_handler._connection_port
    )
    targets_response: GetTargetsResponse = await browser_handler.execute_command(
        TargetCommands.get_targets()
    )
    target_infos = targets_response.get('result', {}).get('targetInfos', [])

    # 可以解析 DOM.getFrameOwner 的处理程序。
    # 当 <iframe> 位于嵌套 OOPIF 内部时，Tab 级处理程序没有可见性；
    # 我们必须通过最初发现该元素的会话路由。
    owner_handler = base_handler or self._element._connection_handler
    owner_session_id = base_session_id

    # 策略 3a：直接子目标（快速路径）
    direct_children = [
        target_info
        for target_info in target_infos
        if target_info.get('type') in {'iframe', 'page'}
        and target_info.get('parentFrameId') == content_frame_id
    ]

    is_single_child = len(direct_children) == 1
    for child_target in direct_children:
        attach_response: AttachToTargetResponse = await browser_handler.execute_command(
            TargetCommands.attach_to_target(
                target_id=child_target['targetId'], flatten=True
            )
        )
        attached_session_id = attach_response.get('result', {}).get('sessionId')
        if not attached_session_id:
            continue

        frame_tree = await self._get_frame_tree_for(browser_handler, attached_session_id)
        root_frame = (frame_tree or {}).get('frame', {})
        root_frame_id = root_frame.get('id', '')

        # 简单 / 同源场景：只有一个子目标且没有 backend_node_id
        if is_single_child and root_frame_id and backend_node_id is None:
            return (
                browser_handler,
                attached_session_id,
                root_frame_id,
                root_frame.get('url'),
            )

        # OOPIF 场景：通过 DOM.getFrameOwner 确认所有权
        if root_frame_id and backend_node_id is not None:
            owner_backend_id = await self._owner_backend_for(
                owner_handler, owner_session_id, root_frame_id
            )
            if owner_backend_id == backend_node_id:
                return (
                    browser_handler,
                    attached_session_id,
                    root_frame_id,
                    root_frame.get('url'),
                )

    # 策略 3b：扫描所有目标（根所有者 + 子节点查找）
    for target_info in target_infos:
        if target_info.get('type') not in {'iframe', 'page'}:
            continue
        attach_response = await browser_handler.execute_command(
            TargetCommands.attach_to_target(
                target_id=target_info.get('targetId', ''), flatten=True
            )
        )
        attached_session_id = attach_response.get('result', {}).get('sessionId')
        if not attached_session_id:
            continue

        frame_tree = await self._get_frame_tree_for(browser_handler, attached_session_id)
        root_frame = (frame_tree or {}).get('frame', {})
        root_frame_id = root_frame.get('id', '')

        # 直接匹配：content_frame_id 等于该目标的根 frame ID
        if root_frame_id and root_frame_id == content_frame_id:
            return (
                browser_handler,
                attached_session_id,
                root_frame_id,
                root_frame.get('url'),
            )

        # 优先尝试根据 backend_node_id 匹配根 frame 的所有者
        if root_frame_id and backend_node_id is not None:
            owner_backend_id = await self._owner_backend_for(
                owner_handler, owner_session_id, root_frame_id
            )
            if owner_backend_id == backend_node_id:
                return (
                    browser_handler,
                    attached_session_id,
                    root_frame_id,
                    root_frame.get('url'),
                )

        # 备用：查找 parentId 等于 content_frame_id 的子 frame
        child_frame_id = IFrameContextResolver._find_child_by_parent(
            frame_tree, content_frame_id
        )
        if child_frame_id:
            return browser_handler, attached_session_id, child_frame_id, None

    return None, None, None, None
```

**结果**：

- **如果 OOPIF 已解析**：我们现在有了 `sessionId`、`session_handler` 和 `frameId`；进入步骤 4。
- **如果解析失败**：抛出 `InvalidIFrame` 异常（在 `_ensure_iframe_context` 中处理）。

---

#### **步骤 4：创建隔离世界**

**目标**：在已解析的 frame 中创建一个独立的 JavaScript 执行上下文。

**方法**：`Page.createIsolatedWorld(frameId, worldName='pydoll::iframe::<frameId>', grantUniversalAccess=true)`

**参数**：
- `frameId`：在其中创建隔离世界的 frame
- `worldName`：世界的标识符（用于调试）
- `grantUniversalAccess`：允许跨域访问（自动化需要）

**响应**：`{ executionContextId: 42 }`

**代码**：

```python
# 源自 pydoll/elements/web_element.py
@staticmethod
async def _create_isolated_world_for_frame(
    frame_id: str,
    handler: ConnectionHandler,
    session_id: Optional[str],
) -> int:
    """为给定的 frame 创建一个隔离世界。"""
    create_command = PageCommands.create_isolated_world(
        frame_id=frame_id,
        world_name=f'pydoll::iframe::{frame_id}',
        grant_universal_access=True,
    )
    if session_id:
        create_command['sessionId'] = session_id
    create_response: CreateIsolatedWorldResponse = await handler.execute_command(create_command)
    execution_context_id = create_response.get('result', {}).get('executionContextId')
    if not execution_context_id:
        raise InvalidIFrame('无法为 iframe 创建隔离世界')
    return execution_context_id
```

**为什么需要隔离世界**：

- **隔离**：我们的自动化 JavaScript 不会干扰 iframe 的 JavaScript
- **反检测**：iframe 无法轻易检测到我们的存在
- **一致性**：无论 iframe 的脚本环境如何，行为都是可预测的

**结果**：我们有了一个 `executionContextId` 用于在 iframe 中运行 JavaScript。

---

#### **步骤 5：将 Iframe 文档固定为运行时对象**

**目标**：获取对 iframe 的 `document.documentElement`（iframe 的 `<html>` 元素）的 `objectId` 引用。

**方法**：`Runtime.evaluate(expression='document.documentElement', contextId=executionContextId)`

**为什么我们需要这个**：

- 以便在 iframe 内部执行**相对查询**（如 `element.querySelector()`）
- `objectId` 允许使用 `Runtime.callFunctionOn(objectId, ...)`，并将 `this` 绑定到 iframe 的文档

**代码**：

```python
# 源自 pydoll/elements/web_element.py
async def _set_iframe_document_object_id(self, execution_context_id: int) -> None:
    """在 iframe 上下文中评估 document.documentElement 并缓存其 object id。"""
    evaluate_command = RuntimeCommands.evaluate(
        expression='document.documentElement',
        context_id=execution_context_id,
    )
    if self._iframe_context and self._iframe_context.session_id:
        evaluate_command['sessionId'] = self._iframe_context.session_id
    evaluate_response: EvaluateResponse = await (
        (self._iframe_context.session_handler if self._iframe_context else None)
        or self._connection_handler
    ).execute_command(evaluate_command)
    result_object = evaluate_response.get('result', {}).get('result', {})
    document_object_id = result_object.get('objectId')
    if not document_object_id:
        raise InvalidIFrame('无法获取 iframe 的文档引用')
    if self._iframe_context:
        self._iframe_context.document_object_id = document_object_id
```

**结果**：`_IFrameContext` 现在已完全填充并缓存在 `WebElement` 上。

---

#### **步骤 6：缓存和传播上下文**

**目标**：将解析的上下文存储在 iframe 元素上，并将其传播到在 iframe 中找到的所有子元素。

**缓存**：

```python
# 源自 pydoll/elements/web_element.py
def _init_iframe_context(
    self,
    frame_id: str,
    document_url: Optional[str],
    session_handler: Optional[ConnectionHandler],
    session_id: Optional[str],
) -> None:
    """在此元素上初始化并缓存 iframe 上下文。"""
    self._iframe_context = _IFrameContext(frame_id=frame_id, document_url=document_url)
    # 清理路由属性（这些是用于嵌套 iframe 的）
    if hasattr(self, '_routing_session_handler'):
        delattr(self, '_routing_session_handler')
    if hasattr(self, '_routing_session_id'):
        delattr(self, '_routing_session_id')
    # 如果需要，存储 OOPIF 路由
    if session_handler and session_id:
        self._iframe_context.session_handler = session_handler
        self._iframe_context.session_id = session_id
```

**传播**（在 iframe 内部查找元素时）：

```python
# 源自 pydoll/elements/mixins/find_elements_mixin.py
def _apply_iframe_context_to_element(
    self, element: WebElement, iframe_context: _IFrameContext | None
) -> None:
    """将 iframe 上下文传播到新创建的元素。"""
    if not iframe_context:
        return
    
    # 如果子元素也是一个 iframe，设置路由
    if getattr(element, 'is_iframe', False):
        element._routing_session_handler = (
            iframe_context.session_handler or self._connection_handler
        )
        element._routing_session_id = iframe_context.session_id
        element._routing_parent_frame_id = iframe_context.frame_id
        return
    
    # 否则，注入父 iframe 的上下文
    element._iframe_context = iframe_context
```

**为什么传播很重要**：

- 在 iframe 内部找到的元素会继承 iframe 的上下文
- 这确保了后续操作（点击、键入、查找嵌套元素）自动使用正确的路由
- 嵌套的 iframes 接收路由信息，以便它们可以相对于父 iframe 解析自己的上下文

---

## 会话路由和扁平化模式

### 扁平化会话模型

正如在 [深度解析 → 基础 → CDP](./cdp.md) 中讨论的，传统的 CDP 对每个目标使用单独的 WebSocket 连接。**扁平化模式 (Flattened mode)** 是一种优化，所有目标共享一个 WebSocket 连接，命令使用 `sessionId` 进行路由。

```mermaid
graph TB
    subgraph "传统模式"
        WS1[WebSocket 1] --> MainPage[主页面目标]
        WS2[WebSocket 2] --> Iframe1[OOPIF 目标 1]
        WS3[WebSocket 3] --> Iframe2[OOPIF 目标 2]
    end
    
    subgraph "扁平化模式"
        WS[单个 WebSocket] --> Router{CDP 路由器}
        Router -->|sessionId: null| MainPage2[主页面目标]
        Router -->|sessionId: session-1| Iframe3[OOPIF 目标 1]
        Router -->|sessionId: session-2| Iframe4[OOPIF 目标 2]
    end
```

### 会话路由如何工作

**附加到 OOPIF 时**：

```python
response = await handler.execute_command(
    TargetCommands.attach_to_target(target_id="iframe-target-id", flatten=True)
)
session_id = response['result']['sessionId']  # 例如 "8E6C...-1234"
```

**向该 OOPIF 发送命令时**：

```python
command = PageCommands.get_frame_tree()
command['sessionId'] = 'session-1'  # 路由到 OOPIF
response = await handler.execute_command(command)
```

浏览器的 CDP 实现会根据 `sessionId` 将命令路由到正确的目标。

### Pydoll 的命令路由

Pydoll 元素发送的每个命令都会自动路由到正确的目标：

```python
# 源自 pydoll/elements/mixins/find_elements_mixin.py
def _resolve_routing(self) -> tuple[ConnectionHandler, Optional[str]]:
    """为当前上下文解析 handler 和 sessionId。"""
    # 检查元素是否具有带 OOPIF 路由的 iframe 上下文
    iframe_context = getattr(self, '_iframe_context', None)
    if iframe_context and getattr(iframe_context, 'session_handler', None):
        return iframe_context.session_handler, getattr(iframe_context, 'session_id', None)
    
    # 检查元素是否从父 iframe 继承了路由
    routing_handler = getattr(self, '_routing_session_handler', None)
    if routing_handler is not None:
        return routing_handler, getattr(self, '_routing_session_id', None)
    
    # 默认：使用标签页的主连接
    return self._connection_handler, None

async def _execute_command(
    self, command: Command[T_CommandParams, T_CommandResponse]
) -> T_CommandResponse:
    """通过解析的 handler 执行 CDP 命令（60 秒超时）。"""
    handler, session_id = self._resolve_routing()
    if session_id:
        command['sessionId'] = session_id
    return await handler.execute_command(command, timeout=60)
```

**路由逻辑**：

1. **OOPIF iframe 内的元素**：使用 `iframe_context.session_id` 和 `iframe_context.session_handler`
2. **嵌套 iframe（OOPIF 的子节点）**：使用继承的 `_routing_session_id` 和 `_routing_session_handler`
3. **常规元素或进程内 iframe**：使用主连接 (`_connection_handler`)，无 `sessionId`

### 扩展的命令类型

为了使 `sessionId` 类型安全，Pydoll 扩展了 `Command` TypedDict：

```python
# 源自 pydoll/protocol/base.py
class Command(TypedDict, Generic[T_CommandParams, T_CommandResponse]):
    """所有命令的基础结构。"""
    id: NotRequired[int]
    method: str
    params: NotRequired[T_CommandParams]
    sessionId: NotRequired[str]  # 为扁平化会话路由添加
```

这允许类型检查器将 `command['sessionId'] = '...'` 识别为有效，而无需抑制类型警告。

---

## 性能考量

### 缓存策略

**首次访问是昂贵的**：

- `DOM.describeNode`：1 次往返
- Frame 树检索：1+ 次往返（主目标 + OOPIF 目标）
- 每个 frame 的 `DOM.getFrameOwner`：N 次往返（最坏情况下）
- `Target.getTargets` + 附加：1 + M 次往返（M = OOPIF 目标数量）
- `Page.createIsolatedWorld`：1 次往返
- `Runtime.evaluate` (文档)：1 次往返

**总计**：根据页面结构，可能需要 5-20+ 次往返。

**后续访问是 O(1)**：

- `iframe_context` 缓存在 `WebElement` 实例上
- 多次访问 `await iframe.iframe_context` 会立即返回缓存的值
- 在 iframe 中找到的所有元素都会继承上下文（无需重新解析）

### 优化：直接子目标查找

在 `_resolve_oopif_by_parent` 中，Pydoll 首先按 `parentFrameId` 检查直接子节点：

```python
direct_children = [
    target_info
    for target_info in target_infos
    if target_info.get('type') in {'iframe', 'page'}
    and target_info.get('parentFrameId') == content_frame_id
]
if direct_children:
    # 立即附加，跳过扫描所有目标
```

**为什么这有帮助**：

- 大多数 OOPIFs 都正确设置了 `parentFrameId`
- 避免了推测性地附加到每个目标
- 在常见情况下，将往返次数从 O(目标数量) 减少到 O(1)

### 异步并行解析（未来增强）

目前，frame 所有者匹配是顺序的（逐个检查每个 frame）。未来的优化可以并行化：

```python
# 当前（顺序）
for frame_node in frames:
    owner = await self._owner_backend_for(...)
    if owner == backend_node_id:
        return frame_node['id']

# 潜在（并行）
results = await asyncio.gather(*(
    self._owner_backend_for(..., frame['id'])
    for frame in frames
))
for i, owner in enumerate(results):
    if owner == backend_node_id:
        return frames[i]['id']
```

这将把延迟从 `N * RTT` 减少到 `RTT`（其中 RTT = 往返时间）。

---

## 失败模式和调试

### 常见失败场景

#### 1. **InvalidIFrame: 无法解析 frameId**

**原因**：

- iframe 是动态创建的，尚未完全初始化
- iframe 设置了限制性的 sandbox 策略（被沙盒化）
- 网络问题延迟了 iframe 加载

**解决方案**：

- **等待 iframe**：使用带超时的 `await tab.find(id='iframe', timeout=10)`
- **检查 sandbox 属性**：限制性沙盒 (`<iframe sandbox>`) 可能会阻止某些 CDP 操作
- **重试策略**：实现带指数退避的重试逻辑

**调试**：

```python
try:
    iframe = await tab.find(id='problem-iframe')
    context = await iframe.iframe_context
except InvalidIFrame as e:
    # 检查我们拥有的信息
    node_info = await iframe._describe_node(object_id=iframe._object_id)
    print(f"节点信息: {node_info}")
    
    # 手动检查 frame 树
    frame_tree = await WebElement._get_frame_tree_for(tab._connection_handler, None)
    print(f"Frame 树: {frame_tree}")
```

#### 2. **InvalidIFrame: 无法创建隔离世界**

**原因**：

- 在解析步骤之间，Frame 已被销毁/导航离开
- Chrome 错误（罕见）

**解决方案**：

- **重新解析上下文**：清除缓存的上下文并重新访问
- **检查导航**：确保 iframe 在解析期间没有导航

**调试**：

```python
# 清除缓存并重试
iframe._iframe_context = None
context = await iframe.iframe_context
```

#### 3. **InvalidIFrame: 无法获取文档引用**

**原因**：

- 隔离世界已创建，但文档尚未准备好
- Frame 即将导航

**解决方案**：

- 等待 frame 加载：使用 Page 事件检测 `Page.frameNavigated` 或 `Page.loadEventFired`
- 稍作延迟后重试

#### 4. **会话路由失败（命令超时或返回错误）**

**原因**：

- OOPIF 目标已分离（页面导航，iframe 被移除）
- `sessionId` 已过时

**解决方案**：

- **重新附加到目标**：创建一个新的 `ConnectionHandler` 并重新解析 OOPIF
- **验证目标**：调用 `Target.getTargets()` 检查目标是否仍然存在

**调试**：

```python
# 检查会话是否仍然有效
targets = await handler.execute_command(TargetCommands.get_targets())
active_sessions = [t['targetId'] for t in targets['result']['targetInfos']]
print(f"活动目标: {active_sessions}")

if iframe._iframe_context and iframe._iframe_context.session_id:
    print(f"我们的会话: {iframe._iframe_context.session_id}")
```

### 诊断工具

#### 启用 CDP 日志记录

```python
import logging
logging.basicConfig(level=logging.DEBUG)
logger = logging.getLogger('pydoll')
logger.setLevel(logging.DEBUG)
```

这将记录所有 CDP 命令和响应，有助于追踪 iframe 解析步骤。

#### 检查 iframe 上下文

```python
iframe = await tab.find(id='my-iframe')
ctx = await iframe.iframe_context

print(f"Frame ID: {ctx.frame_id}")
print(f"文档 URL: {ctx.document_url}")
print(f"执行上下文 ID: {ctx.execution_context_id}")
print(f"文档对象 ID: {ctx.document_object_id}")
print(f"会话 ID (OOPIF): {ctx.session_id}")
print(f"会话 Handler: {ctx.session_handler}")
```

---

## 结论

Pydoll 的 iframe 处理代表了对 CDP frame 管理能力的复杂实现。通过理解：

- **DOM**：树结构和节点标识
- **Iframes**：独立的文档上下文和安全边界
- **OOPIFs**：站点隔离和基于目标的架构
- **CDP 域**：Page、DOM、Target、Runtime 的协调
- **执行上下文**：用于纯净自动化的隔离世界
- **标识符**：backendNodeId、frameId、targetId、sessionId、executionContextId、objectId 之间的关系
- **解析管道**：用于查找 frames 的多阶段回退策略
- **会话路由**：扁平化模式和自动命令路由

您就能理解为什么 Pydoll 消除了手动上下文切换。这种复杂性是真实存在的，但 Pydoll 将其抽象在一个简单、直观的 API 背后：

```python
iframe = await tab.find(id='login-frame')
username = await iframe.find(name='username')
await username.type_text('user@example.com')
```

三行代码。没有上下文切换。没有目标附加。没有会话管理。它就是能用。

---

## 进一步阅读

- **CDP 规范**：[Chrome DevTools 协议 - Page 域](https://chromedevtools.github.io/devtools-protocol/tot/Page/)
- **CDP 规范**：[Chrome DevTools 协议 - DOM 域](https://chromedevtools.github.io/devtools-protocol/tot/DOM/)
- **CDP 规范**：[Chrome DevTools 协议 - Target 域](https://chromedevtools.github.io/devtools-protocol/tot/Target/)
- **CDP 规范**：[Chrome DevTools 协议 - Runtime 域](https://chromedevtools.github.io/devtools-protocol/tot/Runtime/)
- **Chromium 站点隔离**：[站点隔离 - Chromium 项目](https://www.chromium.org/Home/chromium-security/site-isolation/)
- **内容脚本和隔离世界**：[Chrome 扩展 - 内容脚本](https://developer.chrome.com/docs/extensions/mv3/content_scripts/)
- **Pydoll 文档**：[深度解析 → 基础 → Chrome DevTools 协议](./cdp.md)
- **Pydoll 文档**：[功能 → 自动化 → IFrames](../../features/automation/iframes.md)

---

!!! tip "设计理念"
    Pydoll iframe 处理的目标是**符合人体工程学的自动化**：编写代码时就好像 iframes 不存在一样，让库来处理复杂性。这次深度解析展示了幕后发生的事情——但在您的自动化脚本中，您永远不必考虑它。

================================================
FILE: docs/zh/deep-dive/fundamentals/index.md
================================================
# 核心基础

**掌握了基础，其他一切都会变得更容易。**

本节涵盖了 Pydoll 赖以运行的 **基石技术**：Chrome 开发者工具协议 (CDP)、基于 WebSocket 的异步通信以及 Python 的类型系统集成。这些不仅仅是实现细节，它们是使 Pydoll 快速、强大且类型安全的 **基本设计决策**。

## 为什么基础知识很重要

大多数自动化框架都将其通信层抽象化，留给您一个“黑匣子”，它能正常工作直到出现问题。当出现问题时，如果不了解底层机制，调试和优化将变得困难。

**Pydoll 采用了不同的方法**：我们揭示并解释基础知识，使您能够同时作为 **框架用户** 和 **协议工程师** 工作。

!!! quote "第一性原理的力量"
    **“通晓大道者，万物皆在其中。”** - 宫本武藏
    
    理解 CDP、异步通信和类型系统不仅仅是为了 Pydoll，它是为了从 **核心层面理解现代浏览器自动化是如何工作的**。这些知识可以转移到任何基于 CDP 的工具和任何异步 Python 项目中。

## 三大支柱

### 1. Chrome 开发者工具协议 (CDP)
**[→ 阅读 CDP 深度解析](./cdp.md)**

**驱动现代浏览器自动化的协议。**

CDP 是 Chrome 的原生调试协议，与 Chrome 开发者工具 (F12) 使用的协议相同。通过直接与 CDP 通信，Pydoll 能够：

- **消除 WebDriver**（没有 Selenium 开销，没有 geckodriver/chromedriver 中间件）
- **获得深度控制**（修改请求、拦截事件、执行特权操作）
- **实现原生速度**（直接 WebSocket 通信，无 HTTP 轮询）
- **变得无法检测**（没有 `navigator.webdriver`，没有 WebDriver 指纹）

**您将学到什么：**

- CDP 如何将功能组织到各个域中（Page, Network, DOM, Fetch 等）
- 驱动反应式自动化的命令/事件架构
- 为什么基于 CDP 的工具 **从根本上比 Selenium 更强大**
- 如何阅读 CDP 文档并扩展 Pydoll

**为什么这很重要**：CDP 不仅仅是 Pydoll 的实现细节，它是现代浏览器自动化的基础。Puppeteer、Playwright 和类似的工具都使用 CDP。一次理解，知识可通用于多种工具。

---

### 2. 连接层
**[→ 阅读连接层架构](./connection-layer.md)**

**正确实现的异步通信。**

CDP 定义了您 **能做什么**，而连接层则定义了 Pydoll **如何** 与浏览器通信。在这里，协议消息变成了 Python 对象，async/await 模式实现了并发，WebSocket 提供了实时的双向通信。

**您将学到什么：**

- WebSocket 架构：持久连接、消息分帧、心跳维持
- async/await 模式：为什么 `async def` 和 `await` 能实现并发自动化
- 命令/响应关联：Pydoll 如何将响应与请求匹配
- 事件分发：浏览器事件如何触发 Python 回调
- 错误处理：超时管理、连接失败、优雅降级

**为什么这很重要**：连接层是 Pydoll 的通信骨干。理解它有助于：

- **有效调试**：检查 Python 和 Chrome 之间流动的消息
- **性能优化**：识别延迟来源并使操作并行化
- **扩展能力**：添加自定义 CDP 命令或修改现有行为

---

### 3. Python 类型系统集成
**[→ 阅读类型系统深度解析](./typing-system.md)**

**类型同时提供安全性和生产力。**

Python 的类型系统（自 3.5 版引入，此后每个版本都有增强）显著改善了开发体验。Pydoll 利用 `TypedDict`, `Literal`, `overload` 和泛型来提供：

- **IDE 自动补全** CDP 响应字段
- **类型检查** 以在运行时之前捕获错误 (`mypy`, `pyright`)
- **自文档化代码**（函数签名揭示了结构）
- **重构安全**（重命名字段，IDE 会更新所有用法）

**您将学到什么：**

- `TypedDict` 如何为 CDP 事件/响应结构建模
- 为什么 `overload` 为 `find()` / `query()` 提供了精确的返回类型
- 泛型（`TypeVar`, `Generic[T]`）如何实现灵活的命令构建
- 实用模式：注解回调、为异步函数添加类型、使用 `Literal`
- 工具集成：配置 mypy、利用 IDE 类型推断

**为什么这很重要**：类型提示在现代 Python 中变得越来越重要。Pydoll 全面的类型覆盖意味着：

- **更快的开发**：自动补全揭示了可用的字段和方法
- **更少的错误**：类型检查器在错误进入生产环境前捕获它们
- **更好的重构**：借助 IDE 支持，自信地更改签名

---

## 这些基础知识如何相互连接

理解 CDP、异步通信和类型系统如何 **协同工作** 是关键：

```mermaid
graph TB
    Python[Python 代码:<br/>await tab.go_to#40;url#41;]
    
    Python --> TypeSystem[类型系统:<br/>函数签名揭示了<br/>参数和返回类型]
    
    TypeSystem --> ConnectionLayer[连接层:<br/>将命令序列化为 JSON,<br/>通过 WebSocket 发送]
    
    ConnectionLayer --> CDP[CDP:<br/>浏览器接收<br/>Page.navigate 命令]
    
    CDP --> Browser[Chrome:<br/>执行导航,<br/>发出事件]
    
    Browser --> CDPEvents[CDP 事件:<br/>Page.loadEventFired,<br/>Network.requestWillBeSent]
    
    CDPEvents --> ConnectionLayer2[连接层:<br/>反序列化事件,<br/>分派给回调]
    
    ConnectionLayer2 --> TypedDicts[TypedDict:<br/>事件数据作为<br/>类型化字典]
    
    TypedDicts --> PythonCallback[Python 回调:<br/>IDE 通过类型推断<br/>显示可用字段]
```

**流程**：

1.  您编写带有 **类型注解** 的 Python 代码（类型系统）
2.  代码序列化为 JSON 并通过 **WebSocket** 发送（连接层）
3.  浏览器接收并执行 **CDP 命令**（CDP）
4.  浏览器将 **CDP 事件** 发回（CDP）
5.  事件反序列化为 **TypedDict 实例**（类型系统）
6.  您的回调接收到 **类型安全的事件对象**（类型系统）

每一层都 **放大** 了其他层的作用：

- 类型使 CDP 响应易于发现
- CDP 的事件模型支持了异步模式
- 异步通信使类型变得至关重要（这个响应上有哪些字段？）

## 学习路径

我们推荐以下进阶路径：

### 步骤 1: CDP (1-2 小时)
**[从这里开始: Chrome 开发者工具协议](./cdp.md)**

理解驱动一切的协议。学习域、命令、事件以及如何阅读 CDP 文档。

**成果**：您将知道如何查找和使用任何 CDP 功能，而不仅仅是 Pydoll 暴露的功能。

### 步骤 2: 连接层 (2-3 小时)
**[继续: 连接层架构](./connection-layer.md)**

深入了解 WebSocket 通信、异步模式和事件分发。

**成果**：您将确切理解消息如何在 Python 和 Chrome 之间流动，从而实现调试和优化。

### 步骤 3: 类型系统 (1-2 小时)
**[完成: Python 类型系统](./typing-system.md)**

学习 Pydoll 如何使用现代 Python 类型来实现安全性和生产力。

**成果**：您将编写出具有完整 IDE 支持的类型安全的自动化代码，在运行前捕获错误。

**总时间**：4-7 小时
**回报**：对基于 CDP 的自动化基础的 **永久理解**

## 先决条件

要从本节中获得最大收益：

- **Python 基础知识** - 函数、类、装饰器
- **基本的 async/await** - 理解 `async def` 和 `await` 关键字
- **熟悉 JSON** - 知道对象/数组如何序列化
- **浏览器开发者工具** - 使用过 Chrome 检查器 (F12)

**如果您是 Python 异步编程的新手**，请先阅读：[Real Python: Async IO in Python](https://realpython.com/async-io-python/)

## 超越基础

掌握了这些基础知识后，您就可以开始学习：

- **[内部架构](../architecture/browser-domain.md)** - Pydoll 的组件是如何组合在一起的
- **[网络与安全](../network/index.md)** - 理解代理所需的协议级知识
- **[指纹识别](../fingerprinting/index.md)** - 需要 CDP 知识的检测技术

## 常见问题

### “我需要理解这些才能使用 Pydoll 吗？”

**不需要**，但理解这些基础知识将使您更有效率。基本用法在没有这些知识的情况下也能正常工作。然而，当您需要：

- 调试为什么某些功能不工作
- 优化缓慢的自动化
- 使用自定义 CDP 命令扩展 Pydoll
- 理解错误消息
- 为项目做贡献

这些基础知识就会变得非常有用。

### “这是不是太底层了？”

这种详细程度是故意的。大多数框架隐藏了这些基础知识，但抽象是有代价的：

- 理解有助于更好的调试
- 可见性有助于优化
- 知识有助于扩展

通过教授基础知识，我们使您能够超越 Pydoll 开箱即用的功能。

### “我需要记住多少内容？”

**一点也不用。** 目标是建立心智模型，而不是记忆。阅读完这些部分后，您将培养出一种直觉：

- “这需要 CDP，我去查查协议文档”
- “这很慢是因为顺序 await，让我来并行化”
- “这个类型错误意味着我用错了字段名”

具体细节会淡忘，但理解会长存。

## 理念

这些基础知识代表了持久的知识：

- **CDP** 是 Chrome 的原生协议，并持续演进
- **Async/await** 是 Python 的并发标准
- **类型系统** 在 Python 中变得越来越重要（PEP 484 以后）

学习这些概念将为您的整个开发生涯提供价值。

---

## 准备好奠定您的基础了吗？

从 **[Chrome 开发者工具协议](./cdp.md)** 开始，理解驱动一切的协议。然后逐步学习连接层和类型系统，以完善您的基础理解。

**这就是自动化成为工程学的地方。**

---

!!! tip "完成基础知识之后"
    一旦您掌握了这些概念，您会在 Pydoll 架构中 **无处不在** 地看到它们：
    
    - Browser/Tab/WebElement 都使用 **连接层**
    - 网络事件都遵循 **CDP 的事件模型**
    - 所有响应都使用 **TypedDict** 来确保类型安全
    
    基础知识与 Pydoll 并不分离，它们 **就是** Pydoll 的基石。

================================================
FILE: docs/zh/deep-dive/fundamentals/typing-system.md
================================================
# Python 的类型系统与 Pydoll

Pydoll 广泛利用 Python 的类型系统来提供出色的 IDE 支持、及早发现错误并使 API 自文档化。本指南将解释类型提示的基础知识，以及 Pydoll 如何使用它们来增强您的开发体验。

## 类型提示基础

类型提示是可选的注解，用于指定变量、参数或返回值应该是什么类型的值。它们不影响运行时行为，但能启用强大的工具。

### 简单类型提示

```python
# 基本类型
name: str = "Pydoll"
port: int = 9222
is_headless: bool = False
quality: float = 0.85

# 函数注解
def navigate(url: str, timeout: int = 30) -> bool:
    # ... 实现
    return True
```

### 容器类型

```python
from typing import List, Dict, Optional

# 列表和字典
urls: List[str] = ['https://example.com', 'https://google.com']
headers: Dict[str, str] = {'User-Agent': 'MyBot/1.0'}

# 可选值 (可以是 None)
target_id: Optional[str] = None

# 现代语法 (Python 3.9+)
urls: list[str] = ['https://example.com']
headers: dict[str, str] = {'User-Agent': 'MyBot/1.0'}
```

!!! tip "Python 3.9+ 语法"
    Pydoll 的代码库使用较旧的 `List[]`、`Dict[]` 语法以实现向后兼容，但如果您使用的是 Python 3.9+，您可以在代码中使用小写的 `list[]`、`dict[]`。

## TypedDict：结构化字典

TypedDict 允许您定义具有特定键和值类型的字典结构。这在 Pydoll 的 CDP 协议定义中被 **大量使用**。

### 基本 TypedDict

```python
from typing import TypedDict

class UserInfo(TypedDict):
    name: str
    age: int
    email: str

# IDE 完全知道存在哪些键
user: UserInfo = {
    'name': 'Alice',
    'age': 30,
    'email': 'alice@example.com'
}

# 自动补全功能可用！
print(user['name'])  # IDE 建议: name, age, email
```

### Pydoll 如何使用 TypedDict

Pydoll 将 **每个 CDP 命令、响应和事件** 定义为 TypedDict。这意味着您的 IDE 完全知道哪些属性可用：

```python
# 来自 pydoll/protocol/page/methods.py
class CaptureScreenshotParams(TypedDict, total=False):
    """captureScreenshot 的参数。"""
    format: ScreenshotFormat
    quality: int
    clip: Viewport
    fromSurface: bool
    captureBeyondViewport: bool
    optimizeForSpeed: bool

class CaptureScreenshotResult(TypedDict):
    """captureScreenshot 命令的结果。"""
    data: str
```

当您调用返回 CDP 响应的方法时，您的 IDE 会自动补全响应键：

```python
async def example():
    response = await tab._execute_command(PageCommands.capture_screenshot())
    
    # IDE 知道这是 CaptureScreenshotResponse
    # 并建议 'result' -> 'data'
    screenshot_data = response['result']['data']  # 完整的自动补全！
```

### 可选字段与必选字段

TypedDict 使用 `NotRequired[]` 支持可选字段：

```python
from typing import TypedDict, NotRequired

# 来自 pydoll/protocol/network/methods.py
class GetCookiesParams(TypedDict):
    """用于检索浏览器 cookie 的参数。"""
    urls: NotRequired[list[str]]  # 此字段是可选的
```

`total=False` 标志使 **所有** 字段都可选：

```python
class CaptureScreenshotParams(TypedDict, total=False):
    format: ScreenshotFormat  # 所有字段都可选
    quality: int
    clip: Viewport
```

!!! info "自动补全的魔力"
    当您键入 `response['` 时，您的 IDE 会显示所有可用的键及其类型。这就是 TypedDict 的超能力在起作用！

## Enums (枚举)：类型安全的常量

枚举提供了类型安全的常量，您的 IDE 可以自动补全。Pydoll 广泛使用它们来表示 CDP 的值。

### 基本枚举

```python
from enum import Enum

class ScreenshotFormat(str, Enum):
    JPEG = 'jpeg'
    PNG = 'png'
    WEBP = 'webp'

# IDE 自动补全可用的格式
format = ScreenshotFormat.PNG  # 类型是 ScreenshotFormat
print(format.value)  # 'png'
```

### Pydoll 的枚举用法

```python
from pydoll.constants import Key
from pydoll.protocol.page.types import ScreenshotFormat
from pydoll.protocol.input.types import KeyModifier

# 查找元素 - 使用 kwargs，而非枚举
element = await tab.find(id='submit-btn')
element = await tab.find(class_name='btn-primary')
element = await tab.find(tag_name='button')

# 键盘输入 - IDE 建议所有键
await element.press_keyboard_key(Key.ENTER)
await element.press_keyboard_key(Key.TAB)
await element.press_keyboard_key(Key.ESCAPE)

# 修饰键是整数枚举 (用于特殊键)
await element.press_keyboard_key(Key.TAB, modifiers=KeyModifier.SHIFT)

# 截图格式枚举
await tab.take_screenshot('file.webp', format=ScreenshotFormat.WEBP)
```

!!! tip "枚举自动补全"
    键入 `Key.` 或 `ScreenshotFormat.`，您的 IDE 就会显示所有可用选项。再也不用记忆字符串了！

## 函数重载 (Function Overloads)

重载允许一个函数根据其参数返回不同的类型。Pydoll 使用它来提供精确的类型信息。

### 基本重载示例

```python
from typing import overload

# 重载签名 (不执行)
@overload
def process(data: str) -> str: ...

@overload
def process(data: int) -> int: ...

# 实际实现
def process(data):
    return data * 2

# IDE 知道返回类型
result1 = process("hello")  # 类型: str
result2 = process(42)       # 类型: int
```

### Pydoll 的重载用法

`find()` 和 `query()` 方法根据 `find_all` 参数返回不同的类型：

```python
# 来自 pydoll/elements/mixins/find_elements_mixin.py
class FindElementsMixin:
    @overload
    async def find(
        self, find_all: Literal[False] = False, **kwargs
    ) -> WebElement: ...
    
    @overload
    async def find(
        self, find_all: Literal[True], **kwargs
    ) -> list[WebElement]: ...
    
    async def find(
        self, find_all: bool = False, **kwargs
    ) -> Union[WebElement, list[WebElement]]:
        # 实现...
```

在您的代码中：

```python
# find_all=False (默认) - IDE 知道返回类型是 WebElement
button = await tab.find(id='submit-btn')
await button.click()  # 单个元素的方法可用！

# find_all=True - IDE 知道返回类型是 list[WebElement]
buttons = await tab.find(class_name='btn', find_all=True)
for btn in buttons:  # IDE 知道这是一个列表！
    await btn.click()

# query() 也是如此
element = await tab.query('#submit-btn')  # 类型: WebElement
elements = await tab.query('.btn', find_all=True)  # 类型: list[WebElement]
```

!!! tip "智能类型推断"
    您的 IDE 会根据 `find_all` 参数自动知道您获取的是单个元素还是列表。无需类型转换或类型断言！

## 泛型 (Generic Types)

泛型就像“类型容器”，可以与不同类型一起工作，同时保留类型信息。可以把它们想象成能适应您放入任何东西的模板。

### 理解泛型：一个简单的类比

想象一个可以装任何东西的 `Box`。没有泛型：

```python
# 没有泛型 - IDE 不知道里面是什么
class Box:
    def __init__(self, content):
        self.content = content
    
    def get(self):
        return self.content

my_box = Box("hello")
item = my_box.get()  # 类型: Unknown - 可能是任何东西！
```

使用泛型：

```python
from typing import Generic, TypeVar

T = TypeVar('T')  # T 是一个 "类型占位符"

class Box(Generic[T]):
    def __init__(self, content: T):
        self.content = content
    
    def get(self) -> T:
        return self.content

# 现在 IDE 完全知道每个盒子里装的是什么
string_box: Box[str] = Box("hello")
item1 = string_box.get()  # 类型: str

number_box: Box[int] = Box(42)
item2 = number_box.get()  # 类型: int

# List 是一个内置的泛型
numbers: list[int] = [1, 2, 3]  # 包含 int 的列表
names: list[str] = ["Alice", "Bob"]  # 包含 str 的列表
```

!!! tip "泛型简化了类型提示"
    泛型让您只需编写一个可重用的 `list[T]`，它能适应您放入的任何东西，而无需为每种可能的列表类型编写 `Union[List[str], List[int], List[float], ...]`。

### 现实世界中的泛型示例

```python
from typing import TypeVar, Generic

T = TypeVar('T')

class Response(Generic[T]):
    """一个通用的 API 响应包装器。"""
    def __init__(self, data: T, status: int):
        self.data = data
        self.status = status
    
    def get_data(self) -> T:
        return self.data

# 每个响应都保留了其数据类型
user_response: Response[dict] = Response({"name": "Alice"}, 200)
user_data = user_response.get_data()  # 类型: dict

count_response: Response[int] = Response(42, 200)
count = count_response.get_data()  # 类型: int
```

### Pydoll 如何使用泛型

Pydoll 的 CDP 命令系统使用泛型来确保响应类型与命令匹配：

```python
# 来自 pydoll/protocol/base.py
from typing import Generic, TypeVar

T_CommandParams = TypeVar('T_CommandParams')
T_CommandResponse = TypeVar('T_CommandResponse')

class Command(TypedDict, Generic[T_CommandParams, T_CommandResponse]):
    """所有命令的基础结构。"""
    id: NotRequired[int]
    method: str
    params: NotRequired[T_CommandParams]

class Response(TypedDict, Generic[T_CommandResponse]):
    """所有响应的基础结构。"""
    id: int
    result: T_CommandResponse
```

这意味着当您执行一个命令时，响应类型会被自动推断：

```python
# PageCommands.navigate 返回 Command[NavigateParams, NavigateResult]
command = PageCommands.navigate('https://example.com')

# ConnectionHandler.execute_command 保留了泛型类型
response = await connection_handler.execute_command(command)

# IDE 知道 response['result'] 是 NavigateResult (不仅仅是 "any dict")
frame_id = response['result']['frameId']  # 自动补全可用！
loader_id = response['result']['loaderId']  # 所有字段都已知！
```

!!! info "为什么泛型在 Pydoll 中很重要"
    没有泛型，每个 CDP 响应的类型都只是 `dict[str, Any]`，您将失去所有的自动补全功能。有了泛型，IDE 能根据您发送的命令知道每个响应的确切结构。

## 联合类型 (Union Types)

联合 (Union) 表示值可能是多种类型之一：

```python
from typing import Union

# 可以是字符串或整数
identifier: Union[str, int] = "user-123"
identifier = 456  # 也有效

# 现代语法 (Python 3.10+)
identifier: str | int = "user-123"
```

### Pydoll 的联合类型用法

```python
# 文件路径可以是字符串或 Path 对象
from pathlib import Path

async def upload_file(files: Union[str, Path, list[Union[str, Path]]]):
    # 处理多种输入类型
    pass

# 所有这些都有效：
await tab.expect_file_chooser('/path/to/file.txt')
await tab.expect_file_chooser(Path('/path/to/file.txt'))
await tab.expect_file_chooser(['/file1.txt', Path('/file2.txt')])
```

## Pydoll 中的实际好处

### 1. 智能自动补全

您的 IDE 会建议可用的键、方法和值：

```python
from pydoll.protocol.page.events import PageEvent
from pydoll.protocol.network.types import ResourceType
from pydoll.protocol.input.types import KeyModifier
from pydoll.constants import Key

# 自动补全事件名称
await tab.on(PageEvent.LOAD_EVENT_FIRED, callback)
await tab.on(PageEvent.JAVASCRIPT_DIALOG_OPENING, callback)

# 自动补全资源类型
await tab.enable_fetch_events(resource_type=ResourceType.XHR)
await tab.enable_fetch_events(resource_type=ResourceType.DOCUMENT)

# 自动补全按键
await element.press_keyboard_key(Key.ENTER)
await element.press_keyboard_key(Key.TAB, modifiers=KeyModifier.SHIFT)

# 自动补全 find() 中的 kwargs
element = await tab.find(id='submit-btn')  # IDE 建议: id, class_name, tag_name, 等.
```

### 2. 及早发现错误

像 mypy 或 Pylance 这样的类型检查器会在运行时之前捕获错误：

```python
# 类型检查器会捕获这个
await tab.take_screenshot('file.png', quality='high')  # 错误: quality 必须是 int

# 类型检查器会捕获这个
event = await tab.find(id='button')
await tab.on(event, callback)  # 错误: event 是 WebElement, 不是 str

# 正确的
await tab.take_screenshot('file.png', quality=90)
await tab.on(PageEvent.LOAD_EVENT_FIRED, callback)
```

### 3. 自文档化的代码

类型可作为内联文档：

```python
# 您立即知道每个参数期望什么
async def take_screenshot(
    self,
    path: Optional[str] = None,
    quality: int = 100,
    beyond_viewport: bool = False,
    as_base64: bool = False,
) -> Optional[str]:
    pass
```

### 4. CDP 响应导航

自信地浏览复杂的 CDP 响应：

```python
# 来自 pydoll/protocol/browser/methods.py
class GetVersionResult(TypedDict):
    protocolVersion: str
    product: str
    revision: str
    userAgent: str
    jsVersion: str

# 在您的代码中
version_info = await browser.get_version()

# IDE 建议所有可用的键
print(version_info['product'])         # 自动补全！
print(version_info['userAgent'])       # 自动补全！
print(version_info['protocolVersion']) # 自动补全！
```

## 类型检查您的代码

### 使用 Pylance (VS Code)

Pylance 在 VS Code 中提供实时类型检查：

1.  安装 Pylance 扩展
2.  在设置中设置类型检查模式：

```json
{
    "python.analysis.typeCheckingMode": "basic"  // 或 "strict"
}
```

现在您可以获得即时反馈：

```python
from pydoll.browser.chromium import Chrome

async def main():
    async with Chrome() as browser:
        tab = await browser.start()
        
        # 当您键入时，Pylance 会显示参数类型
        await tab.go_to('https://example.com', timeout=30)
        
        # Pylance 会对错误的类型发出警告
        await tab.take_screenshot(quality='high')  # 警告！
```

### 使用 mypy

运行 mypy 来检查您的整个项目：

```bash
pip install mypy
mypy your_script.py
```

示例输出：

```
your_script.py:10: error: Argument "quality" to "take_screenshot" has incompatible type "str"; expected "int"
Found 1 error in 1 file (checked 1 source file)
```

## Pydoll 的协议类型系统

Pydoll 的 `protocol/` 目录包含整个 Chrome DevTools 协议的全面类型定义：

```
pydoll/protocol/
├── base.py              # 泛型 Command, Response, CDPEvent 类型
├── browser/
│   ├── events.py        # BrowserEvent 枚举, 事件参数 TypedDicts
│   ├── methods.py       # Browser 方法枚举, 参数/结果 TypedDicts
│   └── types.py         # Browser 域类型 (Bounds, PermissionType, 等.)
├── dom/
│   ├── events.py        # DOM 事件定义
│   ├── methods.py       # DOM 命令定义
│   └── types.py         # DOM 类型 (Node, BackendNode, 等.)
├── page/
│   ├── events.py        # Page 事件 (LOAD_EVENT_FIRED, 等.)
│   ├── methods.py       # Page 方法 (navigate, captureScreenshot, 等.)
│   └── types.py         # Page 类型 (Frame, ScreenshotFormat, 等.)
├── network/
│   └── ...              # Network 域类型
└── ...                  # 其他 CDP 域
```

### 示例：完整的类型流

让我们追踪一个从命令到响应的完整类型流：

```python
# 1. 方法枚举 (protocol/page/methods.py)
class PageMethod(str, Enum):
    CAPTURE_SCREENSHOT = 'Page.captureScreenshot'

# 2. 参数 TypedDict (protocol/page/methods.py)
class CaptureScreenshotParams(TypedDict, total=False):
    format: ScreenshotFormat
    quality: int
    clip: Viewport

# 3. 结果 TypedDict (protocol/page/methods.py)
class CaptureScreenshotResult(TypedDict):
    data: str

# 4. 命令创建 (commands/page_commands.py)
class PageCommands:
    @staticmethod
    def capture_screenshot(
        format: Optional[ScreenshotFormat] = None,
        quality: Optional[int] = None,
        ...
    ) -> Command[CaptureScreenshotParams, CaptureScreenshotResult]:
        return {
            'method': PageMethod.CAPTURE_SCREENSHOT,
            'params': {...}
        }

# 5. 在 Tab 中使用 (browser/tab.py)
class Tab:
    async def take_screenshot(...) -> Optional[str]:
        response: CaptureScreenshotResponse = await self._execute_command(
            PageCommands.capture_screenshot(...)
        )
        screenshot_data = response['result']['data']  # 完全类型化！
        return screenshot_data
```

每一步都保留了类型信息，让您在整个过程中都能获得自动补全和类型检查！

## 最佳实践

### 1. 让 Pydoll 的类型引导您

不要抗拒类型，它们是来帮助您的：

```python
# 好的：使用 kwargs (IDE 自动补全参数名称)
element = await tab.find(id='submit-btn')
button = await tab.find(class_name='btn-primary')

# 好的：在适用的地方使用枚举
from pydoll.constants import Key
await element.press_keyboard_key(Key.ENTER)

# 避免：魔法字符串
await element.press_keyboard_key('Enter')  # 没有自动补全，容易出错
```

### 2. 在您的 IDE 中探索类型

将鼠标悬停在变量上以查看其类型：

```python
# 悬停在 'response' 上查看: Response[CaptureScreenshotResult]
response = await tab._execute_command(PageCommands.capture_screenshot(...))

# 悬停在 'data' 上查看: str
data = response['result']['data']
```


### 3. 不要过度注解

Python 的类型推断很智能，不要注解所有东西：

```python
# 过多
name: str = "Alice"
count: int = 5
is_active: bool = True

# 让 Python 推断简单的字面量
name = "Alice"
count = 5
is_active = True

# 当类型不明显时进行注解
from typing import Optional

result: Optional[WebElement] = await tab.find(id='missing', raise_exc=False)
```

## 了解更多

要更深入地了解 Python 的类型系统和 CDP 协议：

- **[Python typing 文档](https://docs.python.org/3/library/typing.html)**：官方 Python 类型参考
- **[PEP 484](https://peps.python.org/pep-0484/)**：原始的类型提示提案
- **[Chrome DevTools Protocol](https://chromedevtools.github.io/devtools-protocol/)**：CDP 文档
- **[深入探讨：CDP](./cdp.md)**：Pydoll 如何实现 CDP
- **[API 参考：Protocol](../../api/protocol/base.md)**：Pydoll 的协议类型定义

类型系统将 Pydoll 从一个简单的自动化库转变为一个 **类型安全、自文档化、IDE 友好** 的框架。它能在错误发生之前捕获它们，并使探索 API 变得轻而易举！

================================================
FILE: docs/zh/deep-dive/guides/index.md
================================================
# 实用指南

**理论与实践相结合，为应对真实自动化挑战提供可行的模式。**

“深度探讨”的其他部分探讨了 **基础知识** 和 **架构**，而本节则为常见的自动化场景提供了 **经过实战检验的实用指南**。这些不是学术练习，而是通过生产使用提炼出来的模式。

## 指南的目的

您已经学过：

- **[基础知识](../fundamentals/cdp.md)** - CDP、异步、类型
- **[架构](../architecture/browser-domain.md)** - 内部设计模式
- **[网络](../network/index.md)** - 协议和代理
- **[指纹识别](../fingerprinting/index.md)** - 检测与规避

那么现在呢？**您如何将这些知识应用于实际问题？**

这就是指南的作用：**连接理论与实践**。

!!! quote "实践智慧"
    **“理论上，理论和实践是一样的。实践中，它们并非如此。”** - 尤吉·贝拉 (Yogi Berra)
    
    指南将复杂的技术知识提炼为您可以立即使用的 **可操作模式**。它们向您展示了在生产中 **哪些方法有效**，而不仅仅是理论上可能的东西。

## 当前指南

### CSS 选择器 vs XPath
**[→ 阅读选择器指南](./selectors-guide.md)**

**用数据和最佳实践解决永恒的辩论。**

在 CSS 选择器和 XPath 之间做出选择，无关偏好。关键在于理解 **权衡**、**性能特征** 和 **可维护性**。

**您将学到什么**：

- **语法比较** - 常见模式的并排示例
- **性能基准** - 真实的测量数据，而非神话
- **强大功能 vs 简洁性** - 当 CSS 不够用时（文本匹配、轴）
- **浏览器支持** - 兼容性和边缘情况
- **最佳实践** - 何时使用哪种，应避免的反模式
- **复杂示例** - 解决真实世界的选择器挑战

**为什么这很重要**：元素定位是自动化的 **基础**。选错工具，您将永远与选择器作斗争。明智地选择，自动化将变得简单明了。

---

## 即将推出

### Asyncio 与并发自动化
**将在未来版本中推出**

**深入探讨 Python 的 asyncio：事件循环内部原理、实用的并发模式以及真实世界的示例。**

理解 asyncio 对 Pydoll 至关重要。本指南将全面分析 Python 的事件循环、并发原语，以及如何将它们应用于浏览器自动化而避免陷阱。

**将涵盖**：

- **事件循环内部原理**：`asyncio.run()` 是如何工作的、任务调度和执行流程
- **Async/Await 深入探讨**：协程、future 和异步状态机
- **并发原语**：`gather()`、`create_task()`、`TaskGroup` 以及何时使用它们
- **速率限制**：信号量、队列和节流策略
- **真实世界示例**：多标签页抓取、并行表单填充、协调的浏览器实例
- **常见陷阱**：阻塞事件循环、任务取消、异常传播
- **性能分析**：分析异步代码、识别瓶颈、优化 I/O

**为什么这很重要**：Asyncio 是 Pydoll 架构的动力源泉。掌握它，您就能在没有竞争条件或状态损坏的情况下实现真正的并发自动化。

---

### 架构模式与健壮的选择器
**将在未来版本中推出**

**PageObject 模式、可维护的选择器以及用于可扩展自动化的架构方法。**

从临时脚本转向结构化、可维护的自动化架构。学习可从简单脚本扩展到生产系统的模式。

**将涵盖**：

- **PageObject 模式**：封装页面结构、减少重复、提高可维护性
- **健壮的选择器策略**：构建能在页面变更后幸存的选择器，避免脆弱的定位器
- **组件抽象**：用于常见 UI 模式（模态框、下拉菜单、表格）的可重用组件
- **等待策略**：超越简单超时的智能等待模式
- **状态管理**：跨页面和流程管理自动化状态
- **测试模式**：如何构建易于测试的自动化代码
- **真实世界架构**：可用于生产的项目结构和组织

**为什么这很重要**：临时脚本和可维护自动化系统之间的区别在于架构。学习使您的代码能够适应变化的模式。

---

## 指南的理念

指南遵循一致的原则：

### 1. 可用于生产的代码
所有示例都是 **完整且经过测试的**，而不是伪代码或简化的演示。您可以复制粘贴并根据需要进行调整。

### 2. 真实世界的场景
指南解决的是在生产自动化中遇到的 **实际问题**，而不是虚构的例子。

### 3. 权衡分析
当存在多种方法时，指南会客观地 **比较** 它们，并提供优缺点，而不仅仅是“这是一种方法”。

### 4. 渐进的复杂性
从简单开始，逐步增加复杂性。首先是基本模式，然后是边缘情况和高级变体。

### 5. 突出显示反模式
明确展示 **不该做什么**，以及通过代码审查或生产调试发现的常见错误。

## 如何使用指南

指南是 **参考材料**，而不是按顺序学习的教程：

- **浏览** 与您当前问题相关的模式
- **收藏** 您需要重复使用的指南
- **调整** 示例以适应您的特定情境
- **组合** 来自多个指南的模式

不要按顺序从头到尾阅读。

不要在不理解权衡的情况下盲目复制。

不要使用过时的模式（请检查发布日期）。

## 贡献指南

有值得分享的模式吗？指南是 **由社区驱动的**：

**怎样才是一篇好的指南**：

- 解决了在生产中遇到的 **实际问题**
- 提供了 **可工作的代码**，而不仅仅是概念
- 比较了 **多种方法** 并进行了权衡
- 明确指出了 **常见错误**
- 解释了 **为什么**，而不仅仅是 **怎么做**

有关提交指南，请参阅 [贡献](../../CONTRIBUTING.md)。

## 指南 vs 功能文档

**对两者的区别感到困惑吗？**

| | 功能文档 | 深度探讨指南 |
|---|---|---|
| **目的** | 教授 Pydoll 能做什么 | 展示如何解决问题 |
| **范围** | 单个方法/功能 | 多个功能组合 |
| **深度** | API 参考 + 示例 | 模式 + 权衡 + 最佳实践 |
| **顺序** | 按组件构建 | 按问题构建 |
| **示例** | 简单、独立 | 复杂、可用于生产 |

**使用功能文档**：学习 Pydoll 的 API
**使用指南**：解决真实的自动化挑战

## 超越指南

掌握了实用模式之后：

- **[架构](../architecture/browser-domain.md)** - 理解模式为何有效
- **[网络](../network/index.md)** - 网络层面的优化
- **[指纹识别](../fingerprinting/evasion-techniques.md)** - 反检测技术

指南提供 **直接价值**。架构提供 **深刻理解**。两者都能让您变得高效。

---

## 准备好学习实用模式了吗？

从 **[CSS 选择器 vs XPath](./selectors-guide.md)** 开始，掌握元素定位——这是所有自动化的基础。

**更多指南即将推出。请给本仓库加星以保持更新！**

---

!!! tip "请求一篇指南"
    您有什么希望被记录下来的自动化模式吗？请提交一个标题为“指南请求：[主题]”的 issue，描述：
    
    - 您试图解决的问题
    - 您到目前为止尝试了什么
    - 为什么现有文档没有涵盖它
    
    我们将根据社区需求优先安排指南。

## 快速参考

**现已推出：**

- [CSS 选择器 vs XPath](./selectors-guide.md)

**即将推出：**

- Asyncio 与并发自动化
- 架构模式与健壮的选择器

**时间表**：根据社区反馈和生产经验添加新指南。

================================================
FILE: docs/zh/deep-dive/guides/selectors-guide.md
================================================
# CSS 选择器 vs XPath：完整指南

使用 `query()` 方法时，您有两种强大的选择器语言可供选择：CSS 选择器和 XPath。了解何时以及如何使用每种语言对于有效的元素定位至关重要。

## 根本差异

| 方面 | CSS 选择器 | XPath |
|---|---|---|
| **语法** | 简单，类似 CSS | XML 路径语言 |
| **性能** | 更快 (浏览器原生支持) | 稍慢 |
| **方向** | 只能向下和横向遍历 | 可以向任何方向遍历 |
| **文本匹配** | 有限 (伪选择器) | 强大的文本函数 |
| **复杂性** | 最适合简单到中等的情况 | 擅长处理复杂关系 |
| **可读性** | Web 开发人员更直观 | 学习曲线更陡峭 |

## 何时使用 CSS 选择器

CSS 选择器是以下情况的理想选择：

- 通过 ID、类或标签进行简单的元素选择
- 直接的父子关系
- 具有简单模式的属性匹配
- 对性能要求严格的场景
- 在 DOM 中向下遍历时

```python
# 简洁高效的 CSS 示例
await tab.query("#login-form")
await tab.query(".submit-button")
await tab.query("div.container > p.intro")
await tab.query("input[type='email'][required]")
await tab.query("ul.menu li:first-child")
```

## 何时使用 XPath

XPath 是以下情况的理想选择：

- 复杂的文本匹配和部分文本搜索
- 向上遍历到父元素
- 查找相对于兄弟元素的元素
- 选择器中的条件逻辑
- 复杂的 DOM 关系

```python
# 强大的 XPath 示例
await tab.query("//button[contains(text(), 'Submit')]")
await tab.query("//input[@name='email']/parent::div")
await tab.query("//td[text()='John']/following-sibling::td[2]")
await tab.query("//div[contains(@class, 'product') and @data-price > 100]")
```

## CSS 选择器语法参考

### 基本选择器

```python
# 元素选择器
await tab.query("div")              # 第一个 <div> 元素
await tab.query("div", find_all=True)  # 所有 <div> 元素
await tab.query("button")           # 第一个 <button> 元素

# ID 选择器
await tab.query("#username")        # id="username" 的元素

# 类选择器
await tab.query(".submit-btn")      # 第一个 class="submit-btn" 的元素
await tab.query(".submit-btn", find_all=True)  # 所有带该类的元素
await tab.query(".btn.primary")     # 第一个同时具有这两个类的元素

# 通用选择器
await tab.query("*", find_all=True) # 所有元素
```

### 组合器

```python
# 后代组合器 (空格)
await tab.query("div p")            # <div> 内的第一个 <p>
await tab.query("div p", find_all=True)  # <div> 内的所有 <p> (任何深度)

# 子组合器 (>)
await tab.query("div > p")          # <div> 直接子元素中的第一个 <p>
await tab.query("div > p", find_all=True)  # 所有作为直接子元素的 <p>

# 相邻兄弟组合器 (+)
await tab.query("h1 + p")           # 紧跟 <h1> 后的 <p>

# 通用兄弟组合器 (~)
await tab.query("h1 ~ p")           # <h1> 后的第一个 <p> 兄弟元素
await tab.query("h1 ~ p", find_all=True)  # <h1> 后的所有 <p> 兄弟元素
```

### 属性选择器

```python
# 属性存在
await tab.query("input[required]")                # 第一个带 'required' 的 input
await tab.query("input[required]", find_all=True) # 所有带 'required' 的 input

# 属性等于
await tab.query("input[type='email']")            # 第一个 email input
await tab.query("input[type='email']", find_all=True)  # 所有 email input

# 属性包含单词
await tab.query("div[class~='active']")           # 第一个 class 中包含 'active' 的 div

# 属性以...开头
await tab.query("a[href^='https://']")            # 第一个 HTTPS 链接
await tab.query("a[href^='https://']", find_all=True)  # 所有 HTTPS 链接

# 属性以...结尾
await tab.query("img[src$='.png']")               # 第一个 PNG 图像
await tab.query("img[src$='.png']", find_all=True)     # 所有 PNG 图像

# 属性包含子字符串
await tab.query("a[href*='example']")             # 第一个 href 中包含 'example' 的链接
await tab.query("a[href*='example']", find_all=True)   # 所有 href 中包含 'example' 的链接

# 不区分大小写匹配
await tab.query("input[type='text' i]")           # 不区分大小写匹配
```

### 伪类

```python
# 结构伪类
await tab.query("li:first-child")                 # 作为第一个子元素的第一个 <li>
await tab.query("li:last-child")                  # 作为最后一个子元素的第一个 <li>
await tab.query("li:nth-child(2)")                # 作为第二个子元素的第一个 <li>
await tab.query("li:nth-child(odd)", find_all=True)  # 所有奇数位置的 <li>
await tab.query("li:nth-child(even)", find_all=True)  # 所有偶数位置的 <li>
await tab.query("li:nth-child(3n)", find_all=True)    # 每第 3 个 <li>

# 类型伪类
await tab.query("p:first-of-type")                # 兄弟元素中的第一个 <p>
await tab.query("p:last-of-type")                 # 兄弟元素中的最后一个 <p>
await tab.query("p:nth-of-type(2)")               # 兄弟元素中的第二个 <p>

# 状态伪类
await tab.query("input:enabled")                  # 第一个启用的 input
await tab.query("input:enabled", find_all=True)   # 所有启用的 input
await tab.query("input:disabled")                 # 第一个禁用的 input
await tab.query("input:checked")                  # 第一个选中的 checkbox/radio
await tab.query("input:focus")                    # 当前获得焦点的 input

# 其他有用的伪类
await tab.query("div:empty")                      # 第一个空元素
await tab.query("div:empty", find_all=True)       # 所有空元素
await tab.query("div:not(.exclude)")              # 第一个没有 'exclude' 类的 div
await tab.query("div:not(.exclude)", find_all=True)  # 所有没有 'exclude' 类的 div
```

## XPath 语法参考

### 基本路径表达式

```python
# 绝对路径 (从根开始)
await tab.query("/html/body/div")                 # 处于该精确路径的第一个 div

# 相对路径 (从任何地方开始)
await tab.query("//div")                          # 第一个 <div> 元素
await tab.query("//div", find_all=True)           # 所有 <div> 元素
await tab.query("//div/p")                        # 任何 <div> 内的第一个 <p>
await tab.query("//div/p", find_all=True)         # 任何 <div> 内的所有 <p>

# 当前节点
await tab.query("./div")                          # 相对于当前的第一个 <div>

# 父节点
await tab.query("..")                             # 当前节点的父节点
```

### 属性选择

```python
# 基本属性匹配
await tab.query("//input[@type='email']")         # 第一个 email input
await tab.query("//input[@type='email']", find_all=True)  # 所有 email input
await tab.query("//div[@id='content']")           # id='content' 的 div

# 多个属性
await tab.query("//input[@type='text' and @required]")  # 第一个匹配项
await tab.query("//input[@type='text' and @required]", find_all=True)  # 所有匹配项
await tab.query("//div[@class='card' or @class='panel']")  # 第一个 card 或 panel

# 属性存在
await tab.query("//button[@disabled]")            # 第一个 disabled button
await tab.query("//button[@disabled]", find_all=True)  # 所有 disabled button
```

## XPath 轴 (方向导航)

XPath 的真正威力来自于它能够在 DOM 树中向任何方向导航。

### 轴参考表

| 轴 | 方向 | 描述 | 示例 |
|---|---|---|---|
| `child::` | 向下 | 仅直接子元素 | `//div/child::p` |
| `descendant::` | 向下 | 所有后代 (任何深度) | `//div/descendant::a` |
| `parent::` | 向上 | 直接父元素 | `//input/parent::div` |
| `ancestor::` | 向上 | 所有祖先 (任何深度) | `//span/ancestor::div` |
| `following-sibling::` | 横向 | 当前元素之后的所有兄弟元素 | `//h1/following-sibling::p` |
| `preceding-sibling::` | 横向 | 当前元素之前的所有兄弟元素 | `//p/preceding-sibling::h1` |
| `following::` | 向前 | 当前节点之后的所有节点 | `//h1/following::*` |
| `preceding::` | 向后 | 当前节点之前的所有节点 | `//h1/preceding::*` |
| `ancestor-or-self::` | 向上 | 祖先 + 当前节点 | `//div/ancestor-or-self::*` |
| `descendant-or-self::` | 向下 | 后代 + 当前节点 | `//div/descendant-or-self::*` |
| `self::` | 当前 | 仅当前节点 | `//div/self::div` |
| `attribute::` | 属性 | 当前节点的属性 | `//div/attribute::class` |

!!! info "简写语法"
    - `//div` 是 `/descendant-or-self::node()/child::div` 的简写
    - `//div/p` 是 `//div/child::p` 的简写
    - `@id` 是 `attribute::id` 的简写
    - `..` 是 `parent::node()` 的简写

### 实用轴示例

```python
# 导航到父元素
await tab.query("//input[@name='email']/parent::div")
await tab.query("//span[@class='error']/..")       # 简写

# 查找祖先元素
await tab.query("//input/ancestor::form")          # 第一个祖先 <form>
await tab.query("//button/ancestor::div[@class='modal']")

# 兄弟元素导航
await tab.query("//label[text()='Email:']/following-sibling::input")
await tab.query("//h2/following-sibling::p[1]")    # <h2> 后的第一个 <p>
await tab.query("//h2/following-sibling::p", find_all=True)  # <h2> 后的所有 <p>
await tab.query("//button/preceding-sibling::input[last()]")

# 复杂关系
await tab.query("//tr/td[1]/following-sibling::td[2]")  # 第一行中的第 3 个单元格
await tab.query("//tr/td[1]/following-sibling::td[2]", find_all=True)  # 所有行中的第 3 个单元格
```

## XPath 函数

### 文本函数

```python
# 精确文本匹配
await tab.query("//button[text()='Submit']")

# 包含文本
await tab.query("//p[contains(text(), 'welcome')]")

# 以...开头
await tab.query("//a[starts-with(@href, 'https://')]")

# 文本规范化 (移除多余的空白)
await tab.query("//button[normalize-space(text())='Submit']")

# 字符串长度
await tab.query("//input[string-length(@value) > 5]")

# 字符串连接
await tab.query("//div[concat(@data-first, @data-last)='JohnDoe']")
```

### 数字函数

```python
# 位置匹配
await tab.query("//li[position()=1]")              # 第一个 <li>
await tab.query("//li[position() > 3]", find_all=True)  # 第 3 个之后的所有 <li>
await tab.query("//li[last()]")                    # 最后一个 <li>
await tab.query("//li[last()-1]")                  # 倒数第二个

# 计数
await tab.query("//ul[count(li) > 5]")             # 第一个包含超过 5 个 li 的 <ul>
await tab.query("//ul[count(li) > 5]", find_all=True)  # 所有包含超过 5 个 li 的 <ul>

# 数值运算
await tab.query("//div[@data-price > 100]")        # 第一个 price > 100 的 div
await tab.query("//div[@data-price > 100]", find_all=True)  # 所有
await tab.query("//div[number(@data-stock) = 0]")  # 第一个 stock = 0 的
```

### 布尔函数

```python
# 布尔逻辑
await tab.query("//div[@visible='true' and @enabled='true']")  # 第一个匹配项
await tab.query("//input[@type='text' or @type='email']")  # 第一个 text 或 email
await tab.query("//input[@type='text' or @type='email']", find_all=True)  # 所有
await tab.query("//button[not(@disabled)]")        # 第一个启用的 button
await tab.query("//button[not(@disabled)]", find_all=True)  # 所有启用的 button

# 存在性检查
await tab.query("//div[child::p]")                 # 第一个有 <p> 子元素的 div
await tab.query("//div[child::p]", find_all=True)  # 所有有 <p> 子元素的 div
await tab.query("//div[not(child::*)]")            # 第一个空 div
await tab.query("//div[not(child::*)]", find_all=True)  # 所有空 div
```

## XPath 谓词 (Predicates)

谓词使用方括号 `[]` 中的条件来过滤节点集。

```python
# 位置谓词
await tab.query("(//div)[1]")                      # 文档中的第一个 <div>
await tab.query("(//div)[last()]")                 # 文档中的最后一个 <div>
await tab.query("//ul/li[3]")                      # <ul> 中的第一个第 3 个 <li>
await tab.query("//ul/li[3]", find_all=True)       # 每个 <ul> 中的所有第 3 个 <li>

# 多个谓词 (AND 逻辑)
await tab.query("//input[@type='text'][@required]")  # 第一个匹配项
await tab.query("//div[@class='product'][position() < 4]", find_all=True)  # 前 3 个

# 属性谓词
await tab.query("//div[@data-id='123']")
await tab.query("//a[contains(@class, 'button')]")  # 第一个匹配的链接
await tab.query("//input[starts-with(@name, 'user')]")  # 第一个匹配的 input
```

## 真实世界示例：复杂元素查找

让我们使用一个真实的 HTML 结构来演示高级选择器。

### 示例 HTML 结构

```html
<div class="dashboard">
    <header>
        <h1>User Dashboard</h1>
        <nav class="menu">
            <a href="/home" class="active">Home</a>
            <a href="/profile">Profile</a>
            <a href="/settings">Settings</a>
        </nav>
    </header>
    
    <main>
        <section class="products">
            <h2>Available Products</h2>
            <table id="products-table">
                <thead>
                    <tr>
                        <th>Product Name</th>
                        <th>Price</th>
                        <th>Stock</th>
                        <th>Actions</th>
                    </tr>
                </thead>
                <tbody>
                    <tr data-product-id="101">
                        <td>Laptop</td>
                        <td class="price">$999</td>
                        <td class="stock">15</td>
                        <td>
                            <button class="btn-edit">Edit</button>
                            <button class="btn-delete">Delete</button>
                        </td>
                    </tr>
                    <tr data-product-id="102">
                        <td>Mouse</td>
                        <td class="price">$25</td>
                        <td class="stock">0</td>
                        <td>
                            <button class="btn-edit">Edit</button>
                            <button class="btn-delete" disabled>Delete</button>
                        </td>
                    </tr>
                    <tr data-product-id="103">
                        <td>Keyboard</td>
                        <td class="price">$75</td>
                        <td class="stock">8</td>
                        <td>
                            <button class="btn-edit">Edit</button>
                            <button class="btn-delete">Delete</button>
                        </td>
                    </tr>
                </tbody>
            </table>
        </section>
        
        <section class="user-form">
            <h2>User Information</h2>
            <form id="user-form">
                <div class="form-group">
                    <label for="username">Username:</label>
                    <input type="text" id="username" name="username" required>
                    <span class="error-message" style="display:none;">Invalid username</span>
                </div>
                <div class="form-group">
                    <label for="email">Email:</label>
                    <input type="email" id="email" name="email" required>
                    <span class="error-message" style="display:none;">Invalid email</span>
                </div>
                <div class="form-group">
                    <input type="checkbox" id="newsletter" name="newsletter">
                    <label for="newsletter">Subscribe to newsletter</label>
                </div>
                <button type="submit" class="btn-primary">Save Changes</button>
                <button type="button" class="btn-secondary">Cancel</button>
            </form>
        </section>
    </main>
</div>
```

### 挑战 1：查找活动的导航链接

**目标**：找到当前活动的导航链接。

```python
# CSS 选择器
active_link = await tab.query("nav.menu a.active")

# XPath
active_link = await tab.query("//nav[@class='menu']//a[@class='active']")

# 获取其文本
text = await active_link.text
print(text)  # "Home"
```

### 挑战 2：查找特定产品的编辑按钮

**目标**：找到产品 "Mouse" 的编辑按钮 (不知道其行位置)。

```python
# XPath (推荐用于此情况)
edit_button = await tab.query(
    "//tr[td[text()='Mouse']]//button[contains(@class, 'btn-edit')]"
)

# 备选方案：使用 following-sibling
edit_button = await tab.query(
    "//td[text()='Mouse']/following-sibling::td//button[@class='btn-edit']"
)
```

!!! tip "为什么这里使用 XPath？"
    CSS 选择器无法向上遍历找到行，然后再向下找到按钮。XPath 在 DOM 中自由移动的能力使这变得轻而易举。

### 挑战 3：查找所有价格超过 $50 的产品

**目标**：获取价格大于 $50 的所有表格行。

```python
# 带有数值比较的 XPath
expensive_products = await tab.query(
    "//tr[number(translate(td[@class='price'], '$,', '')) > 50]",
    find_all=True
)

# 更易读的版本：对于更简单的情况使用 contains
# 这会查找价格包含特定金额的产品
products = await tab.query("//tr[contains(td[@class='price'], '$75')]", find_all=True)
```

!!! note "文本到数字的转换"
    `translate()` 函数移除了 `$` 和 `,` 字符，然后 `number()` 将其转换为数值进行比较。

### 挑战 4：查找所有缺货产品

**目标**：找到所有库存为 0 的产品。

```python
# XPath
out_of_stock = await tab.query(
    "//tr[td[@class='stock' and text()='0']]",
    find_all=True
)

# 备选方案：查找所有行并检查库存
rows = await tab.query("//tbody/tr[td[@class='stock']/text()='0']", find_all=True)
```

### 挑战 5：通过标签查找输入字段

**目标**：首先定位其标签，然后找到 email 输入字段。

```python
# XPath：从 label 出发，使用 following-sibling 定位其后的 input
email_input = await tab.query("//label[text()='Email:']/following-sibling::input")

# 备选方案：使用 for 属性
email_input = await tab.query("//input[@id=(//label[text()='Email:']/@for)]")

# 更通用的：按标签文本查找
username_input = await tab.query(
    "//label[contains(text(), 'Username')]/following-sibling::input"
)
```

### 挑战 6：查找 Email 字段旁的错误消息

**目标**：获取出现在 email 输入字段旁边的错误消息 span。

```python
# XPath - 查找 email input 的错误兄弟元素
error_span = await tab.query(
    "//input[@id='email']/following-sibling::span[@class='error-message']"
)

# 备选方案：从父 div 导航
error_span = await tab.query(
    "//input[@id='email']/parent::div//span[@class='error-message']"
)

# 检查可见性
is_visible = await error_span.is_visible()
```

### 挑战 7：查找提交按钮 (而不是取消按钮)

**目标**：找到提交按钮，排除取消按钮。

```python
# CSS 选择器 (简单)
submit_button = await tab.query("button[type='submit']")
submit_button = await tab.query("button.btn-primary")

# 带文本的 XPath
submit_button = await tab.query("//button[text()='Save Changes']")

# 排除其他的 XPath
submit_button = await tab.query(
    "//button[@type='submit' and not(@class='btn-secondary')]"
)
```

### 挑战 8：查找所有必填的表单字段

**目标**：获取表单中所有必填的 input 字段。

```python
# CSS 选择器 (简洁)
required_fields = await tab.query(
    "#user-form input[required]",
    find_all=True
)

# XPath
required_fields = await tab.query(
    "//form[@id='user-form']//input[@required]",
    find_all=True
)

# 验证
for field in required_fields:
    field_name = await field.get_attribute("name")
    print(f"Required: {field_name}")
```

### 挑战 9：查找第一个未禁用的删除按钮

**目标**：找到第一个未被禁用的删除按钮。

```python
# CSS 选择器
first_enabled_delete = await tab.query("button.btn-delete:not([disabled])")

# XPath
first_enabled_delete = await tab.query(
    "//button[contains(@class, 'btn-delete') and not(@disabled)]"
)

# 获取所有启用的删除按钮
all_enabled = await tab.query(
    "//button[@class='btn-delete' and not(@disabled)]",
    find_all=True
)
```

### 挑战 10：按多个条件查找表格行

**目标**：查找库存 > 0 且价格 < $100 的产品。

```python
# 具有复杂逻辑的 XPath
available_affordable = await tab.query(
    """
    //tr[
        number(td[@class='stock']) > 0 
        and 
        number(translate(td[@class='price'], '$', '')) < 100
    ]
    """,
    find_all=True
)

# 对于每个匹配的产品
for row in available_affordable:
    cells = await row.query("td", find_all=True)
    product_name = await cells[0].text
    print(f"Available: {product_name}")
```

### 挑战 11：导航复杂关系

**目标**：从删除按钮获取同一行中的产品名称。

```python
# 从删除按钮开始
delete_button = await tab.query("//tr[@data-product-id='101']//button[@class='btn-delete']")

# 导航到父行，然后到第一个单元格
product_name_cell = await delete_button.query("./ancestor::tr/td[1]")
product_name = await product_name_cell.text
print(product_name)  # "Laptop"

# 备选方案：首先获取整行
row = await delete_button.query("./ancestor::tr")
product_id = await row.get_attribute("data-product-id")
print(product_id)  # "101"
```

### 挑战 12：同时查找复选框及其标签

**目标**：找到 newsletter 复选框并验证其标签。

```python
# 查找复选框
checkbox = await tab.query("#newsletter")

# 使用 'for' 属性获取关联的标签
label = await tab.query("//label[@for='newsletter']")
label_text = await label.text
print(label_text)  # "Subscribe to newsletter"

# 备选方案：从复选框导航到标签
label = await checkbox.query("//following::label[@for='newsletter']")

# 检查是否选中
is_checked = await checkbox.is_checked()
```

## 高级模式：动态构建选择器

处理动态内容时，您可能需要以编程方式构建选择器：

```python
def _xpath_literal(value: str) -> str:
    """Return ``value`` as a safely quoted XPath 1.0 string literal.

    XPath 1.0 has no escape character inside string literals, so a
    backslash does not neutralise a quote. The only safe options are to
    pick the quote style the value does not contain or, when it contains
    both kinds, to assemble the value with ``concat()``.
    """
    if "'" not in value:
        return f"'{value}'"
    if '"' not in value:
        return f'"{value}"'
    # Both quote kinds are present: split on the single quote and glue the
    # pieces back together with a double-quoted single-quote literal.
    pieces = (f"'{piece}'" for piece in value.split("'"))
    return "concat(" + ", \"'\", ".join(pieces) + ")"


async def find_product_by_name(tab, product_name: str):
    """Find the table row whose cell text equals ``product_name``.

    The name is embedded as a properly quoted XPath literal, so quotes in
    the name can neither break the expression nor inject extra predicates.

    Args:
        tab: Object exposing an awaitable ``query(xpath)`` method.
        product_name: Exact text of the product-name cell.

    Returns:
        Whatever ``tab.query`` returns for the generated XPath.
    """
    xpath = f"//tr[td[text()={_xpath_literal(product_name)}]]"
    return await tab.query(xpath)

async def find_table_cell(tab, row_text: str, column_index: int):
    """Find one cell, addressed by row content and 1-based column position.

    Args:
        tab: Object exposing an awaitable ``query(xpath)`` method.
        row_text: Text that some cell of the wanted row must contain.
        column_index: 1-based position of the wanted ``<td>`` in that row.

    Returns:
        Whatever ``tab.query`` returns for the generated XPath.

    Raises:
        ValueError: If ``column_index`` cannot be converted to an integer.
    """
    # int() guarantees that only a number reaches the positional predicate.
    position = int(column_index)
    xpath = (
        f"//tr[td[contains(text(), {_xpath_literal(row_text)})]]"
        f"/td[{position}]"
    )
    return await tab.query(xpath)

# 用法
product_row = await find_product_by_name(tab, "Laptop")
price_cell = await find_table_cell(tab, "Laptop", 2)
price = await price_cell.text
print(price)  # "$999"
```

## 性能比较

```python
import asyncio
import time

async def benchmark_selectors(tab, iterations=100):
    """Compare how long equivalent CSS and XPath queries take.

    Each selector is run ``iterations`` times with ``find_all=True`` and the
    elapsed time is printed, followed by the XPath/CSS ratio.

    Args:
        tab: Object exposing an awaitable ``query(selector, find_all=...)``.
        iterations: Number of times each selector is executed.
    """

    async def _time_queries(selector):
        # perf_counter() is monotonic and high resolution; time.time() can
        # jump when the system clock is adjusted, which skews a benchmark.
        started = time.perf_counter()
        for _ in range(iterations):
            await tab.query(selector, find_all=True)
        return time.perf_counter() - started

    # Warm-up query so one-time setup cost is not charged to the CSS run.
    await tab.query("#products-table")

    css_time = await _time_queries("#products-table tbody tr")
    xpath_time = await _time_queries(
        "//table[@id='products-table']//tbody//tr"
    )

    print(f"CSS: {css_time:.3f}s")
    print(f"XPath: {xpath_time:.3f}s")
    # Skip the ratio when the CSS run was too fast to measure.
    if css_time > 0:
        print(f"CSS is {xpath_time/css_time:.2f}x faster")

# 典型结果：对于简单选择器，CSS 快 1.2-1.5 倍
```

!!! warning "性能 vs 可读性"
    虽然 CSS 选择器通常更快，但对于单个查询，差异通常可以忽略不计（毫秒级）。请选择使您的代码更具可读性和可维护性的选择器，特别是对于 XPath 擅长的复杂关系。

## 选择器最佳实践

### 1. 优先使用稳定的选择器

```python
# 好的：使用语义属性
await tab.query("#user-email")
await tab.query("[data-testid='submit-button']")
await tab.query("input[name='username']")

# 避免：基于结构的脆弱选择器
await tab.query("div > div > div:nth-child(3) > input")
await tab.query("body > div:nth-child(2) > form > div:first-child")
```

### 2. 使用能工作的最简单的选择器

```python
# 好的：简单高效
await tab.query("#login-form")
await tab.query(".submit-button")

# 避免：在不必要时过度复杂化
await tab.query("//div[@id='content']/descendant::form[@id='login-form']")
```

### 3. 适当组合 find() 和 query()

```python
# 使用 find() 进行简单的属性匹配
username = await tab.find(id="username")
submit = await tab.find(tag_name="button", type="submit")

# 使用 query() 处理复杂模式
active_link = await tab.query("nav.menu a.active")
error_msg = await tab.query("//input[@name='email']/following-sibling::span[@class='error']")
```

### 4. 为复杂的选择器添加注释

```python
# 查找包含产品 "Laptop" 的行中的 "Edit" 按钮
# XPath: 导航到带有 "Laptop" 文本的行, 然后查找编辑按钮
edit_button = await tab.query(
    "//tr[td[text()='Laptop']]//button[@class='btn-edit']"
)
```

## 结论

通过理解 CSS 选择器和 XPath，以及它们各自的优势和用例，您可以创建出健壮且可维护的浏览器自动化，以处理现代 Web 应用程序的复杂性。请记住：

- **使用 CSS 选择器** 进行简单的、对性能要求严格的选择
- **使用 XPath** 处理复杂关系、文本匹配和向上导航
- 编写选择器时，**选择稳定性** 而非简洁性
- **注释复杂的查询** 以保持代码的可读性

有关 Pydoll 内部如何使用这些选择器的更多信息，请参阅 [FindElements Mixin](../architecture/find-elements-mixin.md) 文档。

================================================
FILE: docs/zh/deep-dive/index.md
================================================
# 深度探讨：技术基础

**欢迎来到 Pydoll 的技术核心，在这里我们将探索驱动浏览器自动化的系统和协议。**

本节提供了关于网络抓取、浏览器自动化、网络协议和反检测技术的全面技术教育。我们不只关注使用模式，而是探讨底层机制，从第一个 TCP 数据包到最终渲染的像素。

## 是什么让这里与众不同

大多数自动化文档教您 **如何使用工具**。本节教您 **互联网实际上是如何工作的**，以及如何在每一层对其进行操控：

- **网络协议** (TCP/IP, TLS, HTTP/2) - 每个请求背后的无形基础
- **浏览器内部原理** (CDP, 渲染引擎, JavaScript 上下文) - Chrome 内部发生了什么
- **检测系统** (指纹识别, 行为分析, 代理检测) - 网站如何识别机器人
- **规避技术** (CDP 覆盖, 一致性强制, 人类模拟) - 如何变得无法检测

!!! quote "理念"
    **“任何足够先进的技术都与魔法无异。”**
    
    本节旨在通过解释底层系统来揭开浏览器自动化的神秘面纱。理解这些基础知识将使您在自动化工作中获得更好的控制力和可预测性。

## 知识的架构

本节分为 **五个渐进的层次**，每个层次都建立在上一层的基础上：

### 核心基础
**[→ 探索基础知识](./fundamentals/cdp.md)**

从基础开始：理解驱动 Pydoll 的协议和系统。

- **[Chrome 开发者工具协议](./fundamentals/cdp.md)** - Pydoll 如何绕过 WebDriver 与浏览器对话
- **[连接层](./fundamentals/connection-layer.md)** - WebSocket 架构、异步模式、实时 CDP
- **[Python 类型系统](./fundamentals/typing-system.md)** - 类型安全、用于 CDP 的 TypedDict、IDE 集成

**为什么从这里开始**：理解 CDP 和异步通信为理解浏览器自动化的所有其他方面奠定了基础。

---

### 内部架构
**[→ 探索架构](./architecture/browser-domain.md)**

更上一层楼：了解 Pydoll 的内部组件如何协同工作。

- **[浏览器域](./architecture/browser-domain.md)** - 进程管理、上下文、多配置文件自动化
- **[标签页域](./architecture/tab-domain.md)** - 标签页生命周期、并发操作、iframe 处理
- **[WebElement 域](./architecture/webelement-domain.md)** - 元素交互、Shadow DOM、属性处理
- **[FindElements Mixin](./architecture/find-elements-mixin.md)** - 选择器策略、DOM 遍历、优化
- **[事件架构](./architecture/event-architecture.md)** - 反应式事件系统、回调、异步分发
- **[浏览器请求架构](./architecture/browser-requests-architecture.md)** - 浏览器上下文中的 HTTP

**为什么这很重要**：了解内部架构可以揭示从表面使用中看不出来的优化机会和设计模式。

---

### 网络与安全
**[→ 探索网络与安全](./network/index.md)**

深入协议层：了解数据如何在互联网上传输。

- **[网络基础](./network/network-fundamentals.md)** - OSI 模型、TCP/UDP、WebRTC 泄露
- **[HTTP/HTTPS 代理](./network/http-proxies.md)** - 应用层代理、CONNECT 隧道
- **[SOCKS 代理](./network/socks-proxies.md)** - 会话层代理、UDP 支持、安全
- **[代理检测](./network/proxy-detection.md)** - 匿名级别、检测技术、规避
- **[构建代理服务器](./network/build-proxy.md)** - 完整的 HTTP 和 SOCKS5 实现
- **[法律与道德](./network/proxy-legal.md)** - GDPR、CFAA、合规性、负责任的使用

**关键见解**：网络特征是在操作系统级别确定的。声称的浏览器身份与网络级指纹之间的不匹配可以被复杂的反机器人系统检测到。

---

### 指纹识别
**[→ 探索指纹识别](./fingerprinting/index.md)**

了解浏览器自动化的检测系统和规避技术。

- **[网络指纹](./fingerprinting/network-fingerprinting.md)** - TCP/IP, TLS/JA3, p0f, Nmap, Scapy
- **[浏览器指纹](./fingerprinting/browser-fingerprinting.md)** - HTTP/2, Canvas, WebGL, JavaScript API
- **[规避技术](./fingerprinting/evasion-techniques.md)** - CDP 覆盖、一致性、实用代码

**关键见解**：每次连接都会揭示众多特征（canvas 渲染、TCP 窗口大小、TLS 密码顺序）。有效的隐蔽需要在所有检测层保持一致性。

---

### 实用指南
**[→ 探索指南](./guides/selectors-guide.md)**

应用您的知识：应对常见自动化挑战的实用指南。

- **[CSS 选择器 vs XPath](./guides/selectors-guide.md)** - 选择器语法、性能、最佳实践

**即将推出**：更多实用指南，将技术知识融合成可操作的模式。

---

## 学习路径

不同的目标需要不同的知识。选择您的路径：

### 路径 1：隐蔽自动化
**目标：构建无法检测的抓取工具**

1.  **[指纹识别概述](./fingerprinting/index.md)** - 了解检测环境
2.  **[网络指纹](./fingerprinting/network-fingerprinting.md)** - TCP/IP, TLS 签名
3.  **[浏览器指纹](./fingerprinting/browser-fingerprinting.md)** - Canvas, WebGL, HTTP/2
4.  **[规避技术](./fingerprinting/evasion-techniques.md)** - 基于 CDP 的对策
5.  **[网络与安全](./network/index.md)** - 代理选择和配置
6.  **[浏览器域](./architecture/browser-domain.md)** - 上下文隔离、进程管理

**时间投入**：12-16 小时的深度技术学习
**回报**：能够绕过复杂的反机器人系统

---

### 路径 2：架构精通
**目标：为 Pydoll 做贡献或构建类似的工具**

1.  **[CDP 深度探讨](./fundamentals/cdp.md)** - 协议基础
2.  **[连接层](./fundamentals/connection-layer.md)** - WebSocket 异步模式
3.  **[事件架构](./architecture/event-architecture.md)** - 事件驱动设计
4.  **[浏览器域](./architecture/browser-domain.md)** - 浏览器管理
5.  **[标签页域](./architecture/tab-domain.md)** - 标签页生命周期
6.  **[WebElement 域](./architecture/webelement-domain.md)** - 元素交互
7.  **[Python 类型系统](./fundamentals/typing-system.md)** - 类型安全集成

**时间投入**：16-20 小时的架构学习
**回报**：深入理解浏览器自动化的内部原理

---

### 路径 3：网络工程
**目标：掌握代理、指纹和网络级隐蔽技术**

1.  **[网络基础](./network/network-fundamentals.md)** - OSI 模型, TCP/UDP, WebRTC
2.  **[网络指纹](./fingerprinting/network-fingerprinting.md)** - TCP/IP 签名, TLS/JA3
3.  **[HTTP/HTTPS 代理](./network/http-proxies.md)** - 应用层代理
4.  **[SOCKS 代理](./network/socks-proxies.md)** - 会话层代理
5.  **[代理检测](./network/proxy-detection.md)** - 匿名与规避
6.  **[构建代理服务器](./network/build-proxy.md)** - 从头开始实现

**时间投入**：14-18 小时的网络协议学习
**回报**：完全理解网络级的匿名与检测

---

## 先决条件

这是高级技术材料。推荐的先决条件包括：

- **Python 基础** - 类、async/await、上下文管理器、装饰器
- **基本网络知识** - IP 地址、端口、HTTP 协议
- **Pydoll 基础** - 参见 [功能特性](../features/core-concepts.md) 和 [快速入门](../index.md)
- **浏览器开发者工具** - Chrome 检查器、网络选项卡、控制台

**如果您对这些不熟悉**，我们建议：

1.  首先完成 [功能特性](../features/index.md) 部分
2.  使用 Pydoll 练习基本的自动化
3.  当您需要更深入的理解时再回到这里

## 精通的理念

Web 自动化涉及多个专业领域：

- **协议工程** - 理解 TCP/IP, TLS, HTTP/2
- **系统编程** - 管理进程, 异步 I/O, WebSocket
- **安全研究** - 指纹, 检测, 规避
- **浏览器内部原理** - 渲染, JavaScript 上下文, CDP
- **操作安全** - 法律合规, 道德准则

大多数开发者是随着时间的推移独立学习这些知识的。本节通过以下方式整合了这些知识：

1.  **集中知识** - 不再需要分散的博客文章和学术论文
2.  **提供背景** - 从第一性原理出发解释每种技术
3.  **提供可用代码** - 所有示例都可用于生产
4.  **引用来源** - 每个声明都有 RFC、文档或研究支持
5.  **渐进的复杂性** - 每个部分都建立在先前的知识之上

## 文档标准

本文档代表了广泛的研究、测试和验证：

- 每个协议细节都根据 RFC 进行了验证
- 每种指纹技术都在生产环境中进行了测试
- 每个代码示例都无需修改即可运行
- 每个声明都引用了权威来源
- 每个图表都根据真实系统行为生成

在整个文档中，技术准确性和实际适用性是优先考虑的。

## 合乎道德的使用

拥有这些知识的同时也伴随着责任：

!!! danger "负责任地使用"
    此处描述的技术既可用于合法的自动化，也可用于恶意目的。负责任的使用包括：
    
    - 尊重网站的服务条款和 robots.txt
    - 实现速率限制和友好的爬行
    - 考虑自动化是否真的必要
    - 在不确定时咨询法律顾问
    - 在适当的时候对您的自动化保持透明
    
    避免将此知识用于：
    - 欺诈、账户滥用或非法活动
    - 以侵略性的抓取压垮服务器
    - 在不了解后果的情况下进行有害活动

有关详细指导，请参阅 **[法律与道德考量](./network/proxy-legal.md)**。

## 贡献

发现错误？有建议？看到过时的东西？

本文档是一个 **动态的项目**。指纹技术在发展，协议在更新，新的规避方法在出现。我们欢迎以下贡献：

- 纠正技术上的不准确之处
- 添加新的指纹技术
- 更新协议信息
- 改进代码示例
- 扩展对检测系统的覆盖

有关指南，请参阅 [贡献](../CONTRIBUTING.md)。

---

## 开始入门

根据您的目标选择一条路径：

**刚接触深度技术内容？**
→ 从 **[Chrome 开发者工具协议](./fundamentals/cdp.md)** 开始，了解 Pydoll 的基础

**需要隐蔽自动化？**
→ 跳转到 **[指纹识别](./fingerprinting/index.md)** 了解检测和规避技术

**想要网络级的控制？**
→ 探索 **[网络与安全](./network/index.md)** 了解代理架构和协议

**正在构建自动化基础设施？**
→ 学习 **[内部架构](./architecture/browser-domain.md)** 了解设计模式

**只是想浏览一下？**
→ 从侧边栏任选一个主题，每篇文章都是自成体系的

---

!!! success "技术深度探讨"
    本节提供了浏览器自动化的全面技术知识，从基础协议到高级规避技术。
    
    请按您自己的节奏探索。

================================================
FILE: docs/zh/deep-dive/network/build-proxy.md
================================================
# 构建代理服务器

本文档使用 Python asyncio 从零实现 HTTP 和 SOCKS5 代理服务器。目标不是生产就绪，而是协议理解：观察每个字节如何被解析、安全边界在哪里，以及为什么真实的代理软件中存在某些设计决策。

!!! info "模块导航"
    - [网络基础](./network-fundamentals.md)：TCP/IP、UDP、WebRTC
    - [HTTP/HTTPS 代理](./http-proxies.md)：应用层代理
    - [SOCKS 代理](./socks-proxies.md)：会话层代理
    - [代理检测](./proxy-detection.md)：检测技术与规避

    有关在 Pydoll 中实际使用代理的方法，请参阅[代理配置](../../features/configuration/proxy.md)。

!!! warning "教育用途代码"
    这些实现以清晰度为优先，而非健壮性。它们缺少连接限制、访问控制列表以及生产代理所需的许多错误恢复路径。请勿将它们暴露于不受信任的网络中。

## HTTP 代理

HTTP 代理以两种模式运行。对于明文 HTTP，它接收完整的请求（带有绝对形式的 URL，例如 `GET http://example.com/path HTTP/1.1`），将请求目标重写为原始形式（`GET /path HTTP/1.1`），连接到目标服务器，转发请求，然后将响应传回。对于 HTTPS，客户端发送 `CONNECT host:port` 请求，代理打开到目标的 TCP 连接，以 `200 Connection Established` 响应，然后在两个方向之间盲目中继字节，不检查加密内容。

下面的实现处理了这两种模式。阅读代码时需要注意几点。`_pipe` 方法在一端关闭时调用 `write_eof()`，这会向另一端发送 TCP FIN。如果不这样做，隧道会无限挂起，因为另一端的 `read()` 永远不会返回空字节。HTTP 转发路径同样循环读取直到 EOF，而不是单次 `read()` 调用，因为 HTTP 响应可以任意大，固定大小的读取会静默截断它们。请求目标重写保留了查询字符串，仅使用 `urlparse().path` 会丢失它们。

```python
import asyncio
import base64
import contextlib
import logging
from urllib.parse import urlparse

logger = logging.getLogger(__name__)


class HTTPProxy:
    """Asynchronous HTTP/HTTPS forward proxy with optional Basic auth.

    Plain HTTP requests are rewritten from absolute-form to origin-form and
    forwarded; ``CONNECT`` requests open a blind TCP tunnel. This is teaching
    code: it performs no destination validation and no connection limiting.
    """

    # Headers never copied to the upstream request. The hop-by-hop fields
    # only concern the client<->proxy connection (RFC 9110 section 7.6.1).
    # 'host' is skipped because the proxy writes its own Host header from the
    # request URL; forwarding the client's copy would send it twice.
    _SKIPPED_HEADERS = frozenset({
        'proxy-authorization', 'proxy-connection',
        'connection', 'keep-alive', 'te', 'trailer', 'upgrade',
        'host',
    })

    def __init__(self, host='0.0.0.0', port=8080, username=None, password=None):
        """Store the listen address and optional credentials.

        Authentication is enforced only when ``username`` is truthy.
        """
        self.host = host
        self.port = port
        self.username = username
        self.password = password

    async def start(self):
        """Bind the listening socket and serve clients until cancelled."""
        server = await asyncio.start_server(
            self._handle_client, self.host, self.port
        )
        logger.info('HTTP proxy listening on %s:%s', self.host, self.port)
        async with server:
            await server.serve_forever()

    async def _handle_client(self, reader, writer):
        """Parse one request and dispatch it to the tunnel or forward path."""
        try:
            request_line = await asyncio.wait_for(
                reader.readline(), timeout=30
            )
            if not request_line:
                return

            parts = request_line.decode('latin-1').split()
            if len(parts) != 3:
                await self._send_status(writer, b'400 Bad Request')
                return

            method, url, _ = parts
            headers = await self._read_headers(reader)

            if not self._check_auth(headers):
                writer.write(
                    b'HTTP/1.1 407 Proxy Authentication Required\r\n'
                    b'Proxy-Authenticate: Basic realm="Proxy"\r\n'
                    b'Content-Length: 0\r\n\r\n'
                )
                await writer.drain()
                return

            if method == 'CONNECT':
                await self._handle_connect(url, reader, writer)
            else:
                await self._handle_http(method, url, headers, reader, writer)
        except Exception as e:
            # Top-level boundary of the connection task: log and drop.
            logger.error('Client handler error: %s', e)
        finally:
            writer.close()
            # The peer may already have reset the connection; an error here
            # must not escape from the handler task.
            with contextlib.suppress(OSError):
                await writer.wait_closed()

    @staticmethod
    async def _send_status(writer, status):
        """Send a body-less response such as ``b'400 Bad Request'``."""
        writer.write(b'HTTP/1.1 ' + status + b'\r\n\r\n')
        await writer.drain()

    async def _read_headers(self, reader):
        """Read header lines up to the blank line.

        Returns:
            dict mapping lower-cased header names to stripped values. When a
            header is repeated, the last occurrence wins.
        """
        headers = {}
        while True:
            line = await reader.readline()
            if line in (b'\r\n', b'\n', b''):
                break
            if b':' in line:
                key, value = line.decode('latin-1').split(':', 1)
                headers[key.strip().lower()] = value.strip()
        return headers

    def _check_auth(self, headers):
        """Return True when the request may use the proxy.

        Always True when no username is configured. Otherwise the
        ``proxy-authorization`` header must carry matching Basic credentials.
        """
        if not self.username:
            return True
        scheme, _, token = headers.get('proxy-authorization', '').partition(' ')
        # Authentication scheme names are case-insensitive (RFC 9110 11.1).
        if scheme.lower() != 'basic':
            return False
        try:
            decoded = base64.b64decode(token.strip()).decode('utf-8')
        except ValueError:
            # binascii.Error and UnicodeDecodeError both derive from ValueError.
            return False
        user, sep, pwd = decoded.partition(':')
        return bool(sep) and user == self.username and pwd == self.password

    @staticmethod
    def _parse_connect_target(target):
        """Split a CONNECT authority into ``(host, port)``.

        Accepts ``host:port`` and bracketed IPv6 literals like ``[::1]:443``.

        Raises:
            ValueError: If the target has no host, no port, or a port that is
                not an integer in 1..65535.
        """
        if target.startswith('['):
            host, sep, port_str = target[1:].partition(']:')
        else:
            host, sep, port_str = target.rpartition(':')
        if not sep or not host:
            raise ValueError(f'invalid CONNECT target: {target!r}')
        port = int(port_str)
        if not 0 < port < 65536:
            raise ValueError(f'invalid CONNECT port: {port}')
        return host, port

    async def _handle_connect(self, target, client_reader, client_writer):
        """Establish a blind TCP tunnel for HTTPS."""
        try:
            host, port = self._parse_connect_target(target)
        except ValueError:
            await self._send_status(client_writer, b'400 Bad Request')
            return

        try:
            server_reader, server_writer = await asyncio.open_connection(
                host, port
            )
        except OSError as e:
            logger.error('CONNECT failed to %s:%s: %s', host, port, e)
            await self._send_status(client_writer, b'502 Bad Gateway')
            return

        try:
            await self._send_status(
                client_writer, b'200 Connection Established'
            )
            await asyncio.gather(
                self._pipe(client_reader, server_writer),
                self._pipe(server_reader, client_writer),
            )
        finally:
            # Release the upstream socket however the tunnel ended.
            server_writer.close()
            with contextlib.suppress(OSError):
                await server_writer.wait_closed()

    @classmethod
    def _build_request_head(cls, method, path, host, port, headers):
        """Build the origin-form request line and headers sent upstream.

        Returns:
            The encoded request head, terminated by the blank line.
        """
        # IPv6 literals must be bracketed inside the Host header.
        host_value = f'[{host}]' if ':' in host else host
        # A non-default port must be spelled out in the Host header.
        if port != 80:
            host_value = f'{host_value}:{port}'

        lines = [f'{method} {path} HTTP/1.1', f'Host: {host_value}']
        lines.extend(
            f'{key}: {value}'
            for key, value in headers.items()
            if key not in cls._SKIPPED_HEADERS
        )
        # Force "Connection: close" so the origin ends the response with
        # EOF; otherwise the relay loop could not tell when it is done.
        lines.append('Connection: close')
        return ('\r\n'.join(lines) + '\r\n\r\n').encode('latin-1')

    async def _handle_http(self, method, url, headers, client_reader, client_writer):
        """Forward a plain HTTP request and stream the response back."""
        try:
            parsed = urlparse(url)
            host, port = parsed.hostname, parsed.port or 80
            content_length = int(headers.get('content-length', 0))
            if not host or content_length < 0:
                raise ValueError('missing host or negative Content-Length')
        except ValueError:
            await self._send_status(client_writer, b'400 Bad Request')
            return

        # Keep the query string in the request target.
        path = parsed.path or '/'
        if parsed.query:
            path += f'?{parsed.query}'

        try:
            server_reader, server_writer = await asyncio.open_connection(
                host, port
            )
        except OSError as e:
            logger.error('HTTP forward failed to %s:%s: %s', host, port, e)
            await self._send_status(client_writer, b'502 Bad Gateway')
            return

        try:
            server_writer.write(
                self._build_request_head(method, path, host, port, headers)
            )

            # Forward the request body when Content-Length announces one.
            if content_length > 0:
                body = await client_reader.readexactly(content_length)
                server_writer.write(body)
            await server_writer.drain()

            # Stream the whole response back instead of one fixed-size read.
            while True:
                chunk = await server_reader.read(65536)
                if not chunk:
                    break
                client_writer.write(chunk)
                await client_writer.drain()
        finally:
            server_writer.close()
            with contextlib.suppress(OSError):
                await server_writer.wait_closed()

    async def _pipe(self, reader, writer):
        """Copy ``reader`` to ``writer`` until EOF, then half-close ``writer``."""
        try:
            while True:
                data = await reader.read(8192)
                if not data:
                    break
                writer.write(data)
                await writer.drain()
        except OSError:
            # ConnectionResetError and BrokenPipeError are OSError subclasses.
            pass
        finally:
            # Propagate the EOF so the opposite relay direction can finish.
            with contextlib.suppress(Exception):
                if writer.can_write_eof():
                    writer.write_eof()
```

有几个值得理解的协议细节。HTTP 头使用 ISO-8859-1（Latin-1）编码，而非 UTF-8。Latin-1 将每个字节值 0-255 映射到一个字符，因此 `decode('latin-1')` 永远不会抛出 `UnicodeDecodeError`，而 `decode('utf-8')` 在某些头部值上会崩溃。`Proxy-Authorization` 头使用 Base64 编码，但 Base64 不是加密：凭据以明文（或者更准确地说，可轻易还原的编码）传输，除非客户端与代理之间的连接本身受到 TLS 保护。hop-by-hop 头（`Connection`、`Keep-Alive`、`TE`、`Trailer`、`Upgrade`、`Proxy-Connection`）是用于两个节点之间直接连接的，不应端到端转发。RFC 9110 第 7.6.1 节要求代理在转发前将其剥离。

!!! warning "SSRF 风险"
    此实现不验证目标地址。客户端可以请求 `CONNECT 127.0.0.1:6379` 来访问本地 Redis 实例，或请求 `CONNECT 169.254.169.254:80` 来访问云实例元数据（AWS、GCP、Azure）。任何暴露给不受信任客户端的代理都必须针对私有和链路本地地址范围（`127.0.0.0/8`、`10.0.0.0/8`、`172.16.0.0/12`、`192.168.0.0/16`、`169.254.0.0/16`、`::1`、`fc00::/7`）建立拒绝列表来验证目标。

## SOCKS5 代理

SOCKS5 代理在比 HTTP 更低的层级运行。它使用 RFC 1928 中定义的二进制协议，包含三个阶段：方法协商、可选的认证和连接请求。代理完全不解析 HTTP。一旦隧道建立，它只是中继原始字节，不理解流经其中的是什么协议。

SOCKS5 的二进制特性意味着每次读取都必须精确接收预期数量的字节。TCP 是流协议，不保证 `read(4)` 返回 4 个字节：根据网络条件，它可能返回 1、2 或 3 个字节。下面的实现使用 asyncio 的 `readexactly()`，它在内部进行缓冲，直到请求数量的字节到达或连接关闭（抛出 `IncompleteReadError`）。

```python
import asyncio
import contextlib
import struct
import logging

logger = logging.getLogger(__name__)


class SOCKS5Proxy:
    """Asynchronous SOCKS5 proxy (RFC 1928) supporting CONNECT only.

    Username/password authentication (RFC 1929) is required when a username
    is configured; otherwise only the "no authentication" method is offered.
    This is teaching code: it performs no destination validation.
    """

    VERSION = 0x05

    def __init__(self, host='0.0.0.0', port=1080, username=None, password=None):
        """Store the listen address and optional credentials."""
        self.host = host
        self.port = port
        self.username = username
        self.password = password

    async def start(self):
        """Bind the listening socket and serve clients until cancelled."""
        server = await asyncio.start_server(
            self._handle_client, self.host, self.port
        )
        logger.info('SOCKS5 proxy listening on %s:%s', self.host, self.port)
        async with server:
            await server.serve_forever()

    async def _handle_client(self, reader, writer):
        """Run the three protocol phases for one client connection."""
        try:
            if not await self._negotiate_method(reader, writer):
                return
            if self.username and not await self._authenticate(reader, writer):
                return
            await self._handle_request(reader, writer)
        except (asyncio.IncompleteReadError, ConnectionResetError):
            # The client disconnected in the middle of the handshake.
            pass
        except Exception as e:
            logger.error('SOCKS5 error: %s', e)
        finally:
            writer.close()
            # The peer may already have reset the connection; an error here
            # must not escape from the handler task.
            with contextlib.suppress(OSError):
                await writer.wait_closed()

    async def _negotiate_method(self, reader, writer):
        """Phase 1: the client offers auth methods, the server picks one.

        Returns:
            True when a method was agreed on. False when the version is wrong
            or the required method was not offered; in the latter case the
            "no acceptable methods" reply (0xFF) is sent first.
        """
        version = (await reader.readexactly(1))[0]
        if version != self.VERSION:
            return False

        nmethods = (await reader.readexactly(1))[0]
        methods = await reader.readexactly(nmethods)

        # 0x02 = username/password, 0x00 = no authentication.
        selected = 0x02 if self.username else 0x00
        if selected not in methods:
            # The server may only choose among the methods the client
            # listed; otherwise it must answer 0xFF.
            writer.write(bytes([self.VERSION, 0xFF]))
            await writer.drain()
            return False

        writer.write(bytes([self.VERSION, selected]))
        await writer.drain()
        return True

    async def _authenticate(self, reader, writer):
        """Phase 2: username/password sub-negotiation (RFC 1929).

        Returns:
            True when the supplied credentials match the configured ones.
        """
        auth_ver = (await reader.readexactly(1))[0]
        if auth_ver != 0x01:
            return False

        ulen = (await reader.readexactly(1))[0]
        raw_user = await reader.readexactly(ulen)
        plen = (await reader.readexactly(1))[0]
        raw_pass = await reader.readexactly(plen)

        try:
            ok = (
                raw_user.decode('utf-8') == self.username
                and raw_pass.decode('utf-8') == self.password
            )
        except UnicodeDecodeError:
            # Undecodable credentials cannot match; answer with a failure
            # status instead of dropping the connection without a reply.
            ok = False

        writer.write(bytes([0x01, 0x00 if ok else 0x01]))
        await writer.drain()
        return ok

    async def _handle_request(self, reader, writer):
        """Phase 3: parse the request, connect upstream and relay bytes."""
        version, command, _, atyp = await reader.readexactly(4)
        if version != self.VERSION:
            await self._reply(writer, 0x01)  # general failure
            return

        # Decode the destination according to the address type.
        if atyp == 0x01:  # IPv4
            raw = await reader.readexactly(4)
            address = '.'.join(str(octet) for octet in raw)
        elif atyp == 0x03:  # Domain name, length-prefixed
            length = (await reader.readexactly(1))[0]
            raw = await reader.readexactly(length)
            try:
                address = raw.decode('ascii')
            except UnicodeDecodeError:
                await self._reply(writer, 0x01)  # general failure
                return
        elif atyp == 0x04:  # IPv6
            raw = await reader.readexactly(16)
            groups = [f'{raw[i]:02x}{raw[i+1]:02x}' for i in range(0, 16, 2)]
            address = ':'.join(groups)
        else:
            await self._reply(writer, 0x08)  # address type not supported
            return

        port = struct.unpack('!H', await reader.readexactly(2))[0]
        logger.info('SOCKS5 CONNECT %s:%s', address, port)

        if command != 0x01:  # Only CONNECT is implemented
            await self._reply(writer, 0x07)  # command not supported
            return

        try:
            server_reader, server_writer = await asyncio.open_connection(
                address, port
            )
        except ConnectionRefusedError:
            await self._reply(writer, 0x05)  # connection refused
            return
        except OSError:
            await self._reply(writer, 0x04)  # host unreachable
            return

        try:
            # BND.ADDR and BND.PORT report the local address of the
            # upstream socket. Fall back to zeros if it is unavailable.
            local = server_writer.get_extra_info('sockname') or ('0.0.0.0', 0)
            await self._reply(writer, 0x00, local[0], local[1])

            await asyncio.gather(
                self._pipe(reader, server_writer),
                self._pipe(server_reader, writer),
            )
        finally:
            # Release the upstream socket however the tunnel ended.
            server_writer.close()
            with contextlib.suppress(OSError):
                await server_writer.wait_closed()

    async def _reply(self, writer, status, bind_addr='0.0.0.0', bind_port=0):
        """Send a SOCKS5 reply with the given status and bound address.

        IPv4 addresses are sent with ATYP 0x01 and IPv6 addresses with ATYP
        0x04. Anything that parses as neither falls back to 0.0.0.0.
        """
        import socket

        try:
            packed_ip, atyp = socket.inet_pton(socket.AF_INET, bind_addr), 0x01
        except OSError:
            try:
                packed_ip = socket.inet_pton(socket.AF_INET6, bind_addr)
                atyp = 0x04
            except OSError:
                packed_ip, atyp = bytes(4), 0x01

        writer.write(
            bytes([self.VERSION, status, 0x00, atyp])
            + packed_ip
            + struct.pack('!H', bind_port)
        )
        await writer.drain()

    async def _pipe(self, reader, writer):
        """Copy ``reader`` to ``writer`` until EOF, then half-close ``writer``."""
        try:
            while True:
                data = await reader.read(8192)
                if not data:
                    break
                writer.write(data)
                await writer.drain()
        except OSError:
            # ConnectionResetError and BrokenPipeError are OSError subclasses.
            pass
        finally:
            # Propagate the EOF so the opposite relay direction can finish.
            with contextlib.suppress(Exception):
                if writer.can_write_eof():
                    writer.write_eof()
```

当地址类型为 `0x03`（域名）时，代理通过 `asyncio.open_connection()` 自行解析 DNS。这是 SOCKS5 代理的核心隐私特性：客户端发送域名而不是在本地解析，从而防止 DNS 查询泄露到客户端的本地网络。这与 Chrome 配置 `--proxy-server=socks5://...` 时的行为相同，如[SOCKS 代理](./socks-proxies.md)中所述。

`_reply` 方法在成功连接后用实际的本地套接字地址填充 `BND.ADDR` 和 `BND.PORT`，这是 RFC 1928 的要求。许多 SOCKS5 实现在这里返回 `0.0.0.0:0`，因为大多数客户端对 CONNECT 命令忽略这些字段，但正确填充它们没有任何代价，还能避免协议违规。

## 同时运行两个代理

```python
async def main():
    """Run the example HTTP and SOCKS5 proxies side by side.

    Both proxies are created with the same demo credentials, then the
    awaitables returned by their ``start()`` methods are awaited together.
    """
    credentials = {'username': 'user', 'password': 'pass'}
    servers = (
        HTTPProxy(port=8080, **credentials),
        SOCKS5Proxy(port=1080, **credentials),
    )
    await asyncio.gather(*(server.start() for server in servers))

# asyncio.run(main())
```

可以使用 curl 进行测试：

```bash
# HTTP proxy
curl -x http://user:pass@localhost:8080 http://httpbin.org/ip

# HTTPS through HTTP proxy (CONNECT tunnel)
curl -x http://user:pass@localhost:8080 https://httpbin.org/ip

# SOCKS5 proxy
curl --socks5 localhost:1080 --proxy-user user:pass https://httpbin.org/ip
```

## 代码未处理的内容

这些实现省略了生产代理需要处理的若干事项。理解缺少什么与理解已有什么同样具有教育意义。

没有连接限制。`asyncio.start_server` 无限制地接受连接，因此单个客户端打开数千个连接会耗尽文件描述符。生产代理使用信号量或连接池来限制并发数。

没有目标验证。两个代理都会连接到客户端请求的任何地址，包括 `127.0.0.1`、`169.254.169.254`（云元数据）和内部网络范围。这是一个服务端请求伪造（SSRF）向量。生产代理维护私有和链路本地地址范围的拒绝列表。

没有流量日志或指标。生产代理跟踪请求数量、传输字节数、错误率和延迟百分位数，通常导出到 Prometheus 或类似系统。

HTTP 代理没有添加 `Via` 头。RFC 9110 第 7.6.3 节要求中间节点在转发消息时附加 `Via` 字段。为了简洁起见这里省略了，但符合标准的代理必须包含它。

两个代理都没有实现优雅关闭。当服务器停止时，活跃的隧道会被突然终止，而不是被排空。生产代理跟踪活跃连接并等待它们完成（有截止时间），然后才关闭。

## 代理链

代理链是指将流量依次通过多个代理路由：客户端到代理 A，代理 A 到代理 B，代理 B 到目标服务器。链中的每个代理只知道其直接邻居，而非完整路径。

主要用例是分散信任。如果你不完全信任任何单一代理提供商，将两个提供商链接在一起意味着没有一个能同时看到你的真实 IP 和你的目标地址。代价是延迟：每一跳都会增加自己的连接建立时间和转发延迟。单个代理通常增加 50 到 100ms 的开销。两个代理大约翻倍，三个代理可以使总开销超过 300ms。

超过两跳后，边际隐私收益递减，而延迟和故障概率增加。大多数实际部署使用一到两个代理。Tor 使用三个中继节点（守卫节点、中间节点、出口节点），因为其威胁模型假设某些中继节点已被入侵，但 Tor 将延迟惩罚视为明确的设计权衡。

```
Client --> Proxy A (SOCKS5) --> Proxy B (SOCKS5) --> Target
           sees: client IP          sees: Proxy A IP
           sees: Proxy B addr       sees: target addr
```

通过另一个 SOCKS5 代理链接 SOCKS5 代理的工作方式是让代理 A 将代理 B 视为目标。客户端连接到代理 A 并发送指向代理 B 地址的 CONNECT 请求。一旦该隧道建立，客户端通过隧道发送第二次 SOCKS5 握手，这次请求真正的目标。代理 A 看到流向代理 B 的流量，但如果内部连接已加密，则无法读取其内容。

## 参考资料

- RFC 1928: SOCKS Protocol Version 5 - https://datatracker.ietf.org/doc/html/rfc1928
- RFC 1929: Username/Password Authentication for SOCKS V5 - https://datatracker.ietf.org/doc/html/rfc1929
- RFC 9110: HTTP Semantics - https://www.rfc-editor.org/rfc/rfc9110.html
- RFC 9112: HTTP/1.1 - https://www.rfc-editor.org/rfc/rfc9112.html
- OWASP SSRF Prevention Cheat Sheet - https://cheatsheetseries.owasp.org/cheatsheets/Server_Side_Request_Forgery_Prevention_Cheat_Sheet.html
- mitmproxy (Python HTTPS intercepting proxy) - https://mitmproxy.org/


================================================
FILE: docs/zh/deep-dive/network/http-proxies.md
================================================
# HTTP/HTTPS Proxy 架构

HTTP proxy 是互联网上最常见的代理协议。几乎每个企业网络都在使用它们，大多数商业代理服务也将其作为默认选项。它们在 OSI 模型的第 7 层（应用层）运行，这意味着它们能够理解 HTTP，并可以解析、修改、缓存和过滤流量。然而，这种与协议的深度集成也是它们最大的局限：它们只能处理 HTTP 流量，会通过可识别的标头暴露代理的使用，并且无法代理 UDP，导致 WebRTC 和 DNS 容易泄露。

本文档涵盖 HTTP proxy 在协议层面的工作原理、用于 HTTPS 隧道的 CONNECT 方法、身份验证机制，以及 HTTP/2 和 HTTP/3 等现代协议的影响。

!!! info "模块导航"
    - [网络基础](./network-fundamentals.md)：TCP/IP、UDP、OSI 模型
    - [网络与安全概述](./index.md)：模块介绍
    - [SOCKS Proxy](./socks-proxies.md)：协议无关的替代方案
    - [Proxy 检测](./proxy-detection.md)：如何避免被检测

    有关实际配置，请参阅 [Proxy 配置](../../features/configuration/proxy.md)。

## HTTP Proxy 的工作原理

HTTP proxy 位于客户端和目标服务器之间，维护两个独立的 TCP 连接：一个从客户端到 proxy，另一个从 proxy 到目标服务器。由于 proxy 理解 HTTP，它可以对经过的流量做出智能决策。

### 请求流程

当客户端配置为使用 HTTP proxy 时，它会将完整的 HTTP 请求发送到 proxy，而不是直接发送到目标服务器。与直接请求的关键区别在于，请求行包含绝对 URI，而不仅仅是路径。例如，客户端发送的不是 `GET /page HTTP/1.1`，而是 `GET http://example.com/page HTTP/1.1`。这告诉 proxy 应将请求转发到哪里。

```mermaid
sequenceDiagram
    participant Client as Client Browser
    participant Proxy as HTTP Proxy
    participant Server as Target Server

    Client->>Proxy: GET http://example.com/page HTTP/1.1<br/>Host: example.com<br/>User-Agent: Mozilla/5.0
    Note over Client,Proxy: TCP connection #1

    Note over Proxy: Parse request, check auth,<br/>check cache, apply rules

    Proxy->>Server: GET /page HTTP/1.1<br/>Host: example.com<br/>Via: 1.1 proxy.example.com<br/>X-Forwarded-For: 192.168.1.100
    Note over Proxy,Server: TCP connection #2

    Server->>Proxy: HTTP/1.1 200 OK<br/>[response body]

    Note over Proxy: Cache response if allowed,<br/>filter content, log transaction

    Proxy->>Client: HTTP/1.1 200 OK<br/>Via: 1.1 proxy.example.com<br/>[possibly modified body]
```

Proxy 接收到完整的 HTTP 请求后，会解析方法、URL 和标头，然后决定如何处理。它可能会检查身份验证凭据、根据访问控制列表验证 URL、查找资源的缓存副本，并在转发前修改标头。然后它会打开一个到目标服务器的独立 TCP 连接并发送请求，可能带有修改过的标头。

当响应到达时，proxy 可以根据 HTTP 语义（`Cache-Control`、`ETag`）缓存响应，过滤恶意软件或被拦截的关键词，在客户端支持时进行压缩，并在将响应转发回客户端之前记录事务。

### Proxy 标头与隐私

HTTP proxy 通常会添加标头来暴露它们的存在以及客户端的真实 IP 地址。`Via` 标头（RFC 9110）标识请求链中的 proxy。`X-Forwarded-For` 标头包含原始客户端 IP，如果涉及多个 proxy 则会形成链。`X-Forwarded-Proto` 标头指示原始请求是 HTTP 还是 HTTPS。一些 proxy 还会添加 `X-Real-IP` 作为 `X-Forwarded-For` 的简化替代。

还有一个标准化的 `Forwarded` 标头（RFC 7239），将所有这些信息整合到一个字段中，例如 `Forwarded: for=192.168.1.100;proto=http;by=proxy.example.com`。实际上，大多数 proxy 仍然使用 `X-Forwarded-*` 变体，因为它们有更广泛的支持。

旧版客户端和一些老旧浏览器在通过 proxy 路由时，可能还会发送 `Proxy-Connection: keep-alive` 标头而非 `Connection: keep-alive`。这个标头是一个众所周知的 proxy 使用指标，也是经典的检测信号。

!!! danger "标头检测"
    检测系统会查找 `Via`、`X-Forwarded-For` 或 `Forwarded` 标头的存在来确认 proxy 的使用。如果 `X-Real-IP` 与连接 IP 不匹配，则可以确认使用了 proxy。高级 proxy 可以剥离这些标头，但许多商业 proxy 服务默认会保留它们。请务必使用 [browserleaks.com/ip](https://browserleaks.com/ip) 等工具验证你的 proxy 行为。

### 能力与限制

由于 HTTP proxy 能够解析和理解 HTTP 协议，它们可以读取和修改未加密 HTTP 请求和响应的每个部分：URL、标头、Cookie 和正文。这使它们能够智能缓存响应、按 URL 或关键词过滤内容、注入或剥离标头、验证用户身份，以及详细记录所有流量。

代价是与 HTTP 的深度耦合意味着 proxy 仅限于 HTTP 流量。它无法原生代理 FTP、SSH、SMTP 或自定义协议（尽管下面描述的 CONNECT 方法为任何基于 TCP 的协议提供了隧道解决方案）。它不支持 UDP，这意味着 WebRTC、DNS 查询和 QUIC/HTTP/3 流量会完全绕过它。而检查 HTTPS 内容需要 TLS 终止，这会破坏端到端加密。

## CONNECT 方法：HTTPS 隧道

CONNECT 方法（RFC 9110，第 9.3.6 节）解决了一个根本问题：HTTP proxy 如何转发它无法读取的加密流量？答案是成为一个盲目的 TCP 隧道。

当客户端想要通过 proxy 访问 HTTPS 站点时，它会发送一个 `CONNECT` 请求，要求 proxy 建立到目标的原始 TCP 连接。一旦 proxy 确认隧道已建立，它就不再是 HTTP proxy，而是变成第 4 层的透明 TCP 中继，在两个方向上转发字节而不解释它们。

```mermaid
sequenceDiagram
    participant Client
    participant Proxy
    participant Server

    Client->>Proxy: CONNECT example.com:443 HTTP/1.1<br/>Host: example.com:443<br/>Proxy-Authorization: Basic dXNlcjpwYXNz
    Note over Client,Proxy: Unencrypted HTTP request

    Proxy->>Server: TCP three-way handshake
    Note over Proxy,Server: TCP connection established

    Proxy->>Client: HTTP/1.1 200 Connection Established

    Note right of Proxy: Proxy is now a transparent<br/>TCP relay (Layer 4)

    Client->>Server: TLS ClientHello
    Note over Client,Server: TLS handshake (proxy sees<br/>this in plaintext)
    Server->>Client: TLS ServerHello, Certificate

    Client->>Server: Encrypted HTTP/2 request
    Server->>Client: Encrypted HTTP/2 response

    Note over Proxy: Proxy blindly forwards<br/>all encrypted data
```

### CONNECT 请求

CONNECT 请求非常简洁。方法是 `CONNECT`，请求 URI 是目标的 `host:port`（而不是路径），如果 proxy 需要则包含身份验证。没有请求体。Proxy 验证凭据，检查访问控制规则，然后打开到指定主机和端口的 TCP 连接。如果一切成功，它会返回 `HTTP/1.1 200 Connection Established`，后跟一个空行。在该空行之后，HTTP 对话结束，proxy 变成透明中继。

### CONNECT 之后的可见性

一旦隧道建立，proxy 的可见性就很有限了。它知道来自 CONNECT 请求的目标主机名和端口。它可以观察连接时间（何时建立以及持续多久）、每个方向传输的数据量，以及任一方终止连接的时刻。它还可以观察随后的 TLS 握手，这一点特别值得关注。

TLS ClientHello 消息在隧道建立后立即发送，且以明文传输。Proxy（以及任何网络观察者）可以直接读取 TLS 版本、完整的支持密码套件列表、扩展及其参数、提供的椭圆曲线，以及包含目标主机名的 SNI（Server Name Indication）扩展。这正是用于 TLS 指纹识别（JA3/JA4）的信息。详情请参阅[网络指纹](../fingerprinting/network-fingerprinting.md)。

Proxy 无法看到的是加密的应用数据：HTTP 方法、URL、请求和响应标头、Cookie、会话令牌和响应内容都在 TLS 隧道内加密。

!!! note "SNI 与 Encrypted Client Hello (ECH)"
    ClientHello 中的 SNI 扩展以明文暴露目标主机名，这在 proxy 场景中与 CONNECT 请求是冗余的，但对其他网络观察者来说很有意义。Encrypted Client Hello (ECH) 目前正在部署中，旨在加密 SNI 来解决这一泄露问题。不过，ECH 的采用仍然有限，需要客户端和服务器双方的支持。

### CONNECT 用于非 HTTPS 协议

虽然 CONNECT 主要用于 HTTPS，但它可以隧道传输任何基于 TCP 的协议。到端口 993 的 IMAPS 连接、到端口 22 的 SSH 连接，或到端口 990 的 FTP-over-TLS 都可以通过 CONNECT 隧道工作。Proxy 不需要理解这些协议，因为隧道建立后它只是简单地中继字节。

实际上，许多企业 proxy 会将 CONNECT 限制在端口 443（HTTPS），以防止滥用。尝试 `CONNECT example.com:22` 进行 SSH 连接通常会返回 `403 Forbidden`。

### HTTPS 困境

HTTP proxy 在处理加密流量时面临一个根本性的选择。使用 CONNECT 隧道方式，端到端加密得以保留，客户端直接验证服务器证书，证书固定正常工作。但 proxy 无法检查、缓存或过滤加密内容。

另一种方式是 TLS 终止（MITM），proxy 解密 HTTPS 流量、检查内容，然后重新加密后转发。这需要在客户端上安装 proxy 的 CA 证书，会破坏端到端加密，并且可以通过证书固定和证书透明度日志检测到。大多数企业 proxy 使用这种方式进行内容过滤和安全扫描，而注重隐私的 proxy 则使用盲目 CONNECT 隧道。

对于网页抓取和自动化来说，这一区别对 TLS 指纹识别很重要。如果 proxy 执行 TLS 终止，目标服务器看到的 TLS 指纹属于 proxy，而非你的浏览器。如果你使用的是 CONNECT 隧道，指纹则是端到端保留的。根据你的规避策略，其中一种方式可能比另一种更合适。

| 方面 | HTTP（无 CONNECT） | HTTPS（CONNECT 隧道） |
|--------|-------------------|------------------------|
| Proxy 可见性 | 完整的 HTTP 请求/响应 | 仅目标 host:port + TLS ClientHello |
| 加密 | 无（除非 TLS 终止） | 端到端 TLS |
| 缓存 | 是，基于 HTTP 语义 | 否（加密内容） |
| 内容过滤 | 是 | 否（仅基于主机名拦截） |
| 标头修改 | 是 | 否（加密标头） |
| URL 可见性 | 完整 URL | 仅主机名（通过 CONNECT 和 SNI） |
| 协议支持 | 仅 HTTP | 任何基于 TCP 的协议 |

## HTTPS Proxy（到 Proxy 的 TLS）

有一个值得澄清的区别：代理 HTTPS 流量与通过 HTTPS 连接到 proxy 本身是不同的。当你配置 `--proxy-server=https://proxy:port` 而非 `http://proxy:port` 时，你的浏览器与 proxy 之间的连接是通过 TLS 加密的。这可以保护你的 proxy 身份验证凭据不被本地网络嗅探，并且对本地观察者隐藏 CONNECT 主机名，因为它被封装在到 proxy 的 TLS 连接内。

Chrome 通过 `--proxy-server` 中的 `https://` 方案支持此功能。当在不受信任的网络（公共 Wi-Fi、共享主机）上使用 proxy 时，这一点尤其重要，因为你与 proxy 之间的连接是最薄弱的环节。

## 身份验证

HTTP proxy 身份验证使用标准 HTTP 状态码和标头，遵循 RFC 9110。当 proxy 需要身份验证时，它会返回 `407 Proxy Authentication Required` 以及一个 `Proxy-Authenticate` 标头，指示它支持哪些身份验证方案。然后客户端使用包含凭据的 `Proxy-Authorization` 标头重新传输请求。

### 身份验证方案

有多种身份验证方案，每种都有不同的安全特性。

**Basic**（RFC 7617）是最简单的。客户端发送 `Proxy-Authorization: Basic <base64(username:password)>`。Base64 是一种编码而非加密，因此凭据可以被轻易还原。任何拦截到该标头的人都可以立即解码并无限期地重用，因为没有重放保护。Basic 身份验证应仅通过 TLS 加密的连接使用。

**Digest**（RFC 7616）使用挑战-响应机制。Proxy 发送一个随机 nonce，客户端计算用户名、密码、nonce 和请求 URI 的哈希值。密码永不传输，nonce 提供重放保护。原始版本使用 MD5，其速度足以被高效暴力破解，不过 RFC 7616 增加了 SHA-256 支持。Digest 身份验证很少被现代 proxy 服务实现。

**NTLM** 是微软专有的挑战-响应协议，常见于 Windows 企业环境。它使用三步协商（Type 1 协商、Type 2 挑战、Type 3 认证），并与 Active Directory 集成实现单点登录。NTLMv1 使用 DES（已被攻破），NTLMv2 使用 HMAC-MD5（按现代标准被认为较弱）。微软建议在新部署中使用 Kerberos 替代 NTLM。NTLM 是绑定连接的，这意味着它在 HTTP/2 多路复用下会出问题。

**Negotiate**（RFC 4559）使用 SPNEGO 在 Kerberos 和 NTLM 之间选择，优先使用 Kerberos。Kerberos 提供最强的安全性（AES 加密、相互身份验证、有时间限制的票据），但需要 Active Directory 基础设施、加入域的机器和精确的时钟同步。在浏览器自动化中，Kerberos 难以通过编程方式配置。

| 方案 | 安全性 | 机制 | 实用说明 |
|--------|----------|-----------|-----------------|
| Basic | 低 | Base64 编码的凭据 | 通用支持。仅通过 TLS 使用。 |
| Digest | 中 | 使用 MD5/SHA-256 的挑战-响应 | 通过 nonce 提供重放保护。很少被实现。 |
| NTLM | 中 | 挑战-响应（NT 哈希） | Windows SSO。专有，存在已知漏洞。 |
| Negotiate | 高 | Kerberos/SPNEGO | 最强。需要 Active Directory。 |

### Pydoll 中的身份验证

Chrome 不支持在 `--proxy-server` 标志中内联 proxy 凭据。写 `--proxy-server=http://user:pass@proxy:port` 不会生效：Chrome 会静默忽略 `user:pass` 部分并在不进行身份验证的情况下连接。

Pydoll 通过其 `ProxyManager` 透明地解决了这个问题。当你提供带有内嵌凭据的 proxy URL 时，Pydoll 会提取用户名和密码，在传递给 Chrome 之前从 URL 中剥离它们，然后使用 CDP Fetch 域拦截 `407 Proxy Authentication Required` 响应，并通过 `Fetch.continueWithAuth` 自动提供凭据。这种方式适用于 Chrome 支持的所有身份验证方案（Basic、Digest、NTLM、Negotiate），而无需 Pydoll 实现特定于协议的逻辑。

```python
from pydoll.browser import Chrome
from pydoll.browser.options import ChromiumOptions

options = ChromiumOptions()
# Pydoll extracts credentials, cleans the URL, and handles 407 via CDP
options.add_argument('--proxy-server=http://user:pass@proxy.example.com:8080')

async with Chrome(options=options) as browser:
    tab = await browser.start()
    await tab.go_to('https://example.com')
```

!!! tip "身份验证最佳实践"
    始终使用 TLS 加密的 proxy 连接（HTTPS proxy 或 SSH 隧道）来保护传输中的凭据。对于 API proxy，优先使用 Bearer 令牌，因为它们可撤销且有时间限制。切勿通过未加密的 HTTP 连接使用 Basic 身份验证。不要在源代码中硬编码凭据，请使用环境变量。

## 现代协议与代理

### HTTP/2

HTTP/2 引入了多路复用、二进制分帧和 HPACK 标头压缩，从根本上改变了 proxy 处理连接的方式。在 HTTP/1.1 中，每个请求按顺序占用一个连接（虽然存在流水线但实际上已被禁用，因此浏览器通过为每个主机打开六个并行连接来解决这个问题）。在 HTTP/2 中，单个 TCP 连接承载多个并发流，每个流都有自己的请求和响应。

对于 proxy 来说，这意味着需要在连接的两端管理流 ID、优先级和流控窗口。Proxy 必须在客户端侧和服务器侧之间转换流 ID、维护优先级树，并对每个流进行流量控制。这比 HTTP/1.1 简单的请求-响应转发要复杂得多。

从指纹识别的角度来看，HTTP/2 流元数据（窗口大小、优先级设置、HPACK 内的标头排序）可以对单个客户端进行指纹识别，即使多个用户共享同一个 proxy。

| 特性 | HTTP/1.1 | HTTP/2 |
|---------|----------|--------|
| 连接 | 每个连接按顺序处理（浏览器并行打开 6 个） | 单个连接上的多个并发流 |
| 多路复用 | 否（队头阻塞） | 是（仅流级别） |
| 标头压缩 | 无 | HPACK |
| Proxy 复杂度 | 简单的请求/响应转发 | 流 ID 映射、优先级管理 |

在 HTTP/2 中，CONNECT 方法通过 RFC 8441 进行了扩展，支持 `:protocol` 伪标头，使 WebSocket 隧道和其他协议升级可以直接在 HTTP/2 流中进行，而无需单独的连接。

### HTTP/3 与 QUIC

HTTP/3 运行在 QUIC（RFC 9000）之上，这是一种基于 UDP 的传输协议。这给 HTTP proxy 带来了根本性的挑战。传统 HTTP proxy 运行在 TCP 之上，无法处理 QUIC 的 UDP 流量。QUIC 连接可以在 IP 变化后继续存活（连接迁移），使 proxy 会话管理变得复杂。而且 QUIC 几乎加密了所有内容，包括之前可见的传输层元数据。

代理 QUIC 需要 CONNECT-UDP（RFC 9298），这是一种通过 HTTP proxy 建立 UDP 隧道的新方法。大多数传统 proxy，包括许多商业服务，尚不支持此功能。当 proxy 不支持 QUIC 时，浏览器会回退到基于 TCP 的 HTTP/2，这意味着如果你依赖 HTTP/3 的加密传输，实际泄露的元数据可能比预期更多。

在自动化场景中，考虑使用 `--disable-quic` Chrome 标志禁用 QUIC，以强制使用基于 TCP 的 HTTP/2。这可以确保所有流量都通过你的 proxy，并消除 QUIC 导致的 UDP 泄露风险。

| 方面 | TCP + TLS（HTTP/1.1、HTTP/2） | QUIC/UDP（HTTP/3） |
|--------|------------------------------|-------------------|
| 传输 | TCP（面向连接） | UDP（无连接） |
| 握手 | 分离的 TCP + TLS（2 RTT） | 合并（0-1 RTT） |
| 队头阻塞 | 是（TCP 级别） | 否（仅流级别） |
| 连接迁移 | 不支持 | 支持（可在 IP 变化后存活） |
| Proxy 兼容性 | 极好 | 有限（需要 UDP 中继支持） |

!!! warning "协议降级"
    当 proxy 不支持 HTTP/3 时，浏览器会静默回退到 HTTP/2 或 HTTP/1.1。这种降级可能暴露 HTTP/3 本会加密的元数据（标头、时序模式）。请监控你的流量以了解实际的协议版本，并注意 HTTP/3 的采用率因地区和 CDN 而异。

## 总结

HTTP proxy 提供了丰富的功能，但代价是范围有限和隐私问题。它们可以检查、缓存和过滤 HTTP 流量，但无法处理非 HTTP 协议、UDP 流量或 HTTPS 内容（除非破坏加密）。除非明确剥离，否则它们的存在会通过可识别的标头暴露。

对于自动化来说，CONNECT 隧道是最相关的功能：它在保留端到端 TLS 加密的同时，仅让 proxy 获得主机名级别的可见性。Pydoll 通过 CDP Fetch 域透明地处理 proxy 身份验证，支持 Chrome 实现的所有方案。

### HTTP Proxy 与 SOCKS5 对比

| 需求 | HTTP Proxy | SOCKS5 |
|------|------------|--------|
| 内容过滤 | 是 | 否 |
| 基于 URL 拦截 | 是 | 否（仅 IP:port） |
| 缓存 | 是 | 否 |
| UDP 支持 | 否 | 是 |
| 协议灵活性 | 仅 HTTP（CONNECT 可用于 TCP 隧道） | 任何 TCP/UDP |
| 隐私 | 低（解析 HTTP，添加暴露性标头） | 中（不解析或修改流量，但未加密内容对运营商仍然可见） |
| DNS 解析 | Proxy 解析（远程） | 取决于配置（SOCKS5：通常客户端解析，SOCKS5h：proxy 解析。Chrome 对 SOCKS5 始终使用远程解析。） |

对于需要内容控制和缓存的企业环境，HTTP proxy 是正确的选择。对于注重隐私的自动化，SOCKS5 提供更好的隐蔽性和协议灵活性。要获得最高安全性，请使用 SOCKS5 over SSH 隧道或 VPN。

**后续步骤：**

- [SOCKS Proxy](./socks-proxies.md)：协议无关的会话层代理
- [网络基础](./network-fundamentals.md)：TCP/IP、UDP、WebRTC
- [Proxy 检测](./proxy-detection.md)：如何检测 proxy 以及如何避免
- [Proxy 配置](../../features/configuration/proxy.md)：Pydoll 实际 proxy 设置
- [网络指纹](../fingerprinting/network-fingerprinting.md)：TCP/IP 和 TLS 指纹识别

## 参考文献

- RFC 9110: HTTP Semantics (2022, replaces RFC 7230-7237) - https://www.rfc-editor.org/rfc/rfc9110.html
- RFC 9112: HTTP/1.1 (2022) - https://www.rfc-editor.org/rfc/rfc9112.html
- RFC 9113: HTTP/2 (2022, replaces RFC 7540) - https://www.rfc-editor.org/rfc/rfc9113.html
- RFC 9114: HTTP/3 (2022) - https://www.rfc-editor.org/rfc/rfc9114.html
- RFC 9000: QUIC Transport Protocol (2021) - https://www.rfc-editor.org/rfc/rfc9000.html
- RFC 9298: Proxying UDP in HTTP (CONNECT-UDP, 2022) - https://www.rfc-editor.org/rfc/rfc9298.html
- RFC 8441: Bootstrapping WebSockets with HTTP/2 (2018) - https://www.rfc-editor.org/rfc/rfc8441.html
- RFC 7617: Basic Authentication (2015) - https://www.rfc-editor.org/rfc/rfc7617.html
- RFC 7616: Digest Authentication (2015) - https://www.rfc-editor.org/rfc/rfc7616.html
- RFC 7239: Forwarded HTTP Extension (2014) - https://www.rfc-editor.org/rfc/rfc7239.html
- RFC 4559: Negotiate Authentication (2006) - https://www.rfc-editor.org/rfc/rfc4559.html
- MDN Web Docs: Proxy servers and tunneling - https://developer.mozilla.org/en-US/docs/Web/HTTP/Proxy_servers_and_tunneling
- Chrome DevTools Protocol: Fetch domain - https://chromedevtools.github.io/devtools-protocol/tot/Fetch/


================================================
FILE: docs/zh/deep-dive/network/index.md
================================================
# 网络与安全深度探讨

**欢迎来到现代互联网通信的基础——这里是匿名、检测与规避的战场。**

网络协议是驱动每一次 Web 请求、浏览器连接和自动化脚本的无形基础设施。深入理解它们，您将从一个 **工具使用者** 转变为一个 **协议工程师**，能够应对最复杂的反机器人系统。

## 为什么网络架构很重要

当您运行 `tab.go_to('https://example.com')` 时，一场复杂的协议交响乐便拉开了序幕：

1.  **DNS 解析** 将域名转换为 IP 地址（可能会泄露您的意图）
2.  **TCP 握手** 建立连接（通过数据包特征暴露您的操作系统）
3.  **TLS 协商** 保护通道安全（通过密码套件对您的浏览器进行指纹识别）
4.  **HTTP/2 请求** 获取页面（通过 SETTINGS 帧暴露浏览器版本）
5.  **WebRTC 发现** 可能会探测您的真实 IP（完全绕过您的 VPN）

**每一步都是检测或规避的机会。**

!!! danger "网络层无法说谎"
    与浏览器级特征（JavaScript 可以修改）不同，网络级指纹被 **烙印在操作系统内核和 TCP/IP 协议栈中**。像 Chrome 浏览器声称自己是 Windows，却发送 Linux 的 TCP 选项，这种不匹配对于隐形自动化来说是立竿见影的致命伤。

## 互联网隐私的架构

本模块探讨了在现代互联网上使隐私成为可能（或被破坏）的 **技术基础**：

### OSI 模型的现实

```mermaid
graph TB
    subgraph "应用层 (第 7 层)"
        HTTP[HTTP/HTTPS 标头]
        DNS[DNS 查询]
    end
    
    subgraph "表示层 (第 6 层)"
        TLS[TLS/SSL 指纹]
        Ciphers[密码套件, 扩展]
    end
    
    subgraph "会话/传输层 (第 5-4 层)"
        SOCKS[SOCKS 代理协议]
        TCP[TCP 窗口, 选项, ISN]
    end
    
    subgraph "网络层 (第 3 层)"
        IP[IP TTL, 分片]
        Routing[数据包路由, 跳数]
    end
    
    HTTP --> TLS
    DNS --> TLS
    TLS --> SOCKS
    Ciphers --> TCP
    SOCKS --> IP
    TCP --> Routing
```

**每一层既是盾牌，也是弱点：**

- **第 7 层 (应用层)**：代理可以读取和修改您的 HTTP 流量
- **第 6 层 (表示层)**：TLS 加密保护内容，但泄露元数据
- **第 4 层 (传输层)**：TCP 特征暴露您的操作系统
- **第 3 层 (网络层)**：IP 地址揭示您的物理位置

## 您将掌握什么

本模块按照从基础到高级利用的 **技术进阶** 构建：

### 1. 网络基础
**[网络基础](./network-fundamentals.md)**

构建基础：了解驱动互联网的协议，以及它们如何揭示或隐藏您的身份。

- **OSI 模型分层** 及其指纹识别含义
- **TCP vs UDP**：为什么您的代理可能会泄露 UDP 流量
- **WebRTC IP 泄露**：现代浏览器中的隐藏威胁
- **网络堆栈特征**：TTL、窗口大小、选项顺序

**为什么从这里开始**：没有这个基础，代理配置就是 **“货物崇拜编程”**，只是复制命令而不理解它们为什么有效（或无效）。

### 2. HTTP/HTTPS 代理
**[HTTP/HTTPS 代理](./http-proxies.md)**

掌握最常见的代理协议，并理解其根本局限性。

- **HTTP 代理操作**：请求转发、缓存、标头注入
- **CONNECT 隧道**：HTTPS 如何“隧道”通过 HTTP 代理
- **HTTP/2 的复杂性**：多路复用、流优先级、SETTINGS 指纹
- **HTTP/3 和 QUIC**：基于 UDP 的代理挑战
- **身份验证方案**：Basic, Digest, NTLM, Bearer 令牌

**关键见解**：HTTP 代理在第 7 层运行，它们可以 **读取、修改和记录** 您未加密的流量。要获得真正的隐私，您需要在代理看到您的数据 **之前** 进行加密。

### 3. SOCKS 代理
**[SOCKS 代理](./socks-proxies.md)**

理解为什么 SOCKS5 是注重隐私的自动化的 **黄金标准**。

- **SOCKS4 vs SOCKS5**：协议演进和功能
- **SOCKS5 握手**：二进制协议深度解析与数据包结构
- **UDP 支持**：通过 SOCKS5 运行游戏、VoIP 和 WebRTC
- **DNS 解析**：为什么代理端 DNS 能防止泄露
- **为什么 SOCKS5 > HTTP 代理**：协议级比较

**关键优势**：SOCKS 在第 5 层（会话层）运行，**低于** 应用层。它不解析也不修改您的 HTTP 流量，只需要知道目标地址和端口；配合 HTTPS 使用时，代理看不到请求内容，从而极大地减少了信任面（但未加密的流量对代理运营商仍然可见）。

### 4. 代理检测
**[代理检测与匿名](./proxy-detection.md)**

了解网站如何 **检测代理使用** 以及如何规避检测。

- **匿名级别**：透明代理、匿名代理、精英代理
- **IP 信誉数据库**：您数据中心的 IP 如何暴露您
- **标头分析**：X-Forwarded-For, Via, Forwarded 标头
- **一致性检查**：DNS 反向查找、地理位置不匹配
- **网络指纹集成**：将代理检测与 TCP/TLS 分析相结合

**残酷的现实**：大多数“匿名”代理都很容易被检测到。真正的隐蔽需要 **精英住宅代理** + **一致的浏览器指纹** + **类人行为**。

### 5. 构建代理服务器
**[构建您自己的代理](./build-proxy.md)**

在 Python 中从头开始实现 HTTP 和 SOCKS5 代理，这是终极的学习体验。

- **HTTP 代理服务器**：带身份验证的完整异步实现
- **SOCKS5 代理服务器**：二进制协议处理、TCP 隧道
- **代理链**：分层匿名（以及延迟权衡）
- **轮换代理池**：健康检查、故障转移、负载均衡
- **高级主题**：透明代理、MITM SSL 拦截

**为什么要构建自己的**：了解实现细节可以揭示从外部看不到的 **攻击向量** 和 **优化机会**。

### 6. 法律与道德考量
**[法律与道德准则](./proxy-legal.md)**

驾驭代理使用和网络自动化的法律雷区。

- **法规遵从**：GDPR, CFAA, 国际法律
- **服务条款**：什么构成违规
- **道德准则**：robots.txt, 速率限制, 透明度
- **案例研究**：法律先例 (hiQ vs LinkedIn, QVC vs Resultly)
- **何时避免使用代理**：高风险场景

**免责声明**：这是 **教育信息**，不是法律建议。法律因司法管辖区和用例而异。请咨询合格的法律顾问。

## 代理悖论

关于代理，有一个令人不安的事实：

!!! warning "代理不会让你匿名。它们让你 **与众不同**"
    代理会更改您的 IP 地址，但它也会：
    
    - 增加 **延迟**（可通过计时分析检测）
    - 重置 **TTL** 值（暴露代理跳数）
    - 引入 **TCP 指纹** 不匹配（代理操作系统 ≠ 您的操作系统）
    - 可能注入 **标头** (X-Forwarded-For, Via)
    - 造成 **地理位置** 不一致（浏览器时区 ≠ IP 位置）
    
    代理是一种 **工具**，而不是一个解决方案。真正的隐蔽需要 **全面的一致性**。

## 先决条件

这是 **高级材料**。您应该熟悉：

- 基本网络概念（IP 地址、端口、协议）
- TCP/IP 基础（三次握手、数据包、路由）
- 异步 Python 编程 (asyncio, async/await)
- Pydoll 基础知识 (参见 [核心概念](../../features/core-concepts.md))

**如果您对网络不熟悉**，我们强烈建议您：

1.  首先阅读 TCP/IP 基础指南
2.  尝试使用 Wireshark 来可视化网络流量
3.  在运行数据包捕获的同时尝试代码示例
4.  构建代理服务器并在本地测试它们

## 与其他模块的集成

网络架构并非孤立存在。它与以下内容深度集成：

- **[指纹识别](../fingerprinting/network-fingerprinting.md)**：TCP/IP 和 TLS 特征如何识别您
- **[浏览器配置](../../features/configuration/browser-preferences.md)**：使浏览器行为与代理特征保持一致
- **[连接层](../fundamentals/connection-layer.md)**：Pydoll 如何通过代理管理 WebSocket 连接

## 学习路径

我们推荐以下进阶路径：

**阶段 1：基础**
1.  阅读 [网络基础](./network-fundamentals.md)
2.  理解 OSI 模型和协议分层
3.  了解 WebRTC 泄露和 UDP 隧道

**阶段 2：协议深度探讨**
4.  学习 [HTTP/HTTPS 代理](./http-proxies.md)
5.  掌握 [SOCKS 代理](./socks-proxies.md)
6.  比较协议并理解权衡

**阶段 3：对抗性思维**
7.  探索 [代理检测](./proxy-detection.md)
8.  从防御者的角度学习检测技术
9.  应用规避策略

**阶段 4：动手实践**
10. 按照 [构建代理](./build-proxy.md) 动手实现代理服务器
11. 使用 Wireshark 捕获和分析流量
12. 测试代理链和轮换策略

**阶段 5：操作安全**
13. 查看 [法律与道德](./proxy-legal.md) 准则
14. 理解合规性要求
15. 制定负责任的自动化策略


## 理念

网络和安全知识是 **基础性的力量**。与特定框架的技能（会过时）不同，协议知识是 **永恒的**：

- TCP 自 RFC 793 (1981) 以来没有根本改变
- TLS 建立在 SSL (1995) 的概念之上
- HTTP/2 (2015) 和 HTTP/3 (2022) 是演进，而不是革命

一次掌握这些概念，您将在职业生涯的剩余时间里理解您遇到的 **每一个基于网络的系统**。

## 道德承诺

在继续之前，请确认：

- 我理解代理可用于合法和恶意目的
- 我将尊重网站的服务条款和 robots.txt
- 我将实现速率限制和友好的爬取策略
- 我不会将此知识用于欺诈、滥用或非法活动
- 当不确定合规性时，我将咨询法律顾问

**能力越大，责任越大。** 请明智地使用这些知识。

---

## 准备好开始了吗？

从 **[网络基础](./network-fundamentals.md)** 开始您的旅程，以构建基础，然后按顺序浏览各个模块。每个文档都建立在前一个文档的基础之上，帮助您全面了解用于自动化的网络架构。

**这是脚本小子成为工程师的地方。让我们开始吧。**

---

!!! info "文档状态"
    本模块综合了来自 RFC、协议规范、安全研究和真实世界测试的知识。每个代码示例都是可用于生产的。如果您发现不准确之处或有改进意见，欢迎贡献。

## 快速导航

**核心协议：**
- [网络基础](./network-fundamentals.md) - TCP/IP, UDP, WebRTC
- [HTTP/HTTPS 代理](./http-proxies.md) - 应用层代理
- [SOCKS 代理](./socks-proxies.md) - 会话层代理

**高级主题：**
- [代理检测](./proxy-detection.md) - 匿名与规避
- [构建代理](./build-proxy.md) - 从头开始实现
- [法律与道德](./proxy-legal.md) - 合规与责任

**相关模块：**
- [指纹识别](../fingerprinting/index.md) - 检测技术
- [浏览器配置](../../features/configuration/browser-options.md) - 实际设置

================================================
FILE: docs/zh/deep-dive/network/network-fundamentals.md
================================================
# 网络基础

本文档涵盖了驱动互联网的基础网络协议，以及它们如何在自动化场景中暴露或保护您的身份。充分理解 TCP、UDP、OSI 模型和 WebRTC，将使代理配置不再神秘，并且更加有效。

!!! info "模块导航"
    - [网络与安全概述](./index.md)：模块介绍和学习路径
    - [HTTP/HTTPS 代理](./http-proxies.md)：应用层代理
    - [SOCKS 代理](./socks-proxies.md)：会话层代理

    有关 Pydoll 的实际用法，请参阅[代理配置](../../features/configuration/proxy.md)和[浏览器选项](../../features/configuration/browser-options.md)。

## 网络堆栈

浏览器发出的每一个 HTTP 请求都会经过一个分层的网络堆栈。每一层都有特定的职责、协议和安全影响。代理在不同的层运行，运行的层决定了代理能看到、修改和隐藏什么。低层的网络特征即使通过代理也能对您的真实系统进行 fingerprinting，因此理解协议栈有助于了解身份泄露发生在哪里，以及如何防止它们。

### OSI 模型

OSI（开放系统互连）模型由 ISO 于 1984 年制定，提供了一个概念框架来理解网络协议是如何交互的。现实世界的网络使用 TCP/IP 模型（早于 OSI，只有 4 层），但 OSI 术语仍然是描述代理运行位置及其可访问内容的标准方式。

```mermaid
graph TD
    L7[Layer 7: Application - HTTP, FTP, SMTP, DNS]
    L6[Layer 6: Presentation - Encryption, Compression]
    L5[Layer 5: Session - SOCKS]
    L4[Layer 4: Transport - TCP, UDP]
    L3[Layer 3: Network - IP, ICMP]
    L2[Layer 2: Data Link - Ethernet, WiFi]
    L1[Layer 1: Physical - Cables, Radio Waves]

    L7 --> L6 --> L5 --> L4 --> L3 --> L2 --> L1
```

第 7 层（应用层）是面向用户的协议所在层：HTTP、HTTPS、FTP、SMTP 和 DNS 都在这里运行。这一层包含应用程序关心的实际数据，如 HTML 文档、JSON 响应和文件传输。HTTP 代理在这一层运行，因此对请求和响应内容具有完全的可见性。

第 6 层（表示层）处理数据格式转换、加密和压缩。SSL/TLS 通常与这一层关联，因为它承担加密职责，但实际上 TLS 横跨第 4 层到第 6 层，无法干净地映射到单个 OSI 层。对自动化来说重要的是，HTTPS 加密发生在这里，在数据传递到下层之前对第 7 层数据进行加密。

第 5 层（会话层）管理应用程序之间的连接。SOCKS 代理在这一层运行，低于应用层但高于传输层。这个位置使得 SOCKS 与协议无关：它可以代理任何第 7 层协议（HTTP、FTP、SMTP、SSH），而无需理解它们的具体内容。

第 4 层（传输层）提供端到端的数据传输。TCP（面向连接、可靠）和 UDP（无连接、快速）是这一层的主要协议。这一层处理端口号、流量控制和错误纠正。所有代理最终都依赖第 4 层进行实际的数据传输。

第 3 层（网络层）处理网络之间的路由和寻址。IP（互联网协议）在这一层运行，管理 IP 地址和路由决策。您的真实 IP 地址就在这一层，也是代理试图替换它的地方。

第 2 层（数据链路层）管理同一物理网段上的通信。以太网、Wi-Fi 和 PPP 在这里运行，处理 MAC 地址和帧传输。MAC 地址仅在本地网段可见，远程服务器无法直接访问，但它们可能通过 IPv6 SLAAC（将 MAC 嵌入地址中）等协议暴露。

第 1 层（物理层）是实际的硬件：电缆、无线电波和电压水平。与软件自动化几乎无关。

!!! tip "OSI vs TCP/IP"
    TCP/IP 模型（4 层：链路层、互联网层、传输层、应用层）是网络实际使用的模型。OSI（7 层）是教学工具和参考模型。当人们说"第 7 层代理"时，他们使用的是 OSI 术语，但实际实现运行在 TCP/IP 上。

### 层级位置如何影响代理

代理运行的层级决定了它能做什么和不能做什么。

HTTP/HTTPS 代理运行在第 7 层（应用层）。因为它们理解 HTTP，所以可以读取和修改 URL、标头、Cookie 和请求正文。它们可以根据 HTTP 语义智能缓存响应，按 URL 或关键字过滤内容，以及注入身份验证标头。代价是它们只理解 HTTP。它们无法代理 FTP、SMTP、SSH 或其他协议，而且检查 HTTPS 内容需要 TLS 终止，即解密然后重新加密流量。

SOCKS 代理运行在第 5 层（会话层）。因为它们位于应用层之下，所以与协议无关，可以在不修改的情况下代理任何第 7 层协议。HTTPS 流量以端到端加密方式通过，因为 SOCKS 代理无需对其解密。SOCKS5 还支持 UDP，使其能够代理 DNS 查询、VoIP 和其他基于 UDP 的协议。代价是 SOCKS 代理对应用层数据没有可见性：它们无法缓存、按 URL 过滤或检查内容。它们只能按 IP 和端口进行过滤。

!!! note "根本性的权衡"
    更高层（第 7 层）给您更多控制，但灵活性更低。更低层（第 5 层）给您更少控制，但灵活性更高。需要内容控制时选择 HTTP 代理，需要协议灵活性或端到端加密时选择 SOCKS 代理。

### 层泄露问题

即使有完美的第 7 层代理，低层的特征也能暴露您的真实身份。您操作系统的 TCP 堆栈在第 4 层有独特的 fingerprint，由窗口大小、选项顺序和 TTL 值定义。第 3 层的 IP 标头字段（如 TTL 和分片行为）会揭示您的操作系统和网络拓扑。

例如，如果您配置代理来显示 "Windows 10" 的 User-Agent，但您实际 Linux 系统的 TCP fingerprint 在第 4 层与此相矛盾，复杂的检测系统就能将这种不一致标记为强烈的机器人指标。这就是网络级 fingerprinting（在[网络指纹](../fingerprinting/network-fingerprinting.md)中介绍）如此危险的原因：它运行在代理层之下，即使应用层代理完美无缺，也会暴露您的真实系统。

## TCP vs UDP

在第 4 层（传输层），两种根本不同的协议主导着互联网通信。它们代表了相反的设计理念：可靠性与速度。

TCP 是面向连接的。可以把它想象成打电话：您建立连接，确认对方正在收听，可靠地交换数据，然后挂断。每个字节都会被确认、排序，并保证到达。UDP 是无连接的。您发送数据，希望它能到达。没有 handshake，没有确认，没有保证。只有原始的速度和最小的开销。

| 特性 | TCP | UDP |
|---------|-----|-----|
| 连接 | 面向连接（需要 handshake） | 无连接（无需 handshake） |
| 可靠性 | 保证交付，有序数据包 | 尽力而为交付，数据包可能丢失 |
| 速度 | 较慢（可靠性机制带来开销） | 较快（最小开销） |
| 用例 | 网页浏览、文件传输、电子邮件 | 视频流、DNS 查询、游戏 |
| 标头大小 | 最小 20 字节（带选项时可达 60） | 固定 8 字节 |
| 流量控制 | 有（滑动窗口，接收方驱动） | 无（发送方随意传输） |
| 拥塞控制 | 有（网络拥塞时减速） | 无（应用程序的责任） |
| 错误检查 | 广泛（校验和 + 确认） | 基本（仅校验和；在 IPv4 中可选，在 IPv6 中强制） |
| 排序 | 乱序接收时重新排序数据包 | 无排序，按接收顺序交付 |
| 重传 | 自动（丢失的数据包会重传） | 无（应用程序必须处理） |

### TCP 与代理

所有代理协议（HTTP、HTTPS、SOCKS4、SOCKS5）都使用 TCP 作为其控制通道。这是因为代理身份验证和命令交换需要保证交付，代理协议有严格的命令序列（handshake，然后认证，然后数据），代理需要持久连接来跟踪客户端状态。

然而，SOCKS5 还可以代理 UDP 流量，这与 SOCKS4 或 HTTP 代理不同。这使得 SOCKS5 对于代理 DNS 查询、WebRTC 音频/视频、VoIP 和游戏协议至关重要。

!!! danger "UDP 与 IP 泄露"
    大多数浏览器连接使用 TCP（HTTP、WebSocket 等），但 WebRTC 直接使用 UDP，绕过了浏览器的代理配置。这是代理浏览器自动化中 IP 泄露的最常见原因：您的 TCP 流量通过代理传输，而 UDP 流量却泄露了您的真实 IP。

### TCP 三次握手

在传输任何数据之前，TCP 需要通过三次握手来建立连接。这个协商过程同步序列号，商定窗口大小，并在两端建立连接状态。

```mermaid
sequenceDiagram
    participant Client
    participant Server

    Client->>Server: SYN (Synchronize, seq=x)
    Note over Client,Server: Client requests connection

    Server->>Client: SYN-ACK (seq=y, ack=x+1)
    Note over Client,Server: Server acknowledges and sends its own SYN

    Client->>Server: ACK (ack=y+1)
    Note over Client,Server: Connection established, data transfer begins
```

该过程从客户端发送 SYN（同步）包开始，其中包含一个随机的初始序列号（ISN），例如 `seq=1000`。除了 ISN 之外，还会协商 TCP 选项：窗口大小、最大分段大小（MSS）、时间戳和 SACK 支持。

服务器以 SYN-ACK 响应：它选择自己的随机 ISN（例如 `seq=5000`），并通过设置 `ack=1001`（客户端的 ISN + 1）来确认客户端的 ISN。这个单一的包既建立了服务器到客户端的方向（SYN），又确认了客户端到服务器的方向（ACK）。服务器还会返回自己的 TCP 选项。

然后客户端发送最终的 ACK，确认服务器的 ISN（`ack=5001`）。此时连接在两个方向上都已完全建立，数据传输可以开始。

ISN 是随机化的而非从零开始，以防止 TCP 劫持攻击。如果 ISN 是可预测的，攻击者可以通过猜测序列号将数据包注入到现有连接中。现代系统使用加密随机性来选择 ISN（RFC 6528）。

### TCP Fingerprinting

TCP handshake 揭示了能够 fingerprint 您操作系统的特征。不同操作系统对初始窗口大小、TCP 选项顺序、TTL（生存时间）、窗口缩放因子和时间戳行为使用不同的默认值。这些值由内核设置，而不是浏览器，因此代理无法更改它们。

以下是现代操作系统的示例值。请注意，实际值因操作系统版本、内核配置和网络调优而异：

```
Windows 10/11 (modern builds):
    Window Size: 65535
    MSS: 1460
    Options: MSS, NOP, WS, NOP, NOP, SACK_PERM
    TTL: 128

Linux (kernel 5.x+, Ubuntu 20.04+):
    Window Size: 29200
    MSS: 1460
    Options: MSS, SACK_PERM, TS, NOP, WS
    TTL: 64

macOS (Monterey+):
    Window Size: 65535
    TTL: 64
```

这些差异烙印在内核中。代理无法更改它们，因为它们是由您的操作系统而不是浏览器设置的。这就是复杂的检测系统即使通过代理也能识别您的原因。

!!! warning "代理的局限性"
    HTTP 和 SOCKS 代理运行在 TCP 层之上。它们无法修改 TCP handshake 特征。您操作系统的 TCP fingerprint 始终暴露给代理服务器以及您和代理之间的任何网络观察者。只有 VPN 级别的解决方案或操作系统级的 TCP 堆栈配置才能解决这个问题。

!!! note "TCP Fingerprinting 之外"
    TCP handshake 只是第一个 fingerprinting 机会。紧接着，TLS handshake 会揭示另一个独特的 fingerprint，即 JA3/JA4。详情请参阅[网络指纹](../fingerprinting/network-fingerprinting.md)。

### UDP

与 TCP 可靠、面向连接的方法不同，UDP 是一种"发射后不管"的协议。它以可靠性换取最小的延迟和开销，使其成为实时应用的理想选择，因为在这些应用中速度比完美交付更重要。

UDP 数据报只有 8 字节标头（相比 TCP 的 20-60 字节），包含源端口、目标端口、长度和校验和。没有连接建立，没有可靠性保证，没有流量控制，没有拥塞控制。如果数据包丢失，应用程序必须自行决定是否以及如何处理。

UDP 适用于实时通信（通过 WebRTC 和 VoIP 进行的语音/视频通话）、游戏（低延迟的状态更新）、流媒体（偶尔的帧丢失可以接受）和 DNS 查询（小型请求/响应对，应用程序处理重试）。它不适合文件传输、网页浏览、电子邮件或数据库，这些都需要可靠、有序的交付。

DNS 在自动化上下文中是一个特别重要的例子。DNS 使用 UDP 是因为查询通常很小，并且受益于 UDP 零 handshake 的开销优势。虽然 EDNS0（RFC 6891）将最大 UDP DNS 负载增加到了原始 512 字节限制之上，但大多数查询仍然很紧凑。如果响应未在超时时间内到达，DNS 客户端会在应用层处理重试。

对于浏览器自动化，UDP 的关键问题是 WebRTC 使用它进行实时音频和视频，DNS 查询使用它进行域名解析，而大多数代理（HTTP、HTTPS、SOCKS4）只处理 TCP。除非您显式配置 UDP 代理，否则这些流量会绕过您的代理并泄露您的真实 IP。

| 代理类型 | UDP 支持 | 说明 |
|------------|-------------|-------|
| HTTP 代理 | 否 | 只代理基于 TCP 的 HTTP/HTTPS |
| HTTPS 代理 (CONNECT) | 否 | CONNECT 方法只建立 TCP 隧道 |
| SOCKS4 | 否 | 仅 TCP 协议 |
| SOCKS5 | 是 | 通过 `UDP ASSOCIATE` 命令支持 UDP 中继 |
| VPN | 是 | 隧道传输所有 IP 流量（TCP 和 UDP） |

为了在浏览器自动化中实现真正的匿名，您至少需要采用以下方案之一：使用支持 UDP 的 SOCKS5 代理并将 WebRTC 配置为通过它路由；完全禁用 WebRTC（这会破坏视频会议）；使用隧道传输所有流量的 VPN；或者设置浏览器标志 `--force-webrtc-ip-handling-policy=disable_non_proxied_udp`。

### QUIC 与 HTTP/3

现代浏览器越来越多地使用 QUIC（RFC 9000），这是一种基于 UDP 的传输协议，为 HTTP/3 提供支持。由于 QUIC 运行在 UDP 上，它与 WebRTC 和 DNS 存在相同的代理绕过问题：大多数 HTTP 代理无法处理 QUIC 流量，它可能会泄露到您的代理配置之外。

在自动化场景中，考虑使用 `--disable-quic` Chrome 标志禁用 QUIC，以强制使用基于 TCP 的 HTTP/2，确保所有网页流量通过您的代理。QUIC 还有自己的 fingerprinting 特征，类似于 TLS 的 JA3，增加了另一个检测向量。

## WebRTC 与 IP 泄露

WebRTC（Web 实时通信）是 W3C 标准化的浏览器 API，支持浏览器之间直接进行点对点的音频、视频和数据通信，无需插件或中介服务器。虽然 WebRTC 对实时应用功能强大，但它是代理浏览器自动化中最大的 IP 泄露源。

### WebRTC 如何泄露您的 IP

WebRTC 专为直接的点对点连接设计，优先考虑低延迟而非隐私。为了建立 P2P 连接，WebRTC 必须发现您的真实公共 IP 地址并与远程对等方共享，即使您的浏览器配置为使用代理。

问题是这样展开的：您的浏览器使用代理处理 HTTP/HTTPS 流量（即 TCP），但 WebRTC 使用 STUN 服务器通过 UDP 发现您的真实公共 IP。STUN 查询绕过代理，因为大多数代理只处理 TCP。您的真实 IP 被发现并作为连接协商的一部分与远程对等方共享。页面上的 JavaScript 可以读取这些"ICE 候选者"并将您的真实 IP 发送到网站的服务器。

!!! danger "WebRTC 泄露的严重性"
    即使正确配置了 HTTP 代理、HTTPS 代理工作正常、DNS 查询被代理、User-Agent 被伪造、canvas fingerprinting 被缓解，WebRTC 仍然可以在毫秒内泄露您的真实 IP。这是因为 WebRTC 运行在浏览器的代理层之下，直接与操作系统的网络堆栈交互。

### ICE 过程

WebRTC 使用 ICE（交互式连接建立，RFC 8445）来发现可能的连接路径并选择最佳路径。这个过程本身就会揭示您的网络拓扑，它收集三种类型的候选者。

```mermaid
sequenceDiagram
    participant Browser
    participant STUN as STUN Server
    participant TURN as TURN Relay
    participant Peer as Remote Peer

    Note over Browser: WebRTC connection initiated

    Browser->>Browser: Gather local IP addresses<br/>(LAN interfaces)
    Note over Browser: Local candidate:<br/>192.168.1.100:54321

    Browser->>STUN: STUN Binding Request (over UDP)
    Note over STUN: STUN server discovers public IP<br/>(bypasses proxy!)
    STUN->>Browser: STUN Response with real public IP
    Note over Browser: Server reflexive candidate:<br/>203.0.113.45:54321

    Browser->>TURN: Allocate relay (if needed)
    TURN->>Browser: Relay address assigned
    Note over Browser: Relay candidate:<br/>198.51.100.10:61234

    Browser->>Peer: Send all ICE candidates<br/>(local + public + relay)
    Note over Peer: Now knows your:<br/>- LAN IP<br/>- Real public IP<br/>- Relay address

    Peer->>Browser: Send ICE candidates

    Note over Browser,Peer: ICE negotiation: try direct P2P first

    alt Direct P2P succeeds
        Browser<<->>Peer: Direct connection (bypasses proxy entirely!)
    else Direct P2P fails (firewall/NAT)
        Browser->>TURN: Use TURN relay
        TURN<<->>Peer: Relayed connection
        Note over Browser,Peer: Higher latency, but works
    end
```

### ICE 候选者类型

ICE 发现三种类型的候选者（可能的连接端点），每种类型揭示关于您网络的不同信息。

**主机候选者**是您的本地局域网 IP 地址。浏览器枚举所有本地网络接口，并为每个接口创建候选者。这会揭示您在专用网络上的本地 IP 地址、网络拓扑（是否存在 VPN 接口、虚拟机网桥）以及网络接口的数量。

```javascript
// Example host candidates
candidate:1 1 UDP 2130706431 192.168.1.100 54321 typ host
candidate:2 1 UDP 2130706431 10.0.0.5 54322 typ host
```

现代浏览器（Chrome 75+、Firefox 78+、Safari）通过在未授予媒体权限（摄像头/麦克风）时将本地 IP 地址替换为临时的 mDNS 名称（例如 `a1b2c3d4.local`）来缓解主机候选者泄露。然而，无论 mDNS 如何，服务器自反候选者（您的公共 IP）仍然会暴露。

**服务器自反候选者**是 STUN 服务器看到的您的公共 IP。浏览器向公共 STUN 服务器发送请求，后者回复您的公共 IP 地址。这就是人们常说的泄露：您的代理显示一个 IP，但 WebRTC 揭示了您的真实 IP，连同您的 NAT 类型、外部端口映射和 ISP 信息。

```javascript
// Server reflexive candidate (your real public IP)
candidate:4 1 UDP 1694498815 203.0.113.45 54321 typ srflx raddr 192.168.1.100 rport 54321
```

**中继候选者**是在直接 P2P 失败时用作后备的 TURN 服务器地址。根据 TURN 服务器实现的不同，中继候选者的 `raddr`（远程地址）字段中可能仍然包含您的真实 IP。

```javascript
// Relay candidate (TURN server address)
candidate:5 1 UDP 16777215 198.51.100.10 61234 typ relay raddr 203.0.113.45 rport 54321
```

### STUN 协议

STUN（NAT 会话穿透实用工具，RFC 8489）是一个简单的基于 UDP 的请求-响应协议。它的工作很直接：客户端询问"您看到的我是什么 IP？"，服务器回复客户端的公共 IP 和端口。

客户端发送一个绑定请求，其中包含一个魔法 Cookie（`0x2112A442`，RFC 定义的固定值）和一个随机的 12 字节事务 ID。服务器响应一个绑定成功响应，其中包含一个 `XOR-MAPPED-ADDRESS` 属性，包含从服务器角度看到的客户端公共 IP 和端口。

响应中的 IP 地址与魔法 Cookie 和事务 ID 进行了异或运算。这不是为了安全，而是为了 NAT 兼容性：一些 NAT 设备会错误地修改数据包负载中的 IP 地址，异或运算混淆了地址以防止这种干扰。

浏览器常用的公共 STUN 服务器包括 `stun.l.google.com:19302`（Google）、`stun1.l.google.com:19302`（Google）、`stun.services.mozilla.com`（Mozilla）和 `stun.stunprotocol.org:3478`。

### 为什么代理无法阻止 WebRTC 泄露

WebRTC 泄露发生有几个相互强化的原因。首先，WebRTC 使用 UDP，而大多数代理（HTTP、HTTPS CONNECT、SOCKS4）只处理 TCP。只有 SOCKS5 支持 UDP，即便如此，浏览器也必须显式配置为通过它路由 WebRTC。

其次，WebRTC 是一个运行在 HTTP 层之下的浏览器 API。它直接访问操作系统网络堆栈，绕过为 HTTP/HTTPS 配置的代理设置。STUN 查询直接进入网络接口，操作系统路由表决定它们的路径，而不是浏览器的代理配置。只有 VPN 级别的路由才能拦截它们。

第三，WebRTC 枚举所有网络接口（物理以太网、Wi-Fi、VPN 适配器、虚拟机网桥），包括未用于常规浏览的接口。这会泄露您的内部网络拓扑。

最后，网页可以通过 JavaScript 使用 `RTCPeerConnection.onicecandidate` 事件读取 ICE 候选者，用简单的正则表达式从候选者字符串中提取 IP 地址，并将您的真实 IP 发送到他们的跟踪服务器。

### 在 Pydoll 中防止 WebRTC 泄露

Pydoll 提供了多种策略来防止 WebRTC IP 泄露。

**方法 1：强制 WebRTC 仅使用代理路由（推荐）**

```python
from pydoll.browser import Chrome
from pydoll.browser.options import ChromiumOptions

options = ChromiumOptions()
options.webrtc_leak_protection = True  # Adds --force-webrtc-ip-handling-policy=disable_non_proxied_udp
```

Pydoll 提供了一个便捷的 `webrtc_leak_protection` 属性来管理底层的 Chrome 标志。这会在没有代理支持 UDP 时禁用 UDP，强制 WebRTC 仅使用 TURN 中继（不使用直接 P2P），并阻止对公共服务器的 STUN 查询。代价是视频通话的延迟更高，因为直接 P2P 连接被禁用。

**方法 2：完全禁用 WebRTC**

```python
options.add_argument('--disable-features=WebRTC')
```

这会完全禁用 WebRTC API，消除通过此向量发生 IP 泄露的任何可能性。代价是所有依赖 WebRTC 的网站（视频会议、语音通话）将无法工作。请注意，此标志应在您的特定 Chrome 版本上测试，因为功能标志名称可能因版本而异。

**方法 3：通过浏览器首选项限制 WebRTC**

```python
options.browser_preferences = {
    'webrtc': {
        'ip_handling_policy': 'disable_non_proxied_udp',
        'multiple_routes_enabled': False,
        'nonproxied_udp_enabled': False,
        'allow_legacy_tls_protocols': False
    }
}
```

这与方法 1 效果相同，但通过首选项而非命令行标志实现。`multiple_routes_enabled` 防止使用多个网络路径，`nonproxied_udp_enabled` 阻止不通过代理的 UDP。

**方法 4：使用支持 UDP 的 SOCKS5 代理**

```python
options.add_argument('--proxy-server=socks5://proxy.example.com:1080')
options.add_argument('--force-webrtc-ip-handling-policy=default_public_interface_only')
```

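SOCKS5 可以通过其 `UDP ASSOCIATE` 命令代理 UDP，允许 WebRTC 的 STUN 查询通过代理。这需要实际支持 UDP 中继的 SOCKS5 代理，而并非所有代理都支持。另请注意，Chrome 自身的 SOCKS5 实现不会使用 `UDP ASSOCIATE`（详见 [SOCKS 代理](./socks-proxies.md)），因此在 Chrome 中不应单独依赖此方法，请结合方法 1 使用，并始终通过泄露测试验证实际行为。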

!!! warning "SOCKS5 身份验证"
    Chrome 不支持通过 `--proxy-server` 标志内联 SOCKS5 身份验证（例如 `socks5://user:pass@host:port`）。Pydoll 提供了内置的 `SOCKS5Forwarder` 来解决此限制，它运行一个本地无需身份验证的 SOCKS5 代理，将流量转发到远程经过身份验证的代理，代替 Chrome 处理用户名/密码握手。详情请参阅[代理配置](../../features/configuration/proxy.md)。

### 测试 WebRTC 泄露

您可以通过访问 [browserleaks.com/webrtc](https://browserleaks.com/webrtc) 并检查"Public IP Address"部分来手动测试。如果您看到的是您的真实 IP 而不是代理 IP，则说明存在泄露。

使用 Pydoll 进行自动化测试：

```python
import asyncio
from pydoll.browser import Chrome
from pydoll.browser.options import ChromiumOptions

async def test_webrtc_leak():
    options = ChromiumOptions()
    options.add_argument('--proxy-server=http://proxy.example.com:8080')
    options.add_argument('--force-webrtc-ip-handling-policy=disable_non_proxied_udp')

    async with Chrome(options=options) as browser:
        tab = await browser.start()
        await tab.go_to('https://browserleaks.com/webrtc')

        await asyncio.sleep(3)

        ips = await tab.execute_script('''
            return Array.from(document.querySelectorAll('.ip-address'))
                .map(el => el.textContent.trim());
        ''')

        print("Detected IPs:", ips)
        # Should only show proxy IP, not your real IP

asyncio.run(test_webrtc_leak())
```

!!! danger "务必测试 WebRTC 泄露"
    切勿假设您的代理配置能阻止 WebRTC 泄露。始终使用 [browserleaks.com/webrtc](https://browserleaks.com/webrtc) 或 [ipleak.net](https://ipleak.net) 进行验证。即使是单个 WebRTC 泄露也会立即危及您的整个代理设置，因为网站现在知道了您的真实位置、ISP 和网络拓扑。

### 网站如何利用 WebRTC 泄露

网站可以用几行 JavaScript 有意触发 WebRTC 来提取您的真实 IP：

```javascript
const pc = new RTCPeerConnection({
    iceServers: [{urls: 'stun:stun.l.google.com:19302'}]
});

pc.createDataChannel('');
pc.createOffer().then(offer => pc.setLocalDescription(offer));

pc.onicecandidate = (event) => {
    if (event.candidate) {
        const ipRegex = /([0-9]{1,3}(\.[0-9]{1,3}){3})/;
        const ipMatch = event.candidate.candidate.match(ipRegex);

        if (ipMatch) {
            const realIP = ipMatch[1];
            fetch(`/track?real_ip=${realIP}&proxy_ip=${window.clientIP}`);
        }
    }
};
```

这段代码创建一个 RTCPeerConnection，触发 ICE 候选者收集（联系 STUN 服务器），用正则表达式从候选者中提取 IP 地址，并将您的真实 IP 发送到跟踪服务器。按照上述方法禁用 WebRTC 或强制仅使用代理路由可以防止这种情况。

## 总结

代理运行在网络堆栈的特定层：HTTP 在第 7 层，SOCKS 在第 5 层。层级决定了代理能看到、修改和隐藏什么。TCP fingerprint（窗口大小、选项、TTL）从低层泄露，即使通过代理也会揭示您的真实操作系统。UDP 流量（包括 WebRTC 和 DNS）除非显式配置，否则通常会绕过代理。WebRTC 是 IP 泄露最常见的来源，只有 SOCKS5 或 VPN 才能有效代理 UDP 流量。现代浏览器还使用 QUIC（基于 UDP 的 HTTP/3），增加了另一个潜在的绕过向量。

**后续步骤：**

- [HTTP/HTTPS 代理](./http-proxies.md)：应用层代理
- [SOCKS 代理](./socks-proxies.md)：会话层、协议无关的代理
- [网络指纹](../fingerprinting/network-fingerprinting.md)：TCP/IP 和 TLS fingerprinting 技术
- [代理配置](../../features/configuration/proxy.md)：实用 Pydoll 代理设置

## 参考资料

- RFC 793: Transmission Control Protocol (TCP) - https://tools.ietf.org/html/rfc793
- RFC 768: User Datagram Protocol (UDP) - https://tools.ietf.org/html/rfc768
- RFC 8489: Session Traversal Utilities for NAT (STUN) - https://tools.ietf.org/html/rfc8489
- RFC 8445: Interactive Connectivity Establishment (ICE) - https://tools.ietf.org/html/rfc8445
- RFC 8656: Traversal Using Relays around NAT (TURN) - https://tools.ietf.org/html/rfc8656
- RFC 6528: Defending Against Sequence Number Attacks - https://tools.ietf.org/html/rfc6528
- RFC 9000: QUIC: A UDP-Based Multiplexed and Secure Transport - https://tools.ietf.org/html/rfc9000
- W3C WebRTC 1.0: Real-Time Communication Between Browsers - https://www.w3.org/TR/webrtc/
- BrowserLeaks: WebRTC Leak Test - https://browserleaks.com/webrtc
- IPLeak: Comprehensive Leak Testing - https://ipleak.net


================================================
FILE: docs/zh/deep-dive/network/proxy-detection.md
================================================
# Proxy 检测

Proxy 检测是一个概率性过程。网站结合数十种信号来评估连接是否经过 proxy，从简单的 IP 信誉查询到 TCP/IP 协议栈分析和行为画像，不一而足。任何单一信号都无法提供确定性证据，但将足够多的弱信号组合在一起，就能产生高置信度的判断。

本文档涵盖主要的检测技术、其技术层面的工作原理，以及它们对使用 Pydoll 进行浏览器自动化意味着什么。

!!! info "模块导航"
    - [SOCKS Proxy](./socks-proxies.md)：会话层代理
    - [HTTP/HTTPS Proxy](./http-proxies.md)：应用层代理
    - [网络基础](./network-fundamentals.md)：TCP/IP、UDP、WebRTC

    有关 fingerprinting 的详细信息，请参阅[网络 Fingerprinting](../fingerprinting/network-fingerprinting.md) 和[浏览器 Fingerprinting](../fingerprinting/browser-fingerprinting.md)。

## IP 信誉

IP 信誉分析是部署最广泛的 proxy 检测技术。它结合公开可用的数据（ASN 记录、WHOIS、地理定位数据库）和专有情报，将 IP 地址分类为不同的风险等级。

### ASN 分类

每个 IP 地址都属于一个自治系统（AS），由 ASN 标识。拥有该 IP 的 AS 类型是判断其是否为 proxy 的最强单一指标。

属于云服务和托管提供商（AWS、DigitalOcean、OVH、Hetzner）的 IP 被标记为高风险，因为真实用户不会从数据中心服务器浏览网页。来自住宅 ISP（Comcast、Deutsche Telekom、BT）的 IP 风险较低，因为它们看起来像普通的家庭连接。移动运营商 IP（Verizon Wireless、AT&T Mobility）风险最低，因为它们最难与真实的移动用户区分开来。

一些 ASN 与已知的 proxy 基础设施相关联，但这比表面看起来更复杂。像 BrightData 或 Smartproxy 这样的大型住宅 proxy 提供商并不运营自己的 ASN；它们通过属于 ISP ASN 的真实住宅 IP 路由流量。这正是住宅 proxy 比数据中心 proxy 更难检测的原因。

检测系统查询 ASN 数据库（Team Cymru、RIPE NCC、ARIN）和商业 IP 情报 API 来分类每个连接 IP。数据中心 IP 的检测准确率大约在 95% 以上，因为 ASN 分类是明确的。住宅 proxy 的检测要困难得多（准确率大约 40-70%），因为这些 IP 确实属于 ISP。移动 proxy 的检测最为困难（大约 20-40%），因为移动运营商 NAT 使许多真实用户共享 IP。

这种准确率梯度正是住宅和移动 proxy 价格比数据中心 proxy 高出 10-100 倍的原因。

### 已知 Proxy 数据库

除了 ASN 分类之外，专门的数据库会追踪已被观察到参与 proxy 网络的 IP。IPQualityScore、proxycheck.io 和 Spur.us 等服务维护着已知 proxy、VPN 和 Tor 出口节点 IP 的实时数据库。Tor 出口节点列表可在 [check.torproject.org](https://check.torproject.org/torbulkexitlist) 公开获取。

这些数据库还会追踪行为信号：频繁轮换的 IP（proxy 池的典型特征）、并发会话数异常高的 IP（住宅 IP 通常只有 1-5 个并发连接，而不是 100+），以及之前与机器人行为关联的 IP。

### 地理位置一致性

Proxy 经常通过地理不一致性暴露自己。IP 地址指向一个位置，但浏览器报告的信号指向另一个位置。

最常见的不匹配包括：IP 地理位置与浏览器时区之间的不匹配（通过 JavaScript 的 `Intl.DateTimeFormat().resolvedOptions().timeZone` 收集）、IP 所在国家与 `Accept-Language` 标头之间的不匹配，以及当前会话位置与上一个会话位置之间的不匹配。一个出现在洛杉矶但浏览器时区为 `Europe/Berlin` 的用户是可疑的。一个在上一次会话位于纽约后 10 分钟出现在东京的用户在物理上是不可能的。

检测系统还会检查 IP 的地理位置是否与浏览器的区域配置匹配。一个美国数据中心 IP 配上 `Accept-Language: zh-CN` 和时区 `Asia/Shanghai`，强烈暗示这是一个通过美国 proxy 路由的中国用户。

!!! note "误报"
    合法场景也会触发地理位置警报：使用 VPN 的旅行者、浏览器设置保留母国配置的外籍人士、通过公司 VPN 连接的企业用户，以及使用非默认语言偏好的多语言用户。成熟的系统使用风险评分而非二元阻断来处理这些情况。

## HTTP 标头分析

HTTP 标头是最简单的检测途径。透明和匿名 proxy 会添加 `Via`、`X-Forwarded-For`、`X-Real-IP` 和 `Forwarded`（RFC 7239）等标头，直接暴露 proxy 的使用。精英 proxy 会剥离这些标头，但仅凭其缺失并不能证明是直连。

检测不仅限于寻找 proxy 专有标头。缺少真实浏览器总会发送的标头（如 `Accept-Language`、`Accept-Encoding` 或真实的 `User-Agent`）也很可疑。标头顺序同样重要：浏览器以一致的、版本特定的顺序发送标头，手动构造标头的 proxy 或自动化工具往往会搞错顺序。

旧版 `Proxy-Connection: keep-alive` 标头是另一个经典的检测信号，某些老旧客户端在通过 proxy 路由时会发送此标头。

### Proxy 匿名级别

Proxy 传统上根据其标头行为被分为三个匿名级别：

| 级别 | 行为 | 检测难度 |
|------|------|----------|
| 透明 | 在 `X-Forwarded-For` 中转发你的真实 IP，添加 `Via` 标头 | 极易检测 |
| 匿名 | 隐藏你的 IP 但添加 `Via` 或其他 proxy 标头 | 容易检测 |
| 精英 | 剥离所有标识 proxy 的标头 | 需要更深入的分析 |

这种分类来自 HTTP 标头分析作为主要检测方法的时代。现代检测系统使用 IP 信誉、fingerprinting 和行为分析，使得透明/匿名/精英的区分不再那么有意义。一个使用数据中心 IP 的精英 proxy 通过 ASN 查询就能立即被检测到。而一个使用住宅 IP 的透明 proxy 在不太成熟的网站上可能仍然不会被发现。

## 网络 Fingerprinting

网络层 fingerprinting 在 proxy 层之下运作，这意味着即使 proxy 本身配置完美，它也能检测到 proxy 的使用。

### TCP/IP Fingerprinting

每个操作系统都有独特的 TCP 协议栈实现，在 TCP 握手过程中会暴露出来。初始窗口大小、TCP 选项顺序、TTL（生存时间）和窗口缩放因子都由内核设置，而非浏览器，且无法被 proxy 更改。

检测系统将这些 TCP 特征与 `User-Agent` 标头进行比较。如果 User-Agent 声称是 Windows 10，但 TCP fingerprint 显示 Linux 特征（TTL 为 64，窗口大小为 29200），这种不匹配就是一个强 proxy 指标。Windows 使用默认 TTL 128，现代版本通常显示窗口大小 65535，而 Linux 使用 TTL 64，窗口大小约 29200。

TTL 分析增加了另一个层面。TTL 在每个网络跳点递减 1。如果一个 Windows 连接到达时 TTL 为 128，客户端很可能在同一网络上。如果到达时 TTL 为 115，则它经过了大约 13 个跳点。如果 TTL 值与 IP 地理位置的预期跳数不一致，则很可能存在 proxy 路由。

有关 TCP fingerprint 值及其含义的详细信息，请参阅[网络 Fingerprinting](../fingerprinting/network-fingerprinting.md)。

### TLS Fingerprinting（JA3/JA4）

TLS ClientHello 消息以明文传输，包含足够的参数来唯一标识客户端应用程序：TLS 版本、支持的密码套件、扩展、椭圆曲线和签名算法。JA3 fingerprint 是将这些参数按特定顺序拼接后的 MD5 哈希值。JA4 是一种更新、更细粒度的替代方案。

每个浏览器版本都会产生独特的 JA3/JA4 fingerprint。检测系统维护着 Chrome、Firefox、Safari 和其他浏览器的已知 fingerprint 数据库。如果 JA3 fingerprint 与任何已知浏览器不匹配，或者与 User-Agent 中声称的浏览器不匹配，该连接就会被标记。

一个重要的细节：SOCKS5 proxy 和 HTTP CONNECT 隧道会原样传递 TLS ClientHello，因此目标服务器看到的是真实浏览器的 fingerprint。在这些配置中，proxy 不会改变 TLS 参数。只有 MITM proxy（终止并重新建立 TLS 连接的 proxy）才会改变 fingerprint，在这种情况下 fingerprint 属于 proxy 软件而非真实浏览器，这本身就是一个检测信号。

### HTTP/2 Fingerprinting

HTTP/2 连接暴露出与 TLS 不同的 fingerprinting 信号。HTTP/2 连接开始时发送的 SETTINGS 帧包含 `HEADER_TABLE_SIZE`、`MAX_CONCURRENT_STREAMS`、`INITIAL_WINDOW_SIZE` 和 `MAX_HEADER_LIST_SIZE` 等参数。每个浏览器对这些设置使用不同的默认值。

伪标头（`:method`、`:authority`、`:scheme`、`:path`）的顺序和优先级、HPACK 压缩行为以及流优先级权重在不同浏览器之间也有所不同。[browserleaks.com/http2](https://browserleaks.com/http2) 等工具可以展示你的 HTTP/2 fingerprint 是什么样的。

实现了自己 HTTP/2 协议栈的自动化框架和 proxy 软件通常会产生与任何真实浏览器都不匹配的 fingerprint，使其成为一种有效的检测途径。

### 基于延迟的检测

客户端与服务器之间的网络延迟揭示了物理网络路径的信息。如果 IP 地理定位在纽约，但往返时间暗示路径经过了亚洲，则该连接很可能经过了 proxy。

检测系统在 TCP 握手期间测量 RTT（往返时间），并将其与 IP 地理位置的预期延迟进行比较。它们还可能发起基于 JavaScript 的计时挑战，从浏览器角度测量延迟，然后将其与服务器观察到的延迟进行比较。两者之间的显著差异暗示路径中存在中间节点（proxy）。

时钟偏移分析增加了另一个维度：通过 JavaScript（`Date.now()`）或 HTTP `Date` 标头测量客户端的时钟偏移量，检测系统可以推断客户端的实际时区，并将其与 IP 预期时区进行比较。

## 行为检测

最先进的检测系统超越了网络和协议分析，转而检查用户行为。这包括请求时序（请求是否均匀间隔，暗示自动化？）、鼠标移动模式（通过 JavaScript 事件监听器分析）、滚动行为、键盘输入节奏以及整体浏览模式。

基于数百万真实用户会话训练的机器学习模型能够以高准确率区分人类行为和自动化行为。这些模型通常结合 50 多个特征，包括导航模式、会话持续时间分布、点击位置、表单交互时序和 JavaScript 执行特征。

Pydoll 的人性化交互（贝塞尔曲线鼠标移动、Fitts 定律时序、真实的打字节奏）专为通过行为分析而设计。请参阅[规避技术](../fingerprinting/evasion-techniques.md)了解完整的多层规避策略。

## 多信号风险评分

现代检测系统不依赖任何单一技术。它们将所有可用信号组合成一个风险评分（通常为 0-100），并应用因行业和场景而异的阈值。

每类信号的权重各不相同，但粗略来说，IP 信誉占最大份额（它是最廉价且最可靠的信号），其次是网络 fingerprinting（TCP/IP、TLS、HTTP/2）、标头和协议分析、行为评分，以及一致性检查（地理位置、时区、语言）。

阈值取决于业务场景。银行网站阻断策略激进（风险评分超过 50 即阻断），电商网站在中等评分时展示 CAPTCHA（超过 70），内容网站则更为宽松（仅在超过 80 时阻断），因为它们依赖广告展示量。

这对自动化的启示是，仅通过一层检测是不够的。一个住宅 IP（良好的 IP 信誉）如果配上不匹配的 TCP fingerprint 和机器人行为，仍然会被标记。有效的规避需要所有层面的一致性。

## 按 Proxy 类型划分的检测难度

| Proxy 类型 | 检测难度 | 主要检测方法 |
|------------|----------|-------------|
| 透明 HTTP | 极易 | HTTP 标头（`Via`、`X-Forwarded-For`） |
| 匿名 HTTP | 容易 | HTTP 标头 + IP 信誉 |
| 精英 HTTP（数据中心） | 中等 | IP 信誉（ASN 分析） |
| 数据中心 SOCKS5 | 中等 | IP 信誉（ASN 分析） |
| 住宅 proxy | 困难 | 行为分析、连接模式、延迟 |
| 移动 proxy | 非常困难 | 主要靠行为分析，网络信号有限 |
| 轮换 proxy | 困难 | 会话不一致、IP 轮换模式 |

## 规避原则

有效的规避在于所有检测层面的一致性，而不是完善任何单一层面。

当隐蔽性重要时，使用住宅或移动 IP。它们更难被检测，因为这些 IP 确实属于 ISP，价格溢价反映了这一优势。将浏览器的地理位置信号（时区、语言、区域设置）与 proxy IP 的位置匹配。通过不在会话中途轮换 IP 来保持会话持久性，因为这会产生可检测的不连续性。确保你的 TCP/IP fingerprint 与 User-Agent 声明匹配，方法是在你所模拟的相同操作系统上运行自动化。使用 Pydoll 的人性化交互来通过行为分析。并且在大规模运行自动化之前，始终测试是否存在泄露（WebRTC、DNS、时区）。

目标不是使检测变得不可能，而是使其变得昂贵和不确定。迫使检测系统使用多个关联信号，融入合法流量模式，并创造合理的否认空间。

!!! warning "没有 Proxy 是不可检测的"
    拥有足够资源的情况下，任何 proxy 都可以被检测到。即使是顶级住宅 proxy 在面对 Akamai、Cloudflare Enterprise 和 DataDome 等成熟的反机器人系统时，成功率也大约只有 70-90%。实际问题在于，对于目标网站来说，检测是否在经济上值得。

**后续阅读：**

- [网络 Fingerprinting](../fingerprinting/network-fingerprinting.md)：TCP/IP 和 TLS fingerprinting 详解
- [浏览器 Fingerprinting](../fingerprinting/browser-fingerprinting.md)：Canvas、WebGL、HTTP/2 fingerprinting
- [规避技术](../fingerprinting/evasion-techniques.md)：多层规避策略
- [Proxy 配置](../../features/configuration/proxy.md)：Pydoll proxy 实用配置指南

## 参考资料

- MaxMind GeoIP2: https://www.maxmind.com/en/geoip2-services-and-databases
- IPQualityScore Proxy Detection: https://www.ipqualityscore.com/proxy-vpn-tor-detection-service
- Spur.us (Anonymous IP Detection): https://spur.us/
- Team Cymru IP to ASN Mapping: https://www.team-cymru.com/ip-asn-mapping
- Salesforce Engineering: TLS Fingerprinting with JA3 and JA3S - https://engineering.salesforce.com/tls-fingerprinting-with-ja3-and-ja3s-247362855967/
- Akamai: Passive Fingerprinting of HTTP/2 Clients (Black Hat EU 2017) - https://blackhat.com/docs/eu-17/materials/eu-17-Shuster-Passive-Fingerprinting-Of-HTTP2-Clients-wp.pdf
- Incolumitas: TCP/IP Fingerprinting for VPN and Proxy Detection - https://incolumitas.com/2021/03/13/tcp-ip-fingerprinting-for-vpn-and-proxy-detection/
- Incolumitas: Detecting Proxies and VPNs with Latencies - https://incolumitas.com/2021/06/07/detecting-proxies-and-vpn-with-latencies/
- BrowserLeaks HTTP/2 Fingerprint: https://browserleaks.com/http2
- BrowserLeaks IP: https://browserleaks.com/ip
- RFC 7239: Forwarded HTTP Extension - https://www.rfc-editor.org/rfc/rfc7239.html
- RFC 9110: HTTP Semantics - https://www.rfc-editor.org/rfc/rfc9110.html


================================================
FILE: docs/zh/deep-dive/network/proxy-legal.md
================================================
# 法律和道德考量

本文档提供了有关代理使用和网络自动化法律及道德环境的 **一般信息**。法律因司法管辖区和用例而异。本文 **不构成法律建议**。请务必就您的具体情况咨询合格的法律顾问。

!!! info "模块导航"
    - **[← 构建代理](./build-proxy.md)** - 实现与高级主题
    - **[← 代理检测](./proxy-detection.md)** - 匿名与规避
    - **[← 网络与安全概述](./index.md)** - 模块介绍
    
    有关负责任的自动化，请参阅 **[行为验证码绕过](../../features/advanced/behavioral-captcha-bypass.md)** 和 **[类人交互](../../features/automation/human-interactions.md)**。

!!! danger "法律免责声明"
    本文档仅提供 **教育信息**。它 **不是法律建议**。有关网络抓取、自动化和代理使用的法律因司法管辖区而异，并可能受到解释的影响。在从事可能具有法律影响的活动之前，请咨询合格的法律顾问。

## 法律和道德考量

代理的使用处于隐私、安全和合规的交叉点。了解法律环境对于负责任的自动化至关重要。

### 法规遵从

不同的司法管辖区对代理使用和数据收集有不同的规定：

| 地区 | 关键法规 | 对代理的影响 |
|---|---|---|
| **欧盟** | GDPR | IP 地址是个人数据；欧盟的代理出口节点必须合规 |
| **美国** | CFAA, 州法律 | 规避访问控制可能违反计算机欺诈法 |
| **中国** | 网络安全法 | VPN/代理使用受到严格监管；只允许经批准的服务 |
| **俄罗斯** | VPN 法 | VPN 提供商必须注册并记录用户活动 |
| **澳大利亚** | 隐私法 | 通过代理收集数据受隐私原则约束 |

**GDPR 特定考量：**

**作为个人数据的 IP 地址 (第 4 条)：**

通过代理抓取位于欧盟的网站时：

- 您的代理在欧盟的 IP 被视为个人数据
- 网站必须按照 GDPR 要求处理它
- 您必须有合法的数据收集依据
- 适用数据最小化原则

**处理的合法依据 (第 6 条)：**

1.  **同意** - 难以通过抓取获得
2.  **合同** - 如果您是客户，则是合法的
3.  **法律义务** - 罕见于抓取用例
4.  **重大利益** - 不适用于抓取
5.  **公共任务** - 不适用于抓取
6.  **合法利益** - 最适用于抓取 (需要进行平衡测试)

### 服务条款和访问限制

代理不能使您免于遵守网站的服务条款 (ToS)：

**常见的 ToS 违规行为：**

1.  **自动访问**：许多网站禁止机器人/抓取工具，无论 IP 如何
2.  **规避速率限制**：使用轮换代理绕过速率限制
3.  **地理限制**：绕过地理封锁可能违反内容许可协议
4.  **账户共享**：使用代理将多个用户伪装成一个

**法律先例示例：**

```python
# 著名案例 (简化，非法律建议)
cases = {
    'hiQ Labs v. LinkedIn (2022)': {
        'issue': '在访问被撤销后抓取公共数据',
        'outcome': '抓取公开可用的数据通常是允许的',
        'caveat': '但规避技术壁垒可能违反 CFAA'
    },
    
    'QVC v. Resultly (2020)': {
        'issue': '侵略性抓取导致服务器负载',
        'outcome': '过度请求构成对动产的侵犯',
        'implication': '重要的是数量和影响，而不仅仅是技术访问'
    }
}
```

### 代理使用的道德准则

除了法律合规性，还应考虑以下道德原则：

**1. 尊重 robots.txt**
```python
# 即使使用代理，也要遵守网站准则
async def ethical_scraping(url):
    # 无论代理匿名性如何，都要检查 robots.txt
    if not is_allowed_by_robots(url):
        return None  # 尊重网站的意愿
```

**2. 速率限制**
```python
# 不要滥用代理轮换来压垮服务器
MINIMUM_DELAY = 1.0  # 请求之间的最小延迟（秒）
MAX_CONCURRENT = 5   # 每个站点的最大并发连接数

# 错误：轮换代理以 1000 请求/秒的速度抓取
# 正确：即使使用代理轮换，也要进行友好的抓取
```

**3. 透明度**
```python
# 在适当的时候在 User-Agent 中标识自己
headers = {
    'User-Agent': 'MyBot/1.0 (contact@example.com)',  # 诚实的标识
    # 而不是: 'Mozilla/5.0...'  # 在不是浏览器时具有欺骗性
}
```

**4. 数据最小化**
```python
# 只收集您需要的数据
# 仅仅因为您可以抓取所有内容，并不意味着您应该这样做
data_to_collect = {
    'product_name': True,
    'price': True,
    'user_emails': False,      # PII - 除非必要，否则不要收集
    'user_addresses': False,   # PII - 隐私问题
}
```

### 合规性清单

在部署基于代理的自动化之前：

- [ ] **法律审查**：咨询您所在司法管辖区的法律顾问
- [ ] **ToS 合规性**：审查目标网站的服务条款
- [ ] **数据保护**：如果处理个人数据，确保符合 GDPR/CCPA
- [ ] **访问权限**：验证您有权访问数据
- [ ] **速率限制**：实施友好的请求速率
- [ ] **错误处理**：适当处理 429 (请求过多)
- [ ] **日志记录**：保留审计跟踪以用于合规性目的
- [ ] **数据保留**：实施适当的数据保留/删除策略
- [ ] **安全**：采取适当措施保护收集的数据
- [ ] **透明度**：在被问及时，诚实说明您的抓取活动

!!! warning "这不是法律建议"
    本节仅提供一般信息。代理使用的合法性因司法管辖区、上下文和具体情况而异。请务必就您的具体情况咨询合格的法律顾问。

!!! tip "负责任的代理使用"
    最站得住脚的代理用法是：
    
    - **透明**：您可以解释为什么这么做
    - **必要**：您有合法的理由 (研究、监控等)
    - **相称**：您的方法与您的需求相匹配 (不过度)
    - **有记录**：您保留了您的活动记录
    - **合规**：您遵守所有适用的法律和 ToS

### 何时避免使用代理

在某些情况下，使用代理是有问题的：

| 场景 | 风险 | 替代方案 |
|---|---|---|
| **银行/金融网站** | 欺诈检测, 账户暂停 | 仅使用合法访问 |
| **政府门户网站** | 法律处罚, 安全调查 | 从授权位置直接访问 |
| **医疗保健数据** | 违反 HIPAA, 严厉处罚 | 使用授权的 API 访问 |
| **内部企业系统** | 违反政策, 终止雇佣 | 遵守公司 IT 政策 |
| **电子商务账户创建** | 欺诈标记, 永久封禁 | 使用单一、已验证的身份 |

## 结论

深入了解代理架构使您能够：

**做出明智的决策：**
- 为您的用例选择正确的代理类型
- 了解安全隐患
- 确定代理何时是必需的、何时是可选的

**有效地进行故障排除：**
- 调试连接问题
- 识别 DNS 泄露或 IP 泄露
- 诊断性能问题

**优化性能：**
- 配置适当的超时
- 实现连接池
- 监控代理健康状况

**构建更好的自动化：**
- 将代理与反检测技术相结合
- 实现健壮的错误处理
- 高效地扩展代理使用

代理领域是复杂的，但有了这个基础，您就具备了成功驾驭它的能力。

## 进一步阅读

- **[RFC 1928](https://tools.ietf.org/html/rfc1928)**: SOCKS5 协议规范
- **[RFC 1929](https://tools.ietf.org/html/rfc1929)**: SOCKS5 用户名/密码身份验证
- **[RFC 2616](https://tools.ietf.org/html/rfc2616)**: HTTP/1.1 (CONNECT 方法)
- **[RFC 5389](https://tools.ietf.org/html/rfc5389)**: STUN 协议
- **[RFC 9298](https://tools.ietf.org/html/rfc9298)**: CONNECT-UDP (HTTP/3 代理)
- **[代理配置指南](../../features/configuration/proxy.md)**: 实用的 Pydoll 代理用法、身份验证、轮换和测试
- **[请求拦截](../../features/network/interception.md)**: Pydoll 内部如何实现代理身份验证
- **[网络能力深度探讨](./network-capabilities.md)**: Pydoll 如何处理网络操作

!!! tip "实验"
    真正理解代理的最好方法是：
    
    1. 建立您自己的代理服务器 (使用[构建代理](./build-proxy.md)中的代码)
    2. 使用 Wireshark 捕获流量以查看原始数据包
    3. 使用真实的自动化测试不同类型的代理
    4. 故意制造泄露并学会检测它们
    
    亲身实践能巩固理论知识！

================================================
FILE: docs/zh/deep-dive/network/socks-proxies.md
================================================
# SOCKS 协议架构

SOCKS（SOCKet Secure）是一种运行在网络栈传输层和应用层之间的代理协议（通常被描述为 OSI 模型的第 5 层）。与解析和理解 HTTP 流量的 HTTP 代理不同，SOCKS 代理在不检查内容的情况下转发原始 TCP 和 UDP 连接。这种协议无关的设计使 SOCKS 成为注重隐私的自动化的首选：代理无需解析您的请求、注入标头或终止 TLS 连接。

本文档涵盖了 SOCKS 在协议层面的工作原理、SOCKS4 与 SOCKS5 的区别、Chrome 中的身份验证处理、DNS 解析行为，以及在 Pydoll 中的实际配置。

!!! info "模块导航"
    - [HTTP/HTTPS 代理](./http-proxies.md)：应用层代理
    - [网络基础](./network-fundamentals.md)：TCP/IP、UDP、OSI 模型
    - [网络与安全概述](./index.md)：模块介绍
    - [代理检测](./proxy-detection.md)：匿名级别和检测规避
    - [构建代理](./build-proxy.md)：从零开始实现 SOCKS5

    有关实际配置，请参阅[代理配置](../../features/configuration/proxy.md)。

## SOCKS 与 HTTP 代理的区别

根本区别在于每种代理能看到和做到什么。HTTP 代理在应用层运行，理解 HTTP：它可以读取 URL、标头、Cookie 和请求体（针对未加密流量），在传输过程中修改它们，缓存响应，并注入自己的标头，如 `Via` 和 `X-Forwarded-For`。这对内容过滤很有用，但意味着您必须信任代理运营商处理您的应用数据。

SOCKS 代理在应用层之下运行。它只能看到目标地址、端口和正在传输的数据量。它不会解析、修改甚至理解通过它流动的是什么协议。HTTP、HTTPS、FTP、SSH、WebSocket 或任何自定义协议对于 SOCKS 代理来说都是一样的：只是在两个端点之间中继的字节流。

这有一个直接的实际影响。当您通过 SOCKS5 代理发送 HTTPS 请求时，代理看到的是 `example.com:443` 和加密的 TLS 流。它无法读取 URL、标头、Cookie 或响应内容。它不会添加识别性标头。它不需要终止 TLS。加密隧道在您的浏览器和目标服务器之间是端到端的。

然而，理解 SOCKS 不提供什么同样重要。SOCKS 是一种代理协议，而不是加密协议。"SOCKet Secure"这个名称指的是安全的防火墙穿越，而非密码学安全。如果您通过 SOCKS5 代理发送未加密的 HTTP 流量，即使代理并非设计用来检查流量，代理运营商也能读取通过的字节。要实现真正的加密，您需要在 SOCKS 之上使用 TLS/HTTPS，或者用加密隧道（SSH、VPN）包裹 SOCKS 连接。

!!! note "信任模型"
    使用 HTTP 代理时，您信任代理运营商不会记录您的浏览历史、窃取令牌、修改响应或执行 MITM 攻击。使用 SOCKS5 时，您只需信任代理能正确转发数据包且不记录连接元数据。攻击面更小，但并非为零。

## SOCKS4 与 SOCKS5

SOCKS 有两个常用版本。SOCKS4 由 NEC 在 20 世纪 90 年代初开发，是一个没有 RFC 的非正式标准。SOCKS5 于 1996 年被标准化为 RFC 1928，以解决 SOCKS4 的局限性。

| 特性 | SOCKS4 | SOCKS5 |
|---------|--------|--------|
| 标准 | 无官方 RFC（1992 年的事实标准） | RFC 1928（1996） |
| 身份验证 | 仅标识（USERID 字段，无密码） | 多种方法（无认证、用户名/密码、GSSAPI） |
| IP 版本 | 仅 IPv4 | IPv4 和 IPv6 |
| UDP 支持 | 否 | 是（UDP ASSOCIATE 命令） |
| DNS 解析 | 客户端（SOCKS4A 扩展添加了服务器端） | 使用域名时由服务器端解析（ATYP=0x03） |
| 协议支持 | 仅 TCP | TCP 和 UDP |

SOCKS5 在各方面都更优越。仅在代理不支持 SOCKS5 时才使用 SOCKS4。

## SOCKS5 握手

SOCKS5 连接过程遵循 RFC 1928，由三个阶段组成：方法协商、可选的身份验证和连接请求。

```mermaid
sequenceDiagram
    participant Client
    participant SOCKS5 as SOCKS5 Proxy
    participant Server as Target Server

    Note over Client,SOCKS5: Phase 1: Method Negotiation
    Client->>SOCKS5: Hello [VER=5, NMETHODS, METHODS]
    SOCKS5->>Client: Method Selected [VER=5, METHOD]

    Note over Client,SOCKS5: Phase 2: Authentication (if required)
    Client->>SOCKS5: Auth Request [VER=1, ULEN, UNAME, PLEN, PASSWD]
    SOCKS5->>Client: Auth Response [VER=1, STATUS]

    Note over Client,SOCKS5: Phase 3: Connection Request
    Client->>SOCKS5: Connect [VER=5, CMD=CONNECT, DST.ADDR, DST.PORT]
    SOCKS5->>Server: Establish TCP connection
    Server-->>SOCKS5: Connection established
    SOCKS5->>Client: Reply [VER=5, REP=SUCCESS, BND.ADDR, BND.PORT]

    Note over Client,Server: Data relay (proxied)
    Client->>SOCKS5: Application data
    SOCKS5->>Server: Forward data
    Server->>SOCKS5: Response data
    SOCKS5->>Client: Forward response
```

### 阶段 1：方法协商

客户端打开一个到代理的 TCP 连接，发送一个包含协议版本（SOCKS5 始终为 `0x05`）和支持的身份验证方法列表的问候消息。

```python
# Client Hello
[
    0x05,        # VER: Protocol version (5)
    0x02,        # NMETHODS: Number of methods offered
    0x00, 0x02   # METHODS: No auth (0x00) and Username/Password (0x02)
]
```

代理回复它选择的方法。如果代理需要身份验证且客户端提供了 `0x02`（用户名/密码），代理就选择它。如果没有提供可接受的方法，代理回复 `0xFF` 并关闭连接。

```python
# Server response
[
    0x05,   # VER: Protocol version (5)
    0x02    # METHOD: Username/Password selected
]
```

RFC 1928 定义的方法代码：`0x00` = 无身份验证，`0x01` = GSSAPI，`0x02` = 用户名/密码（RFC 1929），`0x03-0x7F` = IANA 分配，`0x80-0xFE` = 保留给私有方法，`0xFF` = 无可接受的方法。

### 阶段 2：身份验证

如果代理选择了方法 `0x02`，客户端按照 RFC 1929 发送凭据。子协商使用自己的版本号（`0x01`，而非 `0x05`）。

```python
# Client authentication
[
    0x01,              # VER: Subnegotiation version (1)
    len(username),     # ULEN: Username length (max 255)
    *username_bytes,   # UNAME: Username
    len(password),     # PLEN: Password length (max 255)
    *password_bytes    # PASSWD: Password
]

# Server response
[
    0x01,   # VER: Subnegotiation version (1)
    0x00    # STATUS: 0 = success, non-zero = failure
]
```

在此握手过程中，凭据以明文传输。这是 SOCKS5 协议（RFC 1929）固有的特性。对于敏感环境，请将 SOCKS 连接包裹在 SSH 隧道或 VPN 中。

### 阶段 3：连接请求

身份验证成功后（或者不需要身份验证时），客户端发送一个连接请求，指定命令、目标地址和端口。

```python
[
    0x05,          # VER: Protocol version (5)
    0x01,          # CMD: 1=CONNECT, 2=BIND, 3=UDP ASSOCIATE
    0x00,          # RSV: Reserved
    0x03,          # ATYP: 1=IPv4 (4 bytes), 3=Domain (length+name), 4=IPv6 (16 bytes)
    len(domain),   # Domain length (only for ATYP=0x03)
    *domain_bytes, # Domain name
    *port_bytes    # Port (2 bytes, big-endian)
]
```

地址类型（ATYP）决定了格式：`0x01` 表示后面跟 4 字节的 IPv4 地址，`0x04` 表示 16 字节的 IPv6 地址，`0x03` 表示一个长度字节后跟域名。当客户端发送域名（ATYP=0x03）时，代理在其侧解析 DNS，这可以防止 DNS 泄露到客户端的本地网络。

代理连接到目标并回复：

```python
[
    0x05,       # VER: Protocol version (5)
    0x00,       # REP: 0x00=success, 0x01-0x08=various errors
    0x00,       # RSV: Reserved
    0x01,       # ATYP: Address type of bound address
    *bind_addr, # BND.ADDR: Address the proxy bound to
    *bind_port  # BND.PORT: Port the proxy bound to
]
```

回复代码：`0x00` 成功，`0x01` 一般性故障，`0x02` 不允许连接，`0x03` 网络不可达，`0x04` 主机不可达，`0x05` 连接被拒绝，`0x06` TTL 过期，`0x07` 不支持的命令，`0x08` 不支持的地址类型。

成功回复后，代理开始双向中继数据。整个 SOCKS5 握手是二进制协议，比基于文本的 HTTP 更高效，但没有十六进制转储就更难调试。

## UDP 支持

SOCKS5 通过 `UDP ASSOCIATE` 命令（CMD=0x03）支持 UDP 代理。其工作方式与 TCP 代理不同：客户端通过 TCP 控制连接发送 UDP ASSOCIATE 请求，代理回复中继地址和端口。然后客户端将 UDP 数据报发送到该中继，代理将其转发到目标。

```mermaid
sequenceDiagram
    participant Client
    participant SOCKS5
    participant UDP_Server as UDP Server

    Note over Client,SOCKS5: TCP control connection (handshake + auth)
    Client->>SOCKS5: UDP ASSOCIATE request (CMD=0x03)
    SOCKS5->>Client: Relay address and port

    Note over Client,SOCKS5: UDP data transfer
    Client->>SOCKS5: UDP datagram to relay
    SOCKS5->>UDP_Server: Forward datagram
    UDP_Server->>SOCKS5: Response datagram
    SOCKS5->>Client: Forward response

    Note over Client,SOCKS5: TCP control connection stays open
```

通过中继发送的每个 UDP 数据报都包含一个带有目标地址和端口的小标头：

```python
[
    0x00, 0x00,    # RSV: Reserved
    0x00,          # FRAG: Fragment number (0 = no fragmentation)
    0x01,          # ATYP: Address type
    *dst_addr,     # DST.ADDR: Destination address
    *dst_port,     # DST.PORT: Destination port
    *data          # DATA: Application data
]
```

TCP 控制连接在 UDP 关联期间必须保持打开。如果它关闭，代理会丢弃 UDP 中继。

!!! warning "Chrome 中的 UDP"
    Chrome 不会为任何流量使用 SOCKS5 UDP ASSOCIATE。即使配置了 SOCKS5 代理，Chrome 也只代理 TCP 连接。WebRTC、DNS-over-UDP 和其他 UDP 流量不会通过 SOCKS5 代理路由。这意味着在 Chrome 中使用 SOCKS5 时仍可能存在 WebRTC IP 泄露。使用 `--force-webrtc-ip-handling-policy=disable_non_proxied_udp` 或 Pydoll 的 `webrtc_leak_protection = True` 来缓解此问题。更多详情请参阅 [网络基础：WebRTC 和 IP 泄露](./network-fundamentals.md#webrtc-and-ip-leakage)。

!!! tip "现代 UDP 代理替代方案"
    对于需要超出 Chrome SOCKS5 实现所提供的完整 UDP 支持的场景，可以考虑 Shadowsocks（带有原生 UDP 的加密类 SOCKS 协议）、WireGuard（性能出色的 VPN）或 V2Ray/VMess（具有全面 UDP 处理能力的灵活代理框架）。

## DNS 解析

一个常见的误解是 HTTP 代理会泄露 DNS 查询，而 SOCKS5 代理不会。Chrome 中的实际情况更加微妙。

当 Chrome 配置了任何代理（HTTP、HTTPS 或 SOCKS5）时，它会将主机名发送给代理，而不是在本地解析 DNS。对于 HTTP 代理，主机名出现在 `CONNECT host:443` 请求中。对于 SOCKS5，它出现在带有 ATYP=0x03（域名）的连接请求中。在这两种情况下，代理在其侧解析 DNS，Chrome 不会对代理流量进行本地 DNS 查询。

两种代理类型之间真正的 DNS 隐私差异不在于谁解析 DNS，而在于代理在应用层能看到什么。HTTP 代理能看到未加密请求的完整 URL 和 CONNECT 请求的主机名。SOCKS5 代理只能看到目标主机名和端口作为不透明的连接参数。

但是，有一个重要的注意事项：即使配置了代理，Chrome 的 DNS 预取器也可能会对页面内容中发现的主机名进行本地 DNS 查询。这可能会将您正在浏览的域名泄露给本地 DNS 解析器。要防止这种情况，请禁用 DNS 预取或使用标志 `--host-resolver-rules="MAP * ~NOTFOUND , EXCLUDE 127.0.0.1"`。

!!! note "`socks5://` 与 `socks5h://`"
    Chrome 之外的许多工具区分 `socks5://`（客户端解析 DNS）和 `socks5h://`（代理解析 DNS，"h"代表 hostname）。Chrome 对 SOCKS5 始终在代理侧解析 DNS，无论您使用哪种方案，行为都类似于 `socks5h://`。但如果您在 Pydoll 之外使用 `curl`、Firefox 或 Python 库等工具，这个区别就很重要：请始终使用 `socks5h://` 以防止 DNS 泄露。

## SOCKS5 与 MITM 抵抗

SOCKS5 经常被描述为"抗 MITM"。在特定意义上这是正确的：因为 SOCKS5 不理解或与 TLS 交互，它没有机制来终止 TLS 连接并重新加密。SOCKS5 代理只是原样中继加密的字节。

相比之下，HTTP 代理可以通过向客户端提供自己的证书来执行 TLS 终止（MITM），解密流量、检查或修改内容，然后重新加密发送给服务器。这需要客户端信任代理的 CA 证书，并且可以通过证书固定和证书透明度日志检测到。HTTP 代理处理 HTTPS 的正常行为（使用 CONNECT）是创建透明隧道而不终止 TLS，但 MITM 的架构可能性是存在的。

使用 SOCKS5 时，TLS 终止在协议层面是不可能的。代理无法将自己注入 TLS 握手，因为它不解析流经的应用数据。客户端和服务器之间的端到端加密在设计上得到了保护。

值得注意的是，提供实际密码学保护的是 TLS，而不是 SOCKS5 本身。如果您通过 SOCKS5 代理发送未加密的 HTTP，代理运营商可以读取所有内容。SOCKS5 的安全优势是架构性的（它不需要也不启用 TLS 终止），而非密码学意义上的。

## TLS 和通过 SOCKS5 的浏览器 fingerprinting

一个需要理解的重要局限：SOCKS5 不会改变浏览器的 fingerprint。TLS 握手（ClientHello）逐字节通过 SOCKS5 代理传递，这意味着目标服务器能看到浏览器的确切 JA3/JA4 fingerprint。HTTP/2 SETTINGS 帧、浏览器特有的标头排序以及所有其他应用层 fingerprinting 信号同样如此。

SOCKS5 隐藏了您的 IP 地址并防止代理注入识别性标头。但它对任何形式的浏览器或行为 fingerprinting 都没有帮助。要实现完整的规避策略，您需要在多个层面应对 fingerprinting。详情请参阅[规避技术](../fingerprinting/evasion-techniques.md)。

## Chrome 中的 SOCKS5 身份验证

Chrome 不支持 SOCKS5 用户名/密码身份验证。这是一个长期存在的限制，跟踪为 [Chromium Issue #40323993](https://issues.chromium.org/issues/40323993)。当 Chrome 执行 SOCKS5 方法协商时，它只提供方法 `0x00`（无身份验证）。如果代理需要身份验证，连接会静默失败。

这与 HTTP 代理身份验证有本质区别。HTTP 代理通过 HTTP 状态码（`407 Proxy Authentication Required`）进行身份验证，Chrome 通过 CDP 中的 Fetch 域来处理。Pydoll 拦截这些 `Fetch.authRequired` 事件并自动使用存储的凭据响应。而 SOCKS5 身份验证发生在会话层的二进制协议握手期间，在任何 HTTP 流量存在之前。没有 HTTP 407，没有 `Fetch.authRequired` 事件，基于 CDP 的工具也无法将凭据注入此过程。

配置 `--proxy-server=socks5://user:pass@proxy:1080` 不会生效。Chrome 会静默忽略嵌入的凭据。

### Pydoll 的 SOCKS5Forwarder

标准解决方案是本地代理转发器：一个运行在 localhost 上的轻量级 SOCKS5 服务器，接受来自 Chrome 的未认证连接，并将其转发到带有完整身份验证的远程代理。

```mermaid
sequenceDiagram
    participant Chrome
    participant Forwarder as Local Forwarder<br/>(127.0.0.1:1081)
    participant Remote as Remote SOCKS5 Proxy<br/>(proxy:1080)
    participant Server as Destination Server

    Note over Chrome,Forwarder: No authentication
    Chrome->>Forwarder: SOCKS5 Hello [methods: 0x00]
    Forwarder->>Chrome: Method selected [0x00]
    Chrome->>Forwarder: CONNECT example.com:443

    Note over Forwarder,Remote: With authentication
    Forwarder->>Remote: SOCKS5 Hello [methods: 0x02]
    Remote->>Forwarder: Method selected [0x02]
    Forwarder->>Remote: Auth [username, password]
    Remote->>Forwarder: Auth OK
    Forwarder->>Remote: CONNECT example.com:443
    Remote->>Server: TCP connection
    Remote->>Forwarder: Connect OK

    Forwarder->>Chrome: Connect OK

    Note over Chrome,Server: Bidirectional data relay
    Chrome->>Forwarder: TLS + application data
    Forwarder->>Remote: Forward
    Remote->>Server: Forward
    Server->>Remote: Response
    Remote->>Forwarder: Forward
    Forwarder->>Chrome: Forward
```

Pydoll 在 `pydoll.utils` 模块中提供了内置的 `SOCKS5Forwarder`。这是一个纯 Python、零依赖的异步实现，处理与远程代理的完整 SOCKS5 握手，包括用户名/密码身份验证（RFC 1929）、IPv4、IPv6 和域名地址类型。

```python
import asyncio
from pydoll.utils import SOCKS5Forwarder
from pydoll.browser.chromium import Chrome
from pydoll.browser.options import ChromiumOptions

async def main():
    forwarder = SOCKS5Forwarder(
        remote_host='proxy.example.com',
        remote_port=1080,
        username='myuser',
        password='mypass',
        local_port=1081,  # Use 0 for auto-assigned port
    )
    async with forwarder:
        options = ChromiumOptions()
        options.add_argument(f'--proxy-server=socks5://127.0.0.1:{forwarder.local_port}')

        async with Chrome(options=options) as browser:
            tab = await browser.start()
            await tab.go_to('https://httpbin.org/ip')

asyncio.run(main())
```

转发器也可以作为独立的 CLI 工具运行，用于测试或与其他应用配合使用：

```bash
python -m pydoll.utils.socks5_proxy_forwarder \
    --remote-host proxy.example.com \
    --remote-port 1080 \
    --username myuser \
    --password mypass \
    --local-port 1081
```

转发器默认绑定到 `127.0.0.1`，使其只能从本机访问。切勿在生产环境中绑定到 `0.0.0.0`，因为这会向网络暴露一个未认证的 SOCKS5 代理。凭据永远不会以明文记录到日志中。由于所有通信都通过本地回环接口进行，转发器增加的延迟不到一毫秒。

!!! tip "受限环境"
    某些环境（Docker 容器、无服务器平台、加固的虚拟机）可能会限制绑定到本地端口。使用 `local_port=0` 让操作系统分配一个可用端口。如果本地绑定完全被阻止，请考虑使用 HTTP CONNECT 代理，Chrome 通过 Pydoll 的 ProxyManager 原生支持其身份验证。

## 实际配置

**基本 SOCKS5（无身份验证）：**

```python
from pydoll.browser.chromium import Chrome
from pydoll.browser.options import ChromiumOptions

options = ChromiumOptions()
options.add_argument('--proxy-server=socks5://proxy.example.com:1080')

async with Chrome(options=options) as browser:
    tab = await browser.start()
    await tab.go_to('https://example.com')
```

**带身份验证的 SOCKS5（通过 SOCKS5Forwarder）：**

请参阅上面的 [SOCKS5Forwarder 章节](#pydolls-socks5forwarder)。

**防止泄露：**

要建立完整的 SOCKS5 配置，您还应该防止 WebRTC 和 DNS 预取泄露：

```python
options = ChromiumOptions()
options.add_argument('--proxy-server=socks5://proxy.example.com:1080')
options.webrtc_leak_protection = True  # Prevents WebRTC IP leaks
options.add_argument('--disable-quic')  # Forces HTTP/2 over TCP through proxy
```

**测试您的配置：**

始终通过泄露测试验证您的代理配置。访问 [browserleaks.com/ip](https://browserleaks.com/ip) 确认您的 IP，访问 [browserleaks.com/webrtc](https://browserleaks.com/webrtc) 检查 WebRTC 泄露，访问 [dnsleaktest.com](https://dnsleaktest.com/) 验证 DNS 是否泄露。

## 总结

SOCKS5 提供协议无关的代理，与 HTTP 代理相比具有更小的信任面。它不会解析、修改或向您的流量注入任何内容。在 Chrome 中，DNS 解析在代理侧进行。TLS 加密端到端保持不变。Chrome 中的主要限制是缺乏原生 SOCKS5 身份验证（通过 Pydoll 的 `SOCKS5Forwarder` 解决）以及不支持 UDP 代理（通过禁用 WebRTC 或使用适当的浏览器标志来缓解）。

SOCKS5 不会改变浏览器的 TLS fingerprint、HTTP/2 设置或任何应用层特征。要实现完整的规避，请将 SOCKS5 与浏览器 fingerprint 管理和行为模拟相结合。

**后续步骤：**

- [代理检测](./proxy-detection.md)：即使 SOCKS5 代理也可能被检测到
- [构建代理](./build-proxy.md)：实现您自己的 SOCKS5 服务器
- [代理配置](../../features/configuration/proxy.md)：Pydoll 代理的实际设置
- [规避技术](../fingerprinting/evasion-techniques.md)：多层规避策略

## 参考资料

- RFC 1928: SOCKS Protocol Version 5 (1996) - https://datatracker.ietf.org/doc/html/rfc1928
- RFC 1929: Username/Password Authentication for SOCKS V5 (1996) - https://datatracker.ietf.org/doc/html/rfc1929
- RFC 1961: GSS-API Authentication Method for SOCKS V5 (1996) - https://datatracker.ietf.org/doc/html/rfc1961
- RFC 3089: SOCKS-based IPv6/IPv4 Gateway Mechanism (2001) - https://datatracker.ietf.org/doc/html/rfc3089
- Chromium Proxy Documentation - https://chromium.googlesource.com/chromium/src/+/689912289c/net/docs/proxy.md
- Chromium Issue #40323993: SOCKS5 Authentication - https://issues.chromium.org/issues/40323993
- BrowserLeaks: WebRTC Leak Test - https://browserleaks.com/webrtc
- DNS Leak Test - https://dnsleaktest.com/
- IPLeak: Comprehensive Leak Testing - https://ipleak.net


================================================
FILE: docs/zh/features/advanced/behavioral-captcha-bypass.md
================================================
# Cloudflare Turnstile 交互

Pydoll 通过执行真实的浏览器点击，为与 Cloudflare Turnstile 验证码交互提供原生支持。这**不是绕过或规避**。它只是自动化人类在验证码复选框上执行的相同点击操作。

!!! warning "此功能实际做什么"
    此功能使用标准浏览器交互**点击** Cloudflare Turnstile 验证码复选框。就这样。没有：
    
    - **没有**：魔法绕过或规避
    - **没有**：挑战解决（图像选择、拼图等）
    - **没有**：分数操纵或指纹欺骗
    - **有**：只是对验证码容器的真实点击
    
    **成功完全取决于您的环境**（IP 声誉、浏览器指纹、行为模式）。Pydoll 提供点击机制；您的环境决定点击是否被接受。

!!! info "什么是 Cloudflare Turnstile？"
    Cloudflare Turnstile 是一个现代验证码系统，它分析浏览器环境和行为信号来判断您是否是人类。它通常显示为用户必须点击的复选框。系统分析：
    
    - **IP 声誉**：您的 IP 地址是否被标记或可疑？
    - **浏览器指纹**：您的浏览器看起来合法吗？
    - **行为模式**：您的行为像人类吗？
    
    当信任分数足够高时，复选框点击被接受。当分数太低时，Turnstile 可能会显示挑战（Pydoll **无法解决**）或完全阻止您。对于图像或拼图挑战，可以考虑使用 **[CapSolver](https://dashboard.capsolver.com/passport/register?inviteCode=WPhTbOsbXEpc)**。

## 快速开始

### 上下文管理器（推荐）

上下文管理器等待验证码出现，点击它，并在继续之前等待解决：

```python
import asyncio
from pydoll.browser.chromium import Chrome
from pydoll.browser.options import ChromiumOptions

async def turnstile_example():
    options = ChromiumOptions()
    options.add_argument('--disable-blink-features=AutomationControlled')
    
    async with Chrome(options=options) as browser:
        tab = await browser.start()
        
        # 上下文管理器自动处理验证码
        async with tab.expect_and_bypass_cloudflare_captcha():
            await tab.go_to('https://site-with-turnstile.com')
        
        # 此代码仅在验证码被点击后运行
        print("Turnstile 验证码交互完成！")
        
        # 继续您的自动化
        content = await tab.find(id='protected-content')
        print(await content.text)

asyncio.run(turnstile_example())
```

### 后台处理

在后台启用自动验证码点击：

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def background_turnstile():
    async with Chrome() as browser:
        tab = await browser.start()
        
        # 在导航前启用自动点击
        await tab.enable_auto_solve_cloudflare_captcha()
        
        # 导航到受保护的站点
        await tab.go_to('https://site-with-turnstile.com')
        
        # 等待验证码在后台处理
        await asyncio.sleep(5)
        
        print("页面加载完成，后台处理验证码")
        
        # 不再需要时禁用
        await tab.disable_auto_solve_cloudflare_captcha()

asyncio.run(background_turnstile())
```

## 自定义验证码交互

### 工作原理

Pydoll 通过遍历页面的 shadow DOM 自动检测 Cloudflare Turnstile。它查找包含 `challenges.cloudflare.com` 的 shadow root，导航到其跨域 iframe，找到内部 shadow root，并点击实际的复选框元素。无需手动配置选择器。

### 时间配置

验证码的 shadow root 并不总是立即出现。调整超时以匹配站点的行为：

```python
async def timing_configuration_example():
    async with Chrome() as browser:
        tab = await browser.start()

        async with tab.expect_and_bypass_cloudflare_captcha(
            time_to_wait_captcha=10   # 等待最多 10 秒让验证码出现（默认：5）
        ):
            await tab.go_to('https://site-with-slow-turnstile.com')

        print("使用自定义时间完成验证码交互！")

asyncio.run(timing_configuration_example())
```

**参数参考：**

| 参数 | 类型 | 默认值 | 描述 |
|-----------|------|---------|-------------|
| `time_to_wait_captcha` | `float` | `5` | 等待验证码出现的最大秒数 |

!!! info "为什么时间很重要"
    某些站点异步加载验证码。如果 Cloudflare 的 shadow root 在 `time_to_wait_captcha` 时间内没有出现，交互将被跳过。

## 其他验证码系统

### reCAPTCHA v3（隐形）

reCAPTCHA v3 是**完全隐形的**，**不需要交互**。只需正常导航：

```python
async def recaptcha_v3_example():
    options = ChromiumOptions()
    options.add_argument('--disable-blink-features=AutomationControlled')
    
    async with Chrome(options=options) as browser:
        tab = await browser.start()
        
        # 不需要特殊处理 - 只需导航
        await tab.go_to('https://site-with-recaptcha-v3.com')
        
        # reCAPTCHA v3 在后台运行，分析您的行为
        await asyncio.sleep(3)
        
        # 继续提交表单
        submit_button = await tab.find(id='submit-btn')
        await submit_button.click()

asyncio.run(recaptcha_v3_example())
```

!!! note "reCAPTCHA v3 成功因素"
    由于 reCAPTCHA v3 完全是被动的（无需交互），成功取决于：
    
    - **IP 声誉**：使用声誉良好的住宅代理
    - **浏览器指纹**：配置真实的浏览器首选项
    - **行为模式**：在页面上花费时间，自然滚动，真实打字
    
    如果您的分数太低，某些站点可能会显示 reCAPTCHA v2 挑战（Pydoll **无法解决**）。

## 什么决定成功？

验证码交互的成功**完全取决于您的环境**，而不是 Pydoll。验证码系统分析：

### 1. IP 声誉（最关键）

| IP 类型 | 信任级别 | 预期行为 |
|---------|-------------|-------------------|
| **住宅 IP（干净）** | 高 | 通常无需挑战即被接受 |
| **移动 IP** | 高 | 通常无需挑战即被接受 |
| **数据中心 IP** | 低 | 经常被阻止或挑战 |
| **先前被阻止的 IP** | 非常低 | 几乎总是被阻止或挑战 |

!!! danger "IP 声誉就是一切"
    **没有工具可以克服糟糕的 IP 地址。** 如果您的 IP 被标记，无论您的浏览器看起来多么真实，您都会被阻止或挑战。
    
    使用声誉良好的住宅代理以获得最佳结果。

### 2. 浏览器指纹

配置您的浏览器使其看起来合法：

```python
import asyncio
import time
from pydoll.browser.chromium import Chrome
from pydoll.browser.options import ChromiumOptions

async def stealth_configuration():
    options = ChromiumOptions()
    
    # 隐蔽参数
    options.add_argument('--disable-blink-features=AutomationControlled')
    options.add_argument('--window-size=1920,1080')
    
    # 真实的浏览器首选项
    current_time = int(time.time())
    options.browser_preferences = {
        'profile': {
            'last_engagement_time': str(current_time - (3 * 60 * 60)),  # 3 小时前
            'exited_cleanly': True,
            'exit_type': 'Normal',
        },
        'safebrowsing': {'enabled': True},
    }
    
    async with Chrome(options=options) as browser:
        tab = await browser.start()
        
        async with tab.expect_and_bypass_cloudflare_captcha():
            await tab.go_to('https://site-with-turnstile.com')

asyncio.run(stealth_configuration())
```

### 3. 行为模式

验证码系统分析您如何与页面交互：

```python
async def realistic_behavior():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://site-with-turnstile.com')
        
        # 在验证码出现之前模拟人类行为
        await asyncio.sleep(2)  # 阅读页面内容
        await tab.execute_script('window.scrollBy(0, 300)')  # 滚动
        await asyncio.sleep(1)
        
        # 现在与验证码交互
        async with tab.expect_and_bypass_cloudflare_captcha():
            # 验证码交互在这里发生
            pass
        
        print("使用真实行为通过验证码！")

asyncio.run(realistic_behavior())
```

!!! tip "行为指纹识别"
    要深入了解行为模式如何影响验证码成功，请参阅**[行为指纹识别](../../deep-dive/fingerprinting/behavioral-fingerprinting.md)**。本指南解释：
    
    - 鼠标移动模式和检测
    - 击键时间分析
    - 滚动行为物理学
    - 事件序列分析
    
    理解这些概念可以帮助您构建更真实的自动化，实现更高的成功率。

## 故障排除

### 验证码未被点击

**症状**：验证码出现但从未被点击，页面停留在挑战上。

**可能的原因：**

1. **时间太短**：Pydoll 尝试点击时验证码尚未加载
2. **Shadow root 未找到**：Cloudflare Turnstile 的 shadow root 尚未出现在 DOM 中

**解决方案：**

```python
async def troubleshooting_example():
    async with Chrome() as browser:
        tab = await browser.start()

        # 增加等待时间
        async with tab.expect_and_bypass_cloudflare_captcha(
            time_to_wait_captcha=15  # 更多时间等待验证码出现（默认：5）
        ):
            await tab.go_to('https://problematic-site.com')

asyncio.run(troubleshooting_example())
```

### 验证码被点击但显示挑战

**症状**：复选框短暂显示勾号，然后呈现图像/拼图挑战。

**根本原因**：您的环境的信任分数太低。

**解决方案：**

- 使用声誉良好的住宅代理
- 配置真实的浏览器指纹
- 添加更真实的行为模式（滚动、鼠标移动、延迟）
- **注意**：Pydoll 无法自行解决挑战 — 如果您需要自动验证码解决，请考虑集成 **[CapSolver](https://dashboard.capsolver.com/passport/register?inviteCode=WPhTbOsbXEpc)**

### "访问被拒绝"或立即阻止

**症状**：站点立即显示"访问被拒绝"或阻止您而不显示验证码。

**根本原因**：**您的 IP 地址被标记。**

**解决方案：**

- 使用声誉良好的不同住宅代理
- 在请求之间轮换 IP
- 在 `https://www.cloudflare.com/cdn-cgi/trace` 测试您的 IP
- **注意**：再多的浏览器配置都无法修复被标记的 IP

### 在本地工作但在 Docker/CI 中失败

**症状**：验证码交互在您的机器上工作，但在 Docker/CI 环境中失败。

**根本原因**：验证码系统严格审查数据中心 IP。

**解决方案：**

1. **使用带有适当显示的无头模式**（用于完全渲染）：
   ```dockerfile
   FROM python:3.11-slim
   
   RUN apt-get update && apt-get install -y \
       chromium \
       chromium-driver \
       xvfb \
       && rm -rf /var/lib/apt/lists/*
   
   ENV DISPLAY=:99
   
   CMD Xvfb :99 -screen 0 1920x1080x24 & python your_script.py
   ```

2. **即使在 CI/CD 中也使用住宅代理**：
   ```python
   options = ChromiumOptions()
   options.add_argument('--proxy-server=http://user:pass@residential-proxy.com:8080')
   ```

## 最佳实践

1. **使用住宅代理**：IP 声誉是最关键的因素
2. **配置隐蔽选项**：移除自动化指示器
3. **添加行为模式**：点击前滚动、等待、移动鼠标
4. **调整时间**：在尝试点击之前给验证码加载时间
5. **优雅地处理失败**：当无法通过验证码时有备用逻辑
6. **测试您的环境**：在自动化前验证 IP 声誉和浏览器指纹

## 道德准则

!!! danger "服务条款和法律合规"
    即使技术上可行，与验证码交互也可能违反网站的服务条款。在自动化任何网站之前**始终检查并尊重服务条款**。
    
    此功能仅用于**合法的自动化目的**：
    
    **适当的用例：**
    - 对您自己的应用程序进行自动化测试
    - 监控您有权监控的服务
    - 具有适当授权的研究和安全分析
    
    **不适当的用例：**
    - 抓取您无权访问的内容
    - 规避付费墙或订阅系统
    - 拒绝服务攻击或激进抓取
    - 任何违反服务条款的活动

## 另请参阅

- **[浏览器选项](../configuration/browser-options.md)** - 隐蔽配置
- **[浏览器首选项](../configuration/browser-preferences.md)** - 高级指纹识别
- **[代理配置](../configuration/proxy.md)** - 设置代理
- **[行为指纹识别](../../deep-dive/fingerprinting/behavioral-fingerprinting.md)** - 理解行为检测
- **[类人交互](../automation/human-interactions.md)** - 真实的行为模式

---

**记住**：Pydoll 提供点击验证码的机制，但您的环境（IP、指纹、行为）决定成功。这不是魔法解决方案，它是在正确的环境和适当配置下使用的工具。对于需要图像识别或拼图解决的挑战，可以考虑使用 **[CapSolver](https://dashboard.capsolver.com/passport/register?inviteCode=WPhTbOsbXEpc)** — 使用代码 **PYDOLL** 获得额外 6% 余额奖励。

================================================
FILE: docs/zh/features/advanced/decorators.md
================================================
# Retry 装饰器

网页爬虫本质上是不可预测的。网络故障、页面加载缓慢、元素出现和消失、触发速率限制以及意外出现的验证码。`@retry` 装饰器提供了一个经过实战测试的强大解决方案，能够优雅地处理这些不可避免的故障。

## 为什么使用 Retry 装饰器？

在生产环境的爬虫中，故障不是例外——而是常态。与其让整个爬虫任务因为临时的网络故障或缺失的元素而崩溃，retry 装饰器允许您：

- **自动恢复** 临时性故障
- **实施复杂的重试策略** 使用指数退避
- **在重试前执行恢复逻辑** （刷新页面、切换代理、重启浏览器）
- **保持业务逻辑清晰** 不会被错误处理代码污染

## 快速开始

```python
import asyncio
from pydoll.browser.chromium import Chrome
from pydoll.decorators import retry
from pydoll.exceptions import WaitElementTimeout, NetworkError

@retry(max_retries=3, exceptions=[WaitElementTimeout, NetworkError])
async def scrape_product_page(url: str):
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to(url)
        
        # 这可能因网络问题或加载缓慢而失败
        product_title = await tab.find(class_name='product-title', timeout=5)
        return await product_title.text

asyncio.run(scrape_product_page('https://example.com/product/123'))
```

如果 `scrape_product_page` 因 `WaitElementTimeout` 或 `NetworkError` 失败，它将自动重试最多 3 次才会放弃。

## 最佳实践：始终指定异常

!!! warning "关键最佳实践"
    **始终** 指定应该触发重试的异常。使用默认的 `exceptions=Exception` 会捕获 **所有** 异常，包括应该立即失败的代码错误。

**错误做法（捕获所有异常，包括代码缺陷）：**

```python
@retry(max_retries=3)  # 不要这样做
async def scrape_data():
    data = response['items'][0]  # 如果 'items' 不存在，重试无济于事！
    return data
```

**正确（仅对预期的失败重试）：**

```python
from pydoll.exceptions import ElementNotFound, WaitElementTimeout, NetworkError

@retry(
    max_retries=3,
    exceptions=[ElementNotFound, WaitElementTimeout, NetworkError]
)
async def scrape_data():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com')
        return await tab.find(id='data-container', timeout=10)
```

通过指定异常，您可以确保：

- **逻辑错误快速失败** （拼写错误、错误的选择器、代码错误）
- **仅重试可恢复的错误** （网络问题、超时、缺失元素）
- **调试更容易** （您确切知道出了什么问题）

## 参数

### max_retries

放弃前的最大重试次数。

```python
from pydoll.exceptions import WaitElementTimeout

@retry(max_retries=5, exceptions=[WaitElementTimeout])
async def fetch_data():
    # 总共将尝试 5 次
    pass
```

### exceptions

应该触发重试的异常类型。可以是单个异常或列表。

```python
from pydoll.exceptions import (
    ElementNotFound,
    WaitElementTimeout,
    NetworkError,
    ElementNotInteractable
)

# 单个异常
@retry(exceptions=[WaitElementTimeout])
async def example1():
    pass

# 多个异常
@retry(exceptions=[WaitElementTimeout, NetworkError, ElementNotFound, ElementNotInteractable])
async def example2():
    pass
```

!!! tip "常见爬虫异常"
    对于使用 Pydoll 进行网页爬虫，您通常会希望重试：

    - `WaitElementTimeout` - 等待元素出现超时
    - `ElementNotFound` - DOM 中不存在元素
    - `ElementNotVisible` - 元素存在但不可见
    - `ElementNotInteractable` - 元素无法接收交互
    - `NetworkError` - 网络连接问题
    - `ConnectionFailed` - 连接浏览器失败
    - `PageLoadTimeout` - 页面加载超时
    - `ClickIntercepted` - 点击被另一个元素拦截

### delay

重试尝试之间的等待时间（以秒为单位）。

```python
from pydoll.exceptions import WaitElementTimeout

@retry(max_retries=3, exceptions=[WaitElementTimeout], delay=2.0)
async def scrape_with_delay():
    # 每次重试之间等待 2 秒
    pass
```

### exponential_backoff

当设置为 `True` 时，随着每次重试尝试，延迟会指数级增加。

```python
from pydoll.exceptions import NetworkError

@retry(
    max_retries=5,
    exceptions=[NetworkError],
    delay=1.0,
    exponential_backoff=True
)
async def scrape_with_backoff():
    # 尝试 1: 失败 → 等待 1 秒
    # 尝试 2: 失败 → 等待 2 秒
    # 尝试 3: 失败 → 等待 4 秒
    # 尝试 4: 失败 → 等待 8 秒
    # 尝试 5: 失败 → 抛出异常
    pass
```

**什么是指数退避？**

指数退避是一种重试策略，尝试之间的等待时间呈指数级增长。与其每秒对服务器发起请求，不如逐渐给服务器更多恢复时间：

- **尝试 1**：等待 `delay` 秒（例如 1 秒）
- **尝试 2**：等待 `delay * 2` 秒（例如 2 秒）
- **尝试 3**：等待 `delay * 4` 秒（例如 4 秒）
- **尝试 4**：等待 `delay * 8` 秒（例如 8 秒）

这在以下情况下特别有用：

- 处理 **速率限制** （给服务器时间重置）
- 处理 **临时服务器过载** （不要让情况变得更糟）
- 等待 **加载缓慢的动态内容**
- 避免 **被检测为机器人** （看起来自然的重试模式）

### on_retry

在每次失败尝试后、下次重试前执行的回调函数。必须是 **async 函数**。

```python
from pydoll.exceptions import WaitElementTimeout

@retry(
    max_retries=3,
    exceptions=[WaitElementTimeout],
    on_retry=my_recovery_function
)
async def scrape_data():
    pass
```

回调可以是：

- **独立的 async 函数**
- **类方法** （自动接收 `self`）

## on_retry 回调：您的恢复机制

`on_retry` 回调是真正神奇的地方。这是您在下次重试尝试之前 **恢复应用程序状态** 的机会。

### 独立函数

```python
import asyncio
from pydoll.decorators import retry
from pydoll.exceptions import WaitElementTimeout

async def log_retry():
    print("重试尝试失败，下次尝试前等待...")
    await asyncio.sleep(1)

@retry(max_retries=3, exceptions=[WaitElementTimeout], on_retry=log_retry)
async def scrape_page():
    # 您的爬虫逻辑
    pass
```

### 类方法

在类内部使用装饰器时，回调可以是该类的普通实例方法（不是 `@classmethod`）。它将自动接收 `self` 作为第一个参数。

```python
import asyncio
from pydoll.decorators import retry
from pydoll.exceptions import WaitElementTimeout

class DataCollector:
    def __init__(self):
        self.retry_count = 0
    
    # 重要：在装饰方法之前定义回调
    async def log_retry(self):
        self.retry_count += 1
        print(f"尝试 {self.retry_count} 失败，正在重试...")
        await asyncio.sleep(1)
    
    @retry(
        max_retries=3,
        exceptions=[WaitElementTimeout],
        on_retry=log_retry  # 不需要 'self.' 前缀
    )
    async def fetch_data(self):
        # 您的爬取逻辑
        pass
```

!!! warning "方法定义顺序很重要"
    使用类方法的 `on_retry` 时，**必须在类定义中的装饰方法之前定义回调方法**。Python 在应用装饰器时需要知道回调。

    **错误（会失败）：**

    ```python
    class Scraper:
        @retry(on_retry=handle_retry)  # handle_retry 还不存在！
        async def scrape(self):
            pass
        
        async def handle_retry(self):  # 定义太晚
            pass
    ```

    **正确：**

    ```python
    class Scraper:
        async def handle_retry(self):  # 首先定义
            pass
        
        @retry(on_retry=handle_retry)  # 现在存在
        async def scrape(self):
            pass
    ```

## 实际应用案例

### 1. 页面刷新和状态恢复

**这是 `on_retry` 最强大的用法**：通过刷新页面并恢复应用程序状态来从故障中恢复。此示例演示了为什么 retry 装饰器对生产爬虫如此有价值。

```python
from pydoll.browser.chromium import Chrome
from pydoll.decorators import retry
from pydoll.exceptions import ElementNotFound, WaitElementTimeout
from pydoll.constants import Key
import asyncio

class DataScraper:
    def __init__(self):
        self.browser = None
        self.tab = None
        self.current_page = 1
    
    async def recover_from_failure(self):
        """刷新页面并在重试前恢复状态"""
        print(f"恢复中... 刷新第 {self.current_page} 页")
        
        if self.tab:
            # 刷新页面以从陈旧元素或错误状态中恢复
            await self.tab.refresh()
            await asyncio.sleep(2)  # 等待页面加载
            
            # 恢复状态：导航回正确页面
            if self.current_page > 1:
                page_input = await self.tab.find(id='page-number')
                await page_input.insert_text(str(self.current_page))
                await self.tab.keyboard.press(Key.ENTER)
                await asyncio.sleep(1)
    
    @retry(
        max_retries=3,
        exceptions=[ElementNotFound, WaitElementTimeout],
        on_retry=recover_from_failure,
        delay=1.0
    )
    async def scrape_page_data(self):
        """从当前页面抓取数据"""
        if not self.browser:
            self.browser = Chrome()
            self.tab = await self.browser.start()
            await self.tab.go_to('https://example.com/data')
        
        # 导航到特定页面
        page_input = await self.tab.find(id='page-number')
        await page_input.insert_text(str(self.current_page))
        await self.tab.keyboard.press(Key.ENTER)
        await asyncio.sleep(1)
        
        # 抓取数据（如果元素变陈旧可能会失败）
        items = await self.tab.find(class_name='data-item', find_all=True)
        return [await item.text for item in items]
    
    async def scrape_multiple_pages(self, start_page: int, end_page: int):
        """抓取多个页面，失败时自动重试"""
        results = []
        for page_num in range(start_page, end_page + 1):
            self.current_page = page_num
            data = await self.scrape_page_data()
            results.extend(data)
        return results

# 用法
async def main():
    scraper = DataScraper()
    try:
        # 抓取第 1-10 页，失败时自动恢复
        all_data = await scraper.scrape_multiple_pages(1, 10)
        print(f"已抓取 {len(all_data)} 个项目")
    finally:
        if scraper.browser:
            await scraper.browser.stop()
```

**这为什么强大：**

- `recover_from_failure()` 真正**恢复状态**：刷新并导航回来
- `scrape_page_data()` 方法保持简洁，只专注于爬取逻辑
- 如果元素变陈旧或消失，重试机制会自动处理恢复
- 浏览器通过 `self.browser` 和 `self.tab` 在重试之间保持

### 2. 模态对话框恢复

有时模态框或遮罩层会意外出现并阻止自动化。关闭它并重试。

```python
import asyncio
from pydoll.browser.chromium import Chrome
from pydoll.decorators import retry
from pydoll.exceptions import ElementNotFound

class ModalAwareScraper:
    def __init__(self):
        self.tab = None
    
    async def close_modals(self):
        """在重试前关闭任何阻挡的模态框"""
        print("检查阻挡的模态框...")
        
        # 尝试查找并关闭常见模态框
        modal_close = await self.tab.find(
            class_name='modal-close',
            timeout=2,
            raise_exc=False
        )
        if modal_close:
            print("找到模态框，关闭中...")
            await modal_close.click()
            await asyncio.sleep(0.5)
    
    @retry(
        max_retries=3,
        exceptions=[ElementNotFound],
        on_retry=close_modals,
        delay=0.5
    )
    async def click_button(self, button_id: str):
        button = await self.tab.find(id=button_id)
        await button.click()
```

### 3. 浏览器重启和代理轮换

对于大型爬虫任务，失败后可能需要完全重启浏览器并切换代理。

```python
import asyncio
from pydoll.browser.chromium import Chrome
from pydoll.browser.options import ChromiumOptions
from pydoll.decorators import retry
from pydoll.exceptions import NetworkError, PageLoadTimeout

class RobustScraper:
    def __init__(self):
        self.browser = None
        self.tab = None
        self.proxy_list = [
            'proxy1.example.com:8080',
            'proxy2.example.com:8080',
            'proxy3.example.com:8080',
        ]
        self.current_proxy_index = 0
    
    async def restart_with_new_proxy(self):
        """使用不同代理重启浏览器"""
        print("使用新代理重启浏览器...")
        
        # 关闭当前浏览器
        if self.browser:
            await self.browser.stop()
            await asyncio.sleep(2)
        
        # 轮换到下一个代理
        self.current_proxy_index = (self.current_proxy_index + 1) % len(self.proxy_list)
        proxy = self.proxy_list[self.current_proxy_index]
        
        print(f"使用代理: {proxy}")
        
        # 使用新代理启动新浏览器
        options = ChromiumOptions()
        options.add_argument(f'--proxy-server={proxy}')
        
        self.browser = Chrome(options=options)
        self.tab = await self.browser.start()
    
    @retry(
        max_retries=3,
        exceptions=[NetworkError, PageLoadTimeout],
        on_retry=restart_with_new_proxy,
        delay=5.0,
        exponential_backoff=True
    )
    async def scrape_protected_site(self, url: str):
        if not self.browser:
            await self.restart_with_new_proxy()
        
        await self.tab.go_to(url)
        await asyncio.sleep(3)
        
        # 您的爬虫逻辑
        content = await self.tab.find(id='content')
        return await content.text
```

### 4. 网络空闲检测与重试

等待所有网络活动完成，如果页面从未稳定则使用重试逻辑。

```python
import asyncio
from pydoll.browser.chromium import Chrome
from pydoll.decorators import retry
from pydoll.exceptions import TimeoutException

class NetworkAwareScraper:
    def __init__(self):
        self.tab = None
    
    async def reload_page(self):
        """如果网络从未稳定则重新加载页面"""
        print("页面未稳定，重新加载...")
        if self.tab:
            await self.tab.refresh()
            await asyncio.sleep(2)
    
    @retry(
        max_retries=2,
        exceptions=[TimeoutException],
        on_retry=reload_page,
        delay=3.0
    )
    async def wait_for_page_ready(self):
        """等待所有网络请求完成"""
        await self.tab.enable_network_events()
        
        # 等待网络空闲（2 秒内无请求）
        idle_time = 0
        max_wait = 10
        
        while idle_time < max_wait:
            # 检查是否有正在进行的请求
            # （实现取决于您的事件跟踪）
            await asyncio.sleep(0.5)
            idle_time += 0.5
        
        if idle_time >= max_wait:
            raise TimeoutException("网络从未稳定")
```

### 5. 验证码检测和恢复

检测验证码何时出现并采取适当行动。

```python
import asyncio
from pydoll.browser.chromium import Chrome
from pydoll.decorators import retry
from pydoll.exceptions import ElementNotFound

class CaptchaScraper:
    def __init__(self):
        self.tab = None
        self.captcha_count = 0
    
    async def handle_captcha(self):
        """通过等待或切换策略处理验证码"""
        self.captcha_count += 1
        print(f"检测到验证码（计数：{self.captcha_count}）")
        
        if self.captcha_count > 2:
            print("验证码过多，可能需要更改策略...")
            # 可以在这里切换到不同的方法
        
        # 尝试之间等待更长时间
        await asyncio.sleep(30)
        
        # 刷新页面
        await self.tab.refresh()
        await asyncio.sleep(5)
    
    @retry(
        max_retries=3,
        exceptions=[ElementNotFound],
        on_retry=handle_captcha,
        delay=10.0,
        exponential_backoff=True
    )
    async def scrape_protected_content(self, url: str):
        if not self.tab:
            browser = Chrome()
            self.tab = await browser.start()
        
        await self.tab.go_to(url)
        
        # 检查验证码
        captcha = await self.tab.find(
            class_name='g-recaptcha',
            timeout=2,
            raise_exc=False
        )
        
        if captcha:
            raise ElementNotFound("检测到验证码")
        
        # 正常爬虫逻辑
        content = await self.tab.find(class_name='article-content')
        return await content.text
```

## 高级模式

### 组合多种恢复策略

```python
import asyncio
from pydoll.browser.chromium import Chrome
from pydoll.decorators import retry
from pydoll.exceptions import ElementNotFound, WaitElementTimeout, NetworkError

class AdvancedScraper:
    def __init__(self):
        self.tab = None
        self.attempt = 0
        self.strategies = [
            self.strategy_refresh,
            self.strategy_clear_cache,
            self.strategy_restart_browser,
        ]
    
    async def strategy_refresh(self):
        """策略 1：简单刷新"""
        print("策略 1：刷新页面")
        await self.tab.refresh()
        await asyncio.sleep(2)
    
    async def strategy_clear_cache(self):
        """策略 2：清除缓存并刷新"""
        print("策略 2：清除缓存")
        await self.tab.execute_command('Network.clearBrowserCache')
        await self.tab.refresh()
        await asyncio.sleep(3)
    
    async def strategy_restart_browser(self):
        """策略 3：完全重启浏览器"""
        print("策略 3：重启浏览器")
        if self.tab:
            await self.tab._browser.stop()
        
        browser = Chrome()
        self.tab = await browser.start()
    
    async def adaptive_recovery(self):
        """根据尝试次数尝试不同的恢复策略"""
        strategy_index = min(self.attempt, len(self.strategies) - 1)
        strategy = self.strategies[strategy_index]
        
        print(f"尝试 {self.attempt + 1}：使用 {strategy.__name__}")
        await strategy()
        
        self.attempt += 1
    
    @retry(
        max_retries=3,
        exceptions=[ElementNotFound, WaitElementTimeout, NetworkError],
        on_retry=adaptive_recovery,
        delay=2.0
    )
    async def scrape_with_adaptive_retry(self, url: str):
        await self.tab.go_to(url)
        return await self.tab.find(id='target-content')
```

### 特定失败的自定义异常

```python
import asyncio
from pydoll.decorators import retry
from pydoll.exceptions import PydollException

class RateLimitError(PydollException):
    """检测到速率限制时引发"""
    message = "API 速率限制已超出"

class APIScraper:
    async def wait_for_rate_limit_reset(self):
        """被速率限制时等待更长时间"""
        print("检测到速率限制，等待 60 秒...")
        await asyncio.sleep(60)
    
    @retry(
        max_retries=5,
        exceptions=[RateLimitError],
        on_retry=wait_for_rate_limit_reset,
        delay=10.0,
        exponential_backoff=True
    )
    async def fetch_api_data(self, endpoint: str):
        response = await self.tab.request.get(endpoint)
        
        if response.status == 429:  # 请求过多
            raise RateLimitError("API 速率限制已超出")
        
        return response.json()
```

## 最佳实践总结

1. **始终明确指定异常** - 永不使用默认的 `exceptions=Exception`
2. **对外部服务使用指数退避** - 给服务器恢复时间
3. **保持合理的重试次数** - 通常 3-5 次尝试就足够了
4. **记录重试尝试** - 使用 `on_retry` 记录发生的事情
5. **在装饰方法之前定义回调** - 类定义中的顺序很重要
6. **使回调异步** - 装饰器需要异步回调
7. **在回调中恢复状态** - 使用 `on_retry` 导航回原位置
8. **考虑重试的成本** - 每次重试都会消耗时间和资源
9. **与其他错误处理结合** - 重试不能替代 try/except 块
10. **测试您的重试逻辑** - 确保恢复回调实际有效

## 了解更多

- **[异常处理](../core-concepts.md#error-handling)** - 理解 Pydoll 异常
- **[网络事件](../network/monitoring.md)** - 跟踪和处理网络故障
- **[浏览器选项](../configuration/browser-options.md)** - 配置代理和其他设置
- **[事件系统](event-system.md)** - 构建响应式重试策略

retry 装饰器是一个强大的工具，可以将脆弱的爬虫脚本转变为生产就绪的应用程序。通过将其与周到的恢复策略相结合，您可以构建能够优雅地处理真实网络混乱情况的爬虫。


================================================
FILE: docs/zh/features/advanced/event-system.md
================================================
# 事件系统

Pydoll 的事件系统允许您实时监听和响应浏览器活动。这对于构建动态自动化、监控网络请求、检测页面更改和创建响应式工作流至关重要。

!!! info "另有深入探讨"
    本指南专注于实际使用。有关架构细节和内部实现，请参阅[事件架构深入探讨](../../deep-dive/event-architecture.md)。

## 前提条件

在使用事件之前，您需要启用相应的 CDP 域：

```python
from pydoll.browser.chromium import Chrome

async with Chrome() as browser:
    tab = await browser.start()
    
    # 在监听事件之前启用域
    await tab.enable_page_events()     # 用于页面生命周期事件
    await tab.enable_network_events()  # 用于网络活动
    await tab.enable_dom_events()      # 用于 DOM 更改
```

!!! warning "不启用事件将不会触发"
    如果您注册了回调但忘记启用域，您的回调将永远不会被触发。始终先启用域！

## 基本事件监听

`on()` 方法注册事件监听器：

```python
from pydoll.protocol.page.events import PageEvent, LoadEventFiredEvent

async def handle_page_load(event: LoadEventFiredEvent):
    print(f"页面在 {event['params']['timestamp']} 加载完成")

# 注册回调
await tab.enable_page_events()
callback_id = await tab.on(PageEvent.LOAD_EVENT_FIRED, handle_page_load)
```

### 事件结构

所有事件遵循相同的结构：

```python
{
    'method': 'Page.loadEventFired',  # 事件名称
    'params': {                        # 事件特定数据
        'timestamp': 123456.789
    }
}
```

通过 `event['params']` 访问事件数据：

```python
from pydoll.protocol.network.events import RequestWillBeSentEvent

async def handle_request(event: RequestWillBeSentEvent):
    url = event['params']['request']['url']
    method = event['params']['request']['method']
    print(f"{method} {url}")
```

### 使用类型提示以获得更好的 IDE 支持

使用事件参数类型的类型提示来获取事件键的自动完成：

```python
from pydoll.protocol.network.events import NetworkEvent, RequestWillBeSentEvent
from pydoll.protocol.page.events import PageEvent, LoadEventFiredEvent

# 使用类型提示 - IDE 知道所有可用的键！
async def handle_request(event: RequestWillBeSentEvent):
    # IDE 将自动完成 'params'、'request'、'url' 等
    url = event['params']['request']['url']
    method = event['params']['request']['method']
    timestamp = event['params']['timestamp']
    print(f"{method} {url} 在 {timestamp}")

async def handle_load(event: LoadEventFiredEvent):
    # IDE 知道此事件在 params 中有 'timestamp'
    timestamp = event['params']['timestamp']
    print(f"页面在 {timestamp} 加载完成")

await tab.enable_network_events()
await tab.on(NetworkEvent.REQUEST_WILL_BE_SENT, handle_request)

await tab.enable_page_events()
await tab.on(PageEvent.LOAD_EVENT_FIRED, handle_load)
```

!!! tip "事件参数的类型提示"
    所有事件类型都定义在 `pydoll.protocol.<domain>.events` 中。使用它们可以获得：
    
    - **自动完成**：IDE 建议 `event['params']` 中的可用键
    - **类型安全**：在运行代码之前捕获拼写错误
    - **文档**：查看每个事件提供的数据
    
    事件类型遵循模式：`<EventName>Event`（例如，`RequestWillBeSentEvent`、`ResponseReceivedEvent`）

## 常见事件域

### 页面事件

监控页面生命周期和对话框：

```python
from pydoll.protocol.page.events import PageEvent, JavascriptDialogOpeningEvent

await tab.enable_page_events()

# 页面已加载
await tab.on(PageEvent.LOAD_EVENT_FIRED, lambda e: print("页面已加载！"))

# DOM 就绪
await tab.on(PageEvent.DOM_CONTENT_EVENT_FIRED, lambda e: print("DOM 就绪！"))

# JavaScript 对话框
async def handle_dialog(event: JavascriptDialogOpeningEvent):
    message = event['params']['message']
    dialog_type = event['params']['type']
    print(f"对话框 ({dialog_type}): {message}")
    
    # 自动处理
    if await tab.has_dialog():
        await tab.handle_dialog(accept=True)

await tab.on(PageEvent.JAVASCRIPT_DIALOG_OPENING, handle_dialog)
```

### 网络事件

监控请求和响应：

```python
from pydoll.protocol.network.events import (
    NetworkEvent,
    RequestWillBeSentEvent,
    ResponseReceivedEvent,
    LoadingFailedEvent
)

await tab.enable_network_events()

# 跟踪请求
async def log_request(event: RequestWillBeSentEvent):
    request = event['params']['request']
    print(f"→ {request['method']} {request['url']}")

await tab.on(NetworkEvent.REQUEST_WILL_BE_SENT, log_request)

# 跟踪响应
async def log_response(event: ResponseReceivedEvent):
    response = event['params']['response']
    print(f"← {response['status']} {response['url']}")

await tab.on(NetworkEvent.RESPONSE_RECEIVED, log_response)

# 跟踪失败
async def log_failure(event: LoadingFailedEvent):
    resource_type = event['params']['type']  # 资源类型（如 Document、XHR），此事件不包含 URL
    error = event['params']['errorText']
    print(f"[失败] {resource_type} - {error}")

await tab.on(NetworkEvent.LOADING_FAILED, log_failure)
```

### DOM 事件

响应 DOM 更改：

```python
from pydoll.protocol.dom.events import DomEvent, AttributeModifiedEvent

await tab.enable_dom_events()

# 跟踪属性更改
async def on_attribute_change(event: AttributeModifiedEvent):
    node_id = event['params']['nodeId']
    attr_name = event['params']['name']
    attr_value = event['params']['value']
    print(f"节点 {node_id}: {attr_name}={attr_value}")

await tab.on(DomEvent.ATTRIBUTE_MODIFIED, on_attribute_change)

# 跟踪文档更新
await tab.on(DomEvent.DOCUMENT_UPDATED, lambda e: print("文档已更新！"))
```

## 临时回调

使用 `temporary=True` 进行一次性监听器：

```python
from pydoll.protocol.page.events import PageEvent

# 这只会触发一次，然后自动删除
await tab.on(
    PageEvent.LOAD_EVENT_FIRED,
    lambda e: print("首次加载！"),
    temporary=True
)

await tab.go_to("https://example.com")  # 触发回调
await tab.refresh()                      # 回调不会再次触发
```

!!! tip "非常适合一次性设置"
    临时回调非常适合只应发生一次的初始化任务。

## 在回调中访问 Tab

使用 `functools.partial` 将 tab 传递给您的回调：

```python
from functools import partial
from pydoll.protocol.network.events import NetworkEvent, ResponseReceivedEvent

async def process_response(tab, event: ResponseReceivedEvent):
    # 现在我们可以使用 tab 对象！
    request_id = event['params']['requestId']
    
    # 获取响应体
    body = await tab.get_network_response_body(request_id)
    print(f"响应体: {body[:100]}...")

await tab.enable_network_events()
await tab.on(
    NetworkEvent.RESPONSE_RECEIVED,
    partial(process_response, tab)
)
```

!!! info "为什么使用 Partial？"
    事件系统只将事件数据传递给回调。`partial` 允许您绑定其他参数，如 tab 实例。

## 管理回调

### 删除回调

```python
from pydoll.protocol.page.events import PageEvent

# 保存回调 ID
callback_id = await tab.on(PageEvent.LOAD_EVENT_FIRED, my_callback)

# 稍后删除它
await tab.remove_callback(callback_id)
```

### 清除所有回调

```python
# 删除此 tab 的所有已注册回调
await tab.clear_callbacks()
```

## 实用示例

### 监控 API 调用

```python
import asyncio
from functools import partial
from pydoll.protocol.network.events import NetworkEvent, ResponseReceivedEvent

async def monitor_api_calls(tab):
    collected_data = []
    
    # 类型提示帮助 IDE 自动完成事件键
    async def capture_api_response(tab, data_list, event: ResponseReceivedEvent):
        url = event['params']['response']['url']
        
        # 仅过滤 API 调用
        if '/api/' not in url:
            return
        
        request_id = event['params']['requestId']
        body = await tab.get_network_response_body(request_id)
        
        data_list.append({
            'url': url,
            'body': body,
            'status': event['params']['response']['status']
        })
        print(f"捕获 API 调用: {url}")
    
    await tab.enable_network_events()
    await tab.on(
        NetworkEvent.RESPONSE_RECEIVED,
        partial(capture_api_response, tab, collected_data)
    )
    
    # 导航并收集
    await tab.go_to("https://example.com")
    await asyncio.sleep(3)  # 等待请求完成
    
    return collected_data
```

### 等待特定事件

```python
import asyncio
from pydoll.protocol.page.events import PageEvent, FrameNavigatedEvent

async def wait_for_navigation(tab):
    navigation_done = asyncio.Event()
    
    async def on_navigated(event: FrameNavigatedEvent):
        navigation_done.set()
    
    await tab.enable_page_events()
    await tab.on(PageEvent.FRAME_NAVIGATED, on_navigated, temporary=True)
    
    # 触发导航
    button = await tab.find(id='next-page')
    await button.click()
    
    # 等待它完成
    await navigation_done.wait()
    print("导航完成！")
```

### 网络空闲检测

```python
import asyncio
from pydoll.protocol.network.events import (
    NetworkEvent,
    RequestWillBeSentEvent,
    LoadingFinishedEvent,
    LoadingFailedEvent
)

async def wait_for_network_idle(tab, timeout=5):
    in_flight = 0
    idle_event = asyncio.Event()
    last_activity = asyncio.get_event_loop().time()
    
    async def on_request(event: RequestWillBeSentEvent):
        nonlocal in_flight, last_activity
        in_flight += 1
        last_activity = asyncio.get_event_loop().time()
    
    async def on_finished(event: LoadingFinishedEvent | LoadingFailedEvent):
        nonlocal in_flight, last_activity
        in_flight -= 1
        last_activity = asyncio.get_event_loop().time()
        
        if in_flight == 0:
            idle_event.set()
    
    await tab.enable_network_events()
    req_id = await tab.on(NetworkEvent.REQUEST_WILL_BE_SENT, on_request)
    fin_id = await tab.on(NetworkEvent.LOADING_FINISHED, on_finished)
    fail_id = await tab.on(NetworkEvent.LOADING_FAILED, on_finished)
    
    try:
        await asyncio.wait_for(idle_event.wait(), timeout=timeout)
        print("网络空闲！")
    except asyncio.TimeoutError:
        print(f"{timeout}秒后网络仍然活跃")
    finally:
        # 清理
        await tab.remove_callback(req_id)
        await tab.remove_callback(fin_id)
        await tab.remove_callback(fail_id)
```

### 动态内容抓取

```python
import asyncio
import json
from functools import partial
from pydoll.protocol.network.events import NetworkEvent, ResponseReceivedEvent

async def scrape_infinite_scroll(tab, max_items=100):
    items = []
    
    async def capture_products(tab, items_list, event: ResponseReceivedEvent):
        url = event['params']['response']['url']
        
        # 查找产品 API 端点
        if '/products' not in url:
            return
        
        request_id = event['params']['requestId']
        body = await tab.get_network_response_body(request_id)
        
        try:
            data = json.loads(body)
            if 'items' in data:
                items_list.extend(data['items'])
                print(f"收集了 {len(data['items'])} 个项目（总计: {len(items_list)}）")
        except json.JSONDecodeError:
            pass
    
    await tab.enable_network_events()
    await tab.on(
        NetworkEvent.RESPONSE_RECEIVED,
        partial(capture_products, tab, items)
    )
    
    await tab.go_to("https://example.com/products")
    
    # 滚动以触发无限加载
    while len(items) < max_items:
        await tab.execute_script("window.scrollTo(0, document.body.scrollHeight)")
        await asyncio.sleep(1)
    
    return items[:max_items]
```

## 事件参考表

### 可用域

| 域 | 启用方法 | 常见用例 |
|--------|--------------|------------------|
| Page | `enable_page_events()` | 页面生命周期、导航、对话框 |
| Network | `enable_network_events()` | 请求/响应监控、API 跟踪 |
| DOM | `enable_dom_events()` | DOM 结构更改、属性修改 |
| Fetch | `enable_fetch_events()` | 请求拦截和修改 |
| Runtime | `enable_runtime_events()` | 控制台消息、JavaScript 异常 |

### 关键页面事件

| 事件 | 何时触发 | 用例 |
|-------|---------------|----------|
| `LOAD_EVENT_FIRED` | 页面加载完成 | 等待完整页面加载 |
| `DOM_CONTENT_EVENT_FIRED` | DOM 就绪 | 开始 DOM 操作 |
| `JAVASCRIPT_DIALOG_OPENING` | Alert/confirm/prompt | 自动处理对话框 |
| `FRAME_NAVIGATED` | 导航完成 | 跟踪 SPA 导航 |
| `FILE_CHOOSER_OPENED` | 文件输入被点击 | 自动化文件上传 |

### 关键网络事件

| 事件 | 何时触发 | 用例 |
|-------|---------------|----------|
| `REQUEST_WILL_BE_SENT` | 请求发送前 | 记录/修改传出请求 |
| `RESPONSE_RECEIVED` | 接收响应头 | 捕获 API 响应 |
| `LOADING_FINISHED` | 响应体加载完成 | 获取完整响应数据 |
| `LOADING_FAILED` | 请求失败 | 跟踪错误和重试 |
| `WEB_SOCKET_CREATED` | WebSocket 打开 | 监控实时连接 |

### 关键 DOM 事件

| 事件 | 何时触发 | 用例 |
|-------|---------------|----------|
| `DOCUMENT_UPDATED` | DOM 重建 | 刷新元素引用 |
| `ATTRIBUTE_MODIFIED` | 元素属性更改 | 跟踪动态属性更改 |
| `CHILD_NODE_INSERTED` | 添加新元素 | 检测动态添加的内容 |
| `CHILD_NODE_REMOVED` | 删除元素 | 检测删除的内容 |

### 事件类型参考

所有事件类型及其参数结构都定义在协议模块中：

| 域 | 导入路径 | 示例类型 |
|--------|-------------|---------------|
| Page | `pydoll.protocol.page.events` | `LoadEventFiredEvent`、`FrameNavigatedEvent`、`JavascriptDialogOpeningEvent` |
| Network | `pydoll.protocol.network.events` | `RequestWillBeSentEvent`、`ResponseReceivedEvent`、`LoadingFinishedEvent` |
| DOM | `pydoll.protocol.dom.events` | `DocumentUpdatedEvent`、`AttributeModifiedEvent`、`ChildNodeInsertedEvent` |
| Fetch | `pydoll.protocol.fetch.events` | `RequestPausedEvent`、`AuthRequiredEvent` |
| Runtime | `pydoll.protocol.runtime.events` | `ConsoleAPICalledEvent`、`ExceptionThrownEvent` |

每个事件类型都是一个 `TypedDict`，定义了事件的确切结构，包括 `params` 字典中的所有可用键。

## 最佳实践

### 1. 始终先启用域

```python
from pydoll.protocol.network.events import NetworkEvent

# 好
await tab.enable_network_events()
await tab.on(NetworkEvent.RESPONSE_RECEIVED, callback)

# 坏：回调永远不会触发
await tab.on(NetworkEvent.RESPONSE_RECEIVED, callback)
await tab.enable_network_events()
```

### 2. 完成后清理

```python
from pydoll.protocol.network.events import NetworkEvent

# 为特定任务启用
await tab.enable_network_events()
callback_id = await tab.on(NetworkEvent.REQUEST_WILL_BE_SENT, log_request)

# 执行您的工作...
await tab.go_to("https://example.com")

# 清理
await tab.remove_callback(callback_id)
await tab.disable_network_events()
```

### 3. 使用早期过滤

```python
from pydoll.protocol.network.events import RequestWillBeSentEvent

# 好：早期过滤
async def handle_api_request(event: RequestWillBeSentEvent):
    url = event['params']['request']['url']
    if '/api/' not in url:
        return  # 提前退出
    
    # 仅处理 API 请求
    process_request(event)

# 坏：处理所有内容
async def handle_all_requests(event: RequestWillBeSentEvent):
    url = event['params']['request']['url']
    process_request(event)
    if '/api/' in url:
        do_extra_work(event)
```

### 4. 优雅地处理错误

```python
from pydoll.protocol.network.events import ResponseReceivedEvent

async def safe_callback(event: ResponseReceivedEvent):
    try:
        request_id = event['params']['requestId']
        body = await tab.get_network_response_body(request_id)
        process_body(body)
    except KeyError:
        # 事件可能没有 requestId
        pass
    except Exception as e:
        print(f"回调中的错误: {e}")
        # 继续而不中断事件循环
```

## 性能注意事项

!!! warning "高频事件"
    DOM 事件在动态页面上可能**非常频繁地**触发。使用过滤和防抖动以避免性能问题。

### 按域划分的事件量

| 域 | 事件频率 | 性能影响 |
|--------|----------------|-------------------|
| Page | 低 | 最小 |
| Network | 中-高 | 中等 |
| DOM | 非常高 | 高 |
| Fetch | 中等 | 中等 |

### 优化技巧

1. **仅启用您需要的**：不要一次启用所有域
2. **使用临时回调**：尽可能自动清理
3. **早期过滤**：在昂贵的操作之前检查条件
4. **完成后禁用**：释放资源
5. **避免繁重的处理**：保持回调快速，将工作卸载到单独的任务

```python
import asyncio
from pydoll.protocol.network.events import ResponseReceivedEvent

# 好：快速回调，卸载繁重的工作
async def handle_response(event: ResponseReceivedEvent):
    if should_process(event):
        asyncio.create_task(heavy_processing(event))  # 不阻塞

# 坏：阻塞事件循环
async def handle_response(event: ResponseReceivedEvent):
    await heavy_processing(event)  # 阻塞其他事件
```

## 常见模式

### 事件的上下文管理器

```python
from contextlib import asynccontextmanager
from pydoll.protocol.network.events import NetworkEvent, RequestWillBeSentEvent

@asynccontextmanager
async def monitor_requests(tab):
    """在块期间监控请求的上下文管理器。"""
    requests = []
    
    async def capture(event: RequestWillBeSentEvent):
        requests.append(event['params']['request'])
    
    await tab.enable_network_events()
    cb_id = await tab.on(NetworkEvent.REQUEST_WILL_BE_SENT, capture)
    
    try:
        yield requests
    finally:
        await tab.remove_callback(cb_id)
        await tab.disable_network_events()

# 用法
async with monitor_requests(tab) as requests:
    await tab.go_to("https://example.com")
    # 捕获所有请求

print(f"捕获了 {len(requests)} 个请求")
```

### 条件事件注册

```python
from pydoll.protocol.network.events import NetworkEvent
from pydoll.protocol.dom.events import DomEvent

async def setup_monitoring(tab, track_network=False, track_dom=False):
    """仅启用指定的监控。"""
    callbacks = []
    
    if track_network:
        await tab.enable_network_events()
        cb = await tab.on(NetworkEvent.REQUEST_WILL_BE_SENT, log_request)
        callbacks.append(('network', cb))
    
    if track_dom:
        await tab.enable_dom_events()
        cb = await tab.on(DomEvent.ATTRIBUTE_MODIFIED, log_dom_change)
        callbacks.append(('dom', cb))
    
    return callbacks
```

## 进一步阅读

- **[事件架构深入探讨](../../deep-dive/event-architecture.md)** - 内部实现和 WebSocket 通信
- **[网络监控](../network/monitoring.md)** - 高级网络分析技术
- **[响应式自动化](reactive-automation.md)** - 构建事件驱动的工作流

!!! tip "从简单开始"
    从 Page 事件开始了解基础知识，然后根据需要转向 Network 和 DOM 事件。事件系统很强大，但一开始可能会让人不知所措。

================================================
FILE: docs/zh/features/advanced/remote-connections.md
================================================
# 远程连接和混合自动化

Pydoll 允许您通过 WebSocket 连接到已运行的浏览器，实现远程控制和混合自动化场景。这非常适合 CI/CD 管道、容器化环境、调试会话以及将 Pydoll 与现有 CDP 工具集成。

!!! info "无需设置"
    与启动浏览器的传统自动化不同，远程连接让您控制已经运行的浏览器。不需要进程管理！

## 为什么使用远程连接？

远程连接解锁了强大的自动化场景：

| 用例 | 好处 |
|----------|---------|
| **CI/CD 管道** | 连接到浏览器容器而无需管理进程 |
| **Docker 环境** | 控制在单独容器中运行的浏览器 |
| **远程调试** | 自动化远程服务器或虚拟机上的浏览器 |
| **混合工具** | 将 Pydoll 与现有 CDP 基础设施集成 |
| **开发** | 连接到本地浏览器进行快速测试 |
| **多工具自动化** | 在不同工具之间共享浏览器会话 |

## 设置远程浏览器服务器

!!! tip "已经有远程浏览器服务？"
    如果您正在使用云浏览器服务（BrowserStack、Selenium Grid、LambdaTest 等）或已经有一个运行中的 Chrome 实例并带有 WebSocket URL，您可以**跳过整个部分**，直接跳转到[连接方法](#connection-methods)了解如何使用 Pydoll 连接。

在远程连接之前，您需要启动启用了调试并正确配置以接受外部连接的 Chrome。

### 基本服务器设置（Linux）

在服务器上启动带有远程调试的 Chrome：

```bash
# 基本设置 - 仅从 localhost 可访问
google-chrome \
  --remote-debugging-port=9222 \
  --headless=new \
  --no-sandbox \
  --disable-dev-shm-usage \
  --user-data-dir=/tmp/chrome-profile

# 服务器设置 - 从其他机器可访问
google-chrome \
  --remote-debugging-port=9222 \
  --remote-debugging-address=0.0.0.0 \
  --headless=new \
  --no-sandbox \
  --disable-dev-shm-usage \
  --user-data-dir=/tmp/chrome-profile
```

!!! warning "安全关键"
    使用 `--remote-debugging-address=0.0.0.0` 使调试端口可从**任何网络接口**访问。这对于远程连接是必要的，但如果暴露到互联网，会造成重大安全风险。

### 推荐的服务器配置

```bash
# 生产就绪配置
google-chrome \
  --remote-debugging-port=9222 \
  --remote-debugging-address=0.0.0.0 \
  --headless=new \
  --no-sandbox \
  --disable-dev-shm-usage \
  --disable-gpu \
  --disable-software-rasterizer \
  --disable-extensions \
  --disable-background-networking \
  --disable-background-timer-throttling \
  --disable-client-side-phishing-detection \
  --disable-popup-blocking \
  --disable-prompt-on-repost \
  --disable-sync \
  --metrics-recording-only \
  --no-first-run \
  --safebrowsing-disable-auto-update \
  --user-data-dir=/tmp/chrome-remote-$(date +%s)
```

**关键标志说明：**

| 标志 | 目的 |
|------|---------|
| `--remote-debugging-port=9222` | 在端口 9222 上启用 CDP |
| `--remote-debugging-address=0.0.0.0` | 允许外部连接（安全风险！） |
| `--headless=new` | 无 GUI 运行（服务器模式） |
| `--no-sandbox` | 在 Docker/容器中必需（安全权衡） |
| `--disable-dev-shm-usage` | 防止容器中的 /dev/shm 内存问题 |
| `--disable-gpu` | 无 GPU 加速（建议用于无头模式） |
| `--user-data-dir=/tmp/...` | 每个实例的隔离配置文件 |

!!! warning "关于 --no-sandbox 标志"
    `--no-sandbox` 标志禁用 Chrome 的安全沙箱，该沙箱将浏览器进程与系统隔离。由于内核能力限制，此标志在大多数 Docker/容器环境中是**必需的**，但它带来了安全影响：
    
    - **风险**：移除浏览器和系统之间的隔离
    - **何时使用**：Docker 容器、受限环境
    - **缓解措施**：确保容器级隔离（命名空间、cgroups）并避免以 root 身份运行
    
    仅在绝对必要时考虑使用 `--no-sandbox`，并在容器级别实施额外的安全层。

### Docker 设置

创建容器化的 Chrome 服务器：

!!! tip "使用预构建镜像"
    对于生产环境，考虑使用官方预构建镜像而不是自己构建：
    
    - **Selenium 镜像**：`selenium/standalone-chrome`（包含 WebDriver）
    - **Zenika Alpine Chrome**：`zenika/alpine-chrome`（轻量级，约 200MB）
    - **Browserless**：`browserless/chrome`（生产就绪，带监控）
    
    这些镜像定期更新、经过安全测试，并针对容器环境进行了优化。

**Dockerfile（自定义构建）：**
```dockerfile
FROM ubuntu:22.04

# 安装 Chrome
RUN apt-get update && apt-get install -y \
    wget \
    gnupg \
    ca-certificates \
    && wget -q -O - https://dl.google.com/linux/linux_signing_key.pub | apt-key add - \
    && echo "deb [arch=amd64] http://dl.google.com/linux/chrome/deb/ stable main" >> /etc/apt/sources.list.d/google.list \
    && apt-get update \
    && apt-get install -y google-chrome-stable \
    && rm -rf /var/lib/apt/lists/*

# 暴露调试端口
EXPOSE 9222

# 使用远程调试启动 Chrome
CMD ["google-chrome", \
     "--remote-debugging-port=9222", \
     "--remote-debugging-address=0.0.0.0", \
     "--headless=new", \
     "--no-sandbox", \
     "--disable-dev-shm-usage", \
     "--disable-gpu", \
     "--user-data-dir=/tmp/chrome-profile"]
```

**docker-compose.yml：**
```yaml
services:
  chrome-server:
    build: .
    ports:
      - "127.0.0.1:9222:9222"
    
    # 仅当您需要远程访问且已使用防火墙或代理保护端口时，取消注释下面的行。
    # - "9222:9222"

    shm_size: '2gb'  # 关键：Chrome 使用 /dev/shm 进行共享内存
                      # 默认的 Docker shm_size（64MB）不足
    restart: unless-stopped
    environment:
      - DISPLAY=:99
    networks:
      - automation-network
    # 可选：生产环境的资源限制
    # deploy:
    #   resources:
    #     limits:
    #       cpus: '2'
    #       memory: 4G

  automation-client:
    image: python:3.11
    depends_on:
      - chrome-server
    volumes:
      - ./:/app
    working_dir: /app
    command: python automation_script.py
    environment:
      - CHROME_WS=ws://chrome-server:9222/devtools/browser
    networks:
      - automation-network

networks:
  automation-network:
    driver: bridge
```

**用法：**
```bash
# 启动堆栈
docker-compose up -d

# 检查 Chrome 是否运行
curl http://localhost:9222/json/version

# 从自动化客户端连接（在 Docker 网络内）
# ws://chrome-server:9222/devtools/browser/...
```

### Systemd 服务（Linux 服务器）

创建持久的 Chrome 服务：

**/etc/systemd/system/chrome-remote.service：**
```ini
[Unit]
Description=Chrome Remote Debugging Server
After=network.target

[Service]
Type=simple
User=chrome-user
Group=chrome-user
Environment="DISPLAY=:99"
ExecStart=/usr/bin/google-chrome \
    --remote-debugging-port=9222 \
    --remote-debugging-address=0.0.0.0 \
    --headless=new \
    --no-sandbox \
    --disable-dev-shm-usage \
    --disable-gpu \
    --user-data-dir=/var/lib/chrome-remote
Restart=always
RestartSec=10

[Install]
WantedBy=multi-user.target
```

**设置和管理：**
```bash
# 创建专用用户
sudo useradd -r -s /bin/false chrome-user
sudo mkdir -p /var/lib/chrome-remote
sudo chown chrome-user:chrome-user /var/lib/chrome-remote

# 安装并启用服务
sudo systemctl daemon-reload
sudo systemctl enable chrome-remote
sudo systemctl start chrome-remote

# 检查状态
sudo systemctl status chrome-remote

# 查看日志
sudo journalctl -u chrome-remote -f

# 重启服务
sudo systemctl restart chrome-remote
```

### 网络安全配置

#### 防火墙规则（iptables）

```bash
# 仅允许特定 IP 访问端口 9222
sudo iptables -A INPUT -p tcp --dport 9222 -s 192.168.1.100 -j ACCEPT
sudo iptables -A INPUT -p tcp --dport 9222 -j DROP

# 保存规则
sudo iptables-save > /etc/iptables/rules.v4
```

#### 防火墙规则（ufw）

```bash
# 默认拒绝对端口 9222 的所有访问
sudo ufw deny 9222

# 允许特定 IP
sudo ufw allow from 192.168.1.100 to any port 9222

# 允许特定子网
sudo ufw allow from 192.168.1.0/24 to any port 9222

# 启用防火墙
sudo ufw enable
```

#### Nginx 反向代理（带身份验证）

使用 HTTP 身份验证保护 Chrome 调试：

**/etc/nginx/sites-available/chrome-remote：**
```nginx
server {
    listen 80;
    server_name chrome.example.com;

    # 基本身份验证
    auth_basic "Chrome Remote Debugging";
    auth_basic_user_file /etc/nginx/.htpasswd;

    location / {
        proxy_pass http://localhost:9222;
        proxy_http_version 1.1;
        proxy_set_header Upgrade $http_upgrade;
        proxy_set_header Connection "upgrade";
        proxy_set_header Host $host;
        proxy_set_header X-Real-IP $remote_addr;
        proxy_set_header X-Forwarded-For $proxy_add_x_forwarded_for;
        proxy_read_timeout 86400;
    }
}
```

**设置：**
```bash
# 创建密码文件
sudo htpasswd -c /etc/nginx/.htpasswd admin

# 启用站点
sudo ln -s /etc/nginx/sites-available/chrome-remote /etc/nginx/sites-enabled/
sudo nginx -t
sudo systemctl reload nginx

# 使用身份验证连接
# ws://admin:password@chrome.example.com/devtools/browser/...
```

### 从另一台计算机连接

配置服务器后，从客户端机器连接：

```python
import asyncio
import aiohttp
from pydoll.browser.chromium import Chrome

async def connect_to_remote_server():
    """连接到远程服务器上运行的 Chrome。"""
    # 服务器 IP 和端口
    server_ip = "192.168.1.100"
    server_port = 9222

    async with aiohttp.ClientSession() as session:
        # 1. 查询服务器的版本信息以获取 WebSocket URL
        url = f"http://{server_ip}:{server_port}/json/version"
        
        async with session.get(url) as response:
            data = await response.json()
            ws_url = data['webSocketDebuggerUrl']
            
            print(f"服务器信息:")
            print(f"  浏览器: {data.get('Browser')}")
            print(f"  协议: {data.get('Protocol-Version')}")
            print(f"  WebSocket: {ws_url}")
    
    # 2. 连接到浏览器
    chrome = Chrome()
    tab = await chrome.connect(ws_url)
    
    print(f"\n[成功] 已连接到远程 Chrome 服务器！")
    
    # 3. 正常使用
    await tab.go_to('https://example.com')
    title = await tab.execute_script('return document.title')
    print(f"页面标题: {title}")
    
    # 4. 清理
    await chrome.close()

asyncio.run(connect_to_remote_server())
```

### 测试服务器设置

```bash
# 1. 检查 Chrome 是否运行
ps aux | grep chrome

# 2. 检查端口是否在监听
netstat -tulpn | grep 9222
# 或
ss -tulpn | grep 9222

# 3. 测试本地访问
curl http://localhost:9222/json/version

# 4. 测试远程访问（从客户端机器）
curl http://SERVER_IP:9222/json/version

# 5. 检查 WebSocket URL
curl http://SERVER_IP:9222/json/version | jq -r '.webSocketDebuggerUrl'

# 6. 列出所有可用目标（标签页/页面）
curl http://SERVER_IP:9222/json/list
```

### 多实例设置

在不同端口上运行多个 Chrome 实例：

```bash
#!/bin/bash
# start-chrome-pool.sh

for port in 9222 9223 9224 9225; do
    google-chrome \
        --remote-debugging-port=$port \
        --remote-debugging-address=0.0.0.0 \
        --headless=new \
        --no-sandbox \
        --disable-dev-shm-usage \
        --user-data-dir=/tmp/chrome-$port &
    
    echo "在端口 $port 上启动了 Chrome"
done

echo "Chrome 池已就绪。端口: 9222-9225"
```

**使用池的 Python 客户端：**
```python
import asyncio
from pydoll.browser.chromium import Chrome
import aiohttp

async def connect_to_pool(server_ip: str, ports: list[int]):
    """连接到多个 Chrome 实例。"""
    tasks = []
    
    for port in ports:
        task = connect_to_instance(server_ip, port)
        tasks.append(task)
    
    results = await asyncio.gather(*tasks)
    return results

async def connect_to_instance(server_ip: str, port: int):
    """连接到单个 Chrome 实例。"""
    # 获取 WebSocket URL
    async with aiohttp.ClientSession() as session:
        url = f"http://{server_ip}:{port}/json/version"
        async with session.get(url) as response:
            data = await response.json()
            ws_url = data['webSocketDebuggerUrl']
    
    # 连接
    chrome = Chrome()
    tab = await chrome.connect(ws_url)
    
    # 运行自动化
    await tab.go_to('https://example.com')
    title = await tab.execute_script('return document.title')
    
    print(f"端口 {port}: {title}")
    
    await chrome.close()
    return title

# 用法
asyncio.run(connect_to_pool('192.168.1.100', [9222, 9223, 9224, 9225]))
```

## 连接方法

Pydoll 提供两种远程连接方法，每种都适合不同的场景。

### 方法 1：浏览器级连接

使用 WebSocket 端点连接到运行中的浏览器并访问所有打开的标签页：

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def connect_to_remote_browser():
    chrome = Chrome()
    
    # 通过 WebSocket 连接到远程浏览器
    tab = await chrome.connect('ws://localhost:9222/devtools/browser/XXXX')
    
    # 返回的标签页是第一个可用的标签页
    print(f"已连接到标签页: {await tab.execute_script('return document.title')}")
    
    # 您也可以获取所有其他标签页
    all_tabs = await chrome.get_opened_tabs()
    print(f"可用的标签页总数: {len(all_tabs)}")
    
    # 正常使用标签页
    await tab.go_to('https://example.com')
    element = await tab.find(id='main-content')
    text = await element.text
    print(f"内容: {text}")
    
    # 清理
    await chrome.close()

asyncio.run(connect_to_remote_browser())
```

!!! tip "获取 WebSocket URL"
    启动启用了调试的 Chrome：
    ```bash
    # Linux/Mac
    google-chrome --remote-debugging-port=9222
    
    # Windows
    "C:\Program Files\Google\Chrome\Application\chrome.exe" --remote-debugging-port=9222
    ```
    
    **对于本地连接**（同一台机器）：
    
    - 在浏览器中访问 `http://localhost:9222/json/version` 以在 `webSocketDebuggerUrl` 字段中获取 WebSocket URL
    - 或使用 `aiohttp` 以编程方式查询它，如上面的示例所示
    - 对于快速调试，您还可以在启动本地浏览器实例后检查 `browser._connection_port`
    
    **对于远程连接**（不同机器）：
    
    - 从客户端机器查询 `http://SERVER_IP:9222/json/version`
    - 使用响应中的 `webSocketDebuggerUrl`，如果需要，将 `localhost` 替换为实际服务器 IP

### 方法 2：直接元素控制（混合方法）

如果您已经有自己的 CDP 集成或低级工具，可以用 Pydoll 的高级 API 包装现有元素：

```python
import asyncio
import json
from pydoll.connection.connection_handler import ConnectionHandler
from pydoll.elements.web_element import WebElement

async def custom_cdp_integration():
    """将 Pydoll 与您的自定义 CDP 实现一起使用。"""
    # 您现有的 CDP 设置已找到一个元素
    page_ws = 'ws://localhost:9222/devtools/page/ABC123'
    
    # 您已使用 Runtime.evaluate 查找元素
    # 并获得了其 objectId
    element_object_id = '{\"injectedScriptId\":1,\"id\":1}'
    
    # 创建 Pydoll 连接
    connection = ConnectionHandler(ws_address=page_ws)
    
    # 包装元素
    button = WebElement(
        object_id=element_object_id,
        connection_handler=connection
    )
    
    # 使用 Pydoll 的高级方法
    await button.wait_until(is_visible=True, timeout=5)
    await button.wait_until(is_interactable=True)
    
    # 使用真实偏移点击
    await button.click(x_offset=5, y_offset=5)
    
    # 轻松获取计算的属性
    is_enabled = await button.is_enabled()
    bounds = await button.bounds
    
    print(f"按钮已点击！启用: {is_enabled}, 边界: {bounds}")
    
    # 清理
    await connection.close()

asyncio.run(custom_cdp_integration())
```

!!! tip "对象 ID 格式"
    `objectId` 是由 CDP 命令（如 `Runtime.evaluate` 或 `DOM.resolveNode`）返回的字符串。它通常是一个带有 `injectedScriptId` 和 `id` 等字段的 JSON 字符串。

!!! info "两全其美"
    这种混合方法让您利用现有的 CDP 基础设施，同时受益于 Pydoll 的人性化元素 API 来进行交互、等待和属性访问。

## 安全注意事项

!!! danger "生产环境"
    远程调试端口暴露了对浏览器的**完全控制**，包括：
    
    - 访问所有页面和数据
    - 执行任意 JavaScript 的能力
    - Cookie 和会话访问
    - 通过下载访问文件系统
    
    **未经适当的身份验证和网络安全，切勿将调试端口暴露到互联网！**

### 推荐的安全实践

| 实践 | 原因 | 如何做 |
|----------|-----|-----|
| **SSH 隧道** | 加密流量并进行身份验证 | `ssh -L 9222:localhost:9222 user@host` |
| **VPN** | 网络级安全 | 通过企业/私有 VPN 连接 |
| **防火墙规则** | 限制访问 | 仅允许特定 IP |
| **Docker 网络** | 容器隔离 | 使用私有 Docker 网络 |
| **不公开暴露** | 防止攻击 | 在生产环境中切勿绑定到 `0.0.0.0` |

## 进一步阅读

- **[事件系统](event-system.md)** - 监控远程浏览器事件
- **[网络监控](../network/monitoring.md)** - 跟踪远程浏览器中的请求
- **[浏览器选项](../configuration/browser-options.md)** - 在启动前配置本地浏览器

!!! tip "从本地开始，远程扩展"
    使用 `browser.start()` 在本地开发自动化以进行快速迭代，然后使用 `browser.connect()` 部署到生产 CI/CD 管道和容器化环境。

================================================
FILE: docs/zh/features/automation/file-operations.md
================================================
# 文件操作

文件上传是浏览器自动化中最具挑战性的方面之一。传统工具经常难以处理操作系统级别的文件对话框，需要复杂的解决方法或外部库。Pydoll 提供两种直接的文件上传方法，每种都适合不同的场景。

## 上传方法

Pydoll 支持两种主要的文件上传方法：

1. **直接文件输入**（`set_input_files()`）：快速直接，适用于 `<input type="file">` 元素
2. **文件选择器上下文管理器**（`expect_file_chooser()`）：拦截文件对话框，适用于任何上传触发器

## 直接文件输入

最简单的方法是直接在文件输入元素上使用 `set_input_files()`。这种方法快速、可靠，并完全绕过操作系统文件对话框。

### 基本用法

```python
import asyncio
from pathlib import Path
from pydoll.browser.chromium import Chrome

async def direct_file_upload():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com/upload')
        
        # 查找文件输入元素
        file_input = await tab.find(tag_name='input', type='file')
        
        # 直接设置文件
        file_path = Path('path/to/document.pdf')
        await file_input.set_input_files(file_path)
        
        # 提交表单
        submit_button = await tab.find(id='submit-button')
        await submit_button.click()
        
        print("文件上传成功！")

asyncio.run(direct_file_upload())
```

!!! tip "Path 与字符串"
    虽然推荐使用 `pathlib` 中的 `Path` 对象作为最佳实践，以获得更好的路径处理和跨平台兼容性，但如果您喜欢，也可以使用纯字符串：
    ```python
    await file_input.set_input_files('path/to/document.pdf')  # 也可以！
    ```

### 多个文件

对于接受多个文件的输入（`<input type="file" multiple>`），传递文件路径列表：

```python
import asyncio
from pathlib import Path
from pydoll.browser.chromium import Chrome

async def upload_multiple_files():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com/multi-upload')
        
        file_input = await tab.find(tag_name='input', type='file')
        
        # 一次上传多个文件
        files = [
            Path('documents/report.pdf'),
            Path('images/screenshot.png'),
            Path('data/results.csv')
        ]
        await file_input.set_input_files(files)
        
        # 正常处理
        upload_btn = await tab.find(id='upload-btn')
        await upload_btn.click()

asyncio.run(upload_multiple_files())
```

### 动态路径解析

`Path` 对象使动态构建路径和处理跨平台兼容性变得容易：

```python
import asyncio
from pathlib import Path
from pydoll.browser.chromium import Chrome

async def upload_with_dynamic_paths():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com/upload')
        
        file_input = await tab.find(tag_name='input', type='file')
        
        # 动态构建路径
        project_dir = Path(__file__).parent
        file_path = project_dir / 'uploads' / 'data.json'

        await file_input.set_input_files(file_path)
        # 或使用主目录
        user_file = Path.home() / 'Documents' / 'report.pdf'
        await file_input.set_input_files(user_file)

asyncio.run(upload_with_dynamic_paths())
```

!!! tip "何时使用直接文件输入"
    在以下情况下使用 `set_input_files()`：
    
    - 文件输入在 DOM 中可直接访问
    - 您想要最大的速度和简单性
    - 上传不会触发文件选择器对话框
    - 您正在使用标准的 `<input type="file">` 元素

## 文件选择器上下文管理器

某些网站隐藏文件输入并使用自定义按钮或拖放区域来触发操作系统文件选择器对话框。对于这些情况，使用 `expect_file_chooser()` 上下文管理器。

### 工作原理

`expect_file_chooser()` 上下文管理器：

1. 启用文件选择器拦截
2. 等待文件选择器对话框打开
3. 在对话框出现时自动设置文件
4. 在操作完成后清理

### 基本用法

```python
import asyncio
from pathlib import Path
from pydoll.browser.chromium import Chrome

async def file_chooser_upload():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com/custom-upload')
        
        # 准备文件路径
        file_path = Path.cwd() / 'document.pdf'
        
        # 使用上下文管理器处理文件选择器
        async with tab.expect_file_chooser(files=file_path):
            # 点击自定义上传按钮
            upload_button = await tab.find(class_name='custom-upload-btn')
            await upload_button.click()
            # 对话框打开时文件自动设置
        
        # 继续您的自动化
        print("通过选择器选择的文件！")

asyncio.run(file_chooser_upload())
```

### 使用文件选择器的多个文件

```python
import asyncio
from pathlib import Path
from pydoll.browser.chromium import Chrome

async def multiple_files_chooser():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com/gallery-upload')
        
        # 准备多个文件
        photos_dir = Path.home() / 'photos'
        files = [
            photos_dir / 'img1.jpg',
            photos_dir / 'img2.jpg',
            photos_dir / 'img3.jpg'
        ]
        
        async with tab.expect_file_chooser(files=files):
            # 通过自定义按钮触发上传
            add_photos_btn = await tab.find(text='Add Photos')
            await add_photos_btn.click()
        
        print(f"已选择 {len(files)} 个文件！")

asyncio.run(multiple_files_chooser())
```

### 动态文件选择

```python
import asyncio
from pathlib import Path
from pydoll.browser.chromium import Chrome

async def dynamic_file_selection():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com/batch-upload')
        
        # 使用 Path.glob() 查找目录中的所有 CSV 文件
        data_dir = Path('data')
        csv_files = list(data_dir.glob('*.csv'))
        
        async with tab.expect_file_chooser(files=csv_files):
            upload_area = await tab.find(class_name='drop-zone')
            await upload_area.click()
        
        print(f"已选择 {len(csv_files)} 个 CSV 文件")

asyncio.run(dynamic_file_selection())
```

!!! tip "何时使用文件选择器"
    在以下情况下使用 `expect_file_chooser()`：
    
    - 文件输入被隐藏或不可直接访问
    - 自定义按钮触发文件选择器对话框
    - 使用拖放上传区域
    - 站点使用 JavaScript 打开文件对话框

## 比较：直接与文件选择器

| 特性 | `set_input_files()` | `expect_file_chooser()` |
|---------|---------------------|-------------------------|
| **速度** | ⚡ 即时 | 🕐 等待对话框 |
| **复杂性** | 简单 | 需要上下文管理器 |
| **要求** | 可见的文件输入 | 任何上传触发器 |
| **用例** | 标准表单 | 自定义上传 UI |
| **事件处理** | 不需要 | 使用页面事件 |

## 完整示例

这是一个结合两种方法的综合示例：

```python
import asyncio
from pathlib import Path
from pydoll.browser.chromium import Chrome

async def comprehensive_upload_example():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com/upload-form')
        
        # 场景 1：个人资料图片的直接输入（单个文件）
        avatar_input = await tab.find(id='avatar-upload')
        avatar_path = Path.home() / 'Pictures' / 'profile.jpg'
        await avatar_input.set_input_files(avatar_path)
        
        # 等待预览加载
        await asyncio.sleep(1)
        
        # 场景 2：文档上传的文件选择器
        document_path = Path.cwd() / 'documents' / 'resume.pdf'
        async with tab.expect_file_chooser(files=document_path):
            # 触发文件选择器的自定义样式按钮
            upload_btn = await tab.find(class_name='btn-upload-document')
            await upload_btn.click()
        
        # 等待上传确认
        await asyncio.sleep(2)
        
        # 场景 3：通过文件选择器的多个文件
        certs_dir = Path('certs')
        certificates = [
            certs_dir / 'certificate1.pdf',
            certs_dir / 'certificate2.pdf',
            certs_dir / 'certificate3.pdf'
        ]
        async with tab.expect_file_chooser(files=certificates):
            add_certs_btn = await tab.find(text='Add Certificates')
            await add_certs_btn.click()
        
        # 提交完整表单
        submit_button = await tab.find(type='submit')
        await submit_button.click()
        
        # 等待成功消息
        success_msg = await tab.find(class_name='success-message', timeout=10)
        message_text = await success_msg.text
        print(f"上传结果: {message_text}")

asyncio.run(comprehensive_upload_example())
```

!!! info "方法摘要"
    此示例演示了 Pydoll 文件上传系统的灵活性：
    
    - **单个文件**：直接传递 `Path` 或 `str`（不需要列表）
    - **多个文件**：传递 `Path` 或 `str` 对象的列表
    - **直接输入**：对可见的 `<input>` 元素快速
    - **文件选择器**：适用于自定义上传按钮和隐藏输入

## 了解更多

要更深入地了解文件上传机制：

- **[事件系统](../advanced/event-system.md)**：了解 `expect_file_chooser()` 使用的页面事件
- **[深入探讨：Tab 域](../../deep-dive/tab-domain.md#file-chooser-handling)**：文件选择器拦截的技术细节
- **[深入探讨：事件系统](../../deep-dive/event-system.md#file-chooser-events)**：文件选择器事件如何在底层工作

Pydoll 中的文件操作消除了浏览器自动化中最大的痛点之一，为简单和复杂的上传场景提供了干净、可靠的方法。

================================================
FILE: docs/zh/features/automation/human-interactions.md
================================================
# 类人交互

成功自动化与易被识破的机器人之间的关键区别之一在于交互的逼真程度。Pydoll提供精密工具，使您的自动化操作几乎与人类行为无异。

!!! info "功能状态"
    **已实现:**

    - **人性化键盘**: 可变输入速度，真实错误与自动纠正（传入 `humanize=True`）
    - **人性化滚动**: 基于物理的滚动，包含动量、摩擦、抖动和过冲（传入 `humanize=True`）
    - **人性化鼠标**: 贝塞尔曲线路径、菲茨定律时序、最小急动速度、手抖和过冲（传入 `humanize=True`）

    **即将推出:**

    - **自动随机点击偏移**: 可选参数自动随机化元素内点击位置
    - **悬停行为**: 悬停时的真实延迟与移动效果

## 拟人化交互为何重要

现代网站采用精密的机器人检测技术：

- **事件时间分析**：识别超高速或精准定时操作
- **鼠标轨迹追踪**：识别直线移动或瞬移行为
- **键盘输入模式**：识别无单个按键操作的即时文本插入
- **点击位置**：检测始终精准落在元素中心的点击
- **操作序列**：识别用户行为中的非人类模式

Pydoll通过提供模拟真实用户行为的交互方法，助您规避检测。

## 逼真鼠标移动

鼠标API（`tab.mouse`）提供多层逼真效果的人性化光标控制。启用`humanize=True`时，鼠标移动遵循自然贝塞尔曲线路径，配合菲茨定律时序、最小急动速度曲线、生理性手抖和过冲修正。

```python
from pydoll.browser.chromium import Chrome

async with Chrome() as browser:
    tab = await browser.start()
    await tab.go_to('https://example.com')

    # 以自然曲线路径移动
    await tab.mouse.move(500, 300, humanize=True)

    # 以逼真的移动、偏移和时序点击
    await tab.mouse.click(500, 300, humanize=True)

    # 以自然移动拖拽
    await tab.mouse.drag(100, 200, 500, 400, humanize=True)
```

人性化鼠标操作中应用的关键技术：

- **贝塞尔曲线路径**：具有非对称控制点的曲线轨迹（移动初期曲率更大）
- **菲茨定律时序**：移动持续时间随距离缩放：`MT = a + b × log₂(D/W + 1)`
- **最小急动速度**：钟形速度曲线，起始缓慢、中间达到峰值、结尾缓慢
- **生理性手抖**：高斯噪声（σ ≈ 1像素）与速度成反比
- **过冲与修正**：快速移动约70%概率过冲3–12%，然后修正回来

!!! info "鼠标控制专用文档"
    有关鼠标控制的完整文档，包括所有方法、自定义时序配置、位置追踪和调试模式，请参阅**[鼠标控制](mouse-control.md)**。

## 真实点击模拟

### 基础点击：模拟鼠标事件

`click()`方法模拟真实的鼠标按下与释放事件，区别于基于JavaScript的点击方式：

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def realistic_clicking():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com')
        
        button = await tab.find(id="submit-button")
        
        # 基础真实点击
        await button.click()
        
        # 点击包含：
        # - 鼠标移动至元素
        # - 鼠标按下事件
        # - 可配置按压时长
        # - 鼠标释放事件

asyncio.run(realistic_clicking())
```

### 带位置偏移的点击

真实用户很少精确点击元素中心。使用偏移量改变点击位置：

!!! info "当前状态：手动偏移计算"
    目前每次交互需手动计算并随机化点击偏移量。未来版本将提供可选参数，支持在元素边界内自动随机化点击位置。

```python
import asyncio
import random
from pydoll.browser.chromium import Chrome

async def click_with_offset():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com/form')
        
        submit_button = await tab.find(tag_name="button", type="submit")
        
        # 点击位置略偏离中心（更自然）
        await submit_button.click(
            x_offset=5,   # 中心右偏5像素
            y_offset=-3   # 中心上偏3像素
        )
        
        # 当前方案：每次点击手动调整偏移量以模拟人类行为
        for item in await tab.find(class_name="clickable-item", find_all=True):
            offset_x = random.randint(-10, 10)
            offset_y = random.randint(-10, 10)
            await item.click(x_offset=offset_x, y_offset=offset_y)
            await asyncio.sleep(random.uniform(0.5, 2.0))

asyncio.run(click_with_offset())
```

### 可调点击按压时长

通过调整鼠标按键按压时长模拟不同点击方式：

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def variable_hold_time():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com')
        
        button = await tab.find(class_name="action-button")
        
        # 快速点击（默认0.1秒）
        await button.click(hold_time=0.05)
        
        # 正常点击
        await button.click(hold_time=0.1)
        
        # 更慢、更刻意点击
        await button.click(hold_time=0.2)
        
        # 模拟用户犹豫
        await asyncio.sleep(0.8)
        await button.click(hold_time=0.15)

asyncio.run(variable_hold_time())
```

### 何时使用click()与click_using_js()

理解两者差异对规避检测至关重要：

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def click_methods_comparison():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com')
        
        button = await tab.find(id="interactive-button")
        
        # 方法1：click() - 模拟真实鼠标事件
        # ✅ 触发全部鼠标事件（按下、松开、点击）
        # ✅ 保持元素定位
        # ✅ 更逼真且更难被检测
        # ❌ 需元素可见且在视口内
        await button.click()
        
        # 方法二：click_using_js() - 使用 JavaScript 的 click()
        # ✅ 可作用于隐藏元素
        # ✅ 执行速度更快
        # ✅ 绕过视觉覆盖层
        # ❌ 可能被识别为自动化操作
        # ❌ 无法触发与真实用户相同的事件序列
        await button.click_using_js()

asyncio.run(click_methods_comparison())
```

!!! tip "最佳实践：优先使用鼠标事件"
    用户交互场景请使用`click()`以保持真实感。仅在后端操作、隐藏元素或追求速度且无需规避检测时使用`click_using_js()`。

## 逼真文本输入

Pydoll的键盘API提供两种输入模式，平衡速度与隐蔽性。

!!! info "了解输入模式"
    | 模式 | 参数 | 行为 | 使用场景 |
    |------|------|------|----------|
    | **默认（快速）** | `humanize=False` | 固定50毫秒间隔，无错误 | 速度优先、低风险场景（默认） |
    | **人性化** | `humanize=True` | 可变时序，约2%错误率并自动纠正 | **反机器人规避** |

    `interval`参数已弃用。传入`humanize=True`进行真实输入。

### 人性化自然输入

当传入`humanize=True`时，`type_text()`使用人性化模式，模拟真实人类输入，包含可变速度和自动纠正的偶发错误：

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def natural_typing():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com/login')
        
        username_field = await tab.find(id="username")
        password_field = await tab.find(id="password")

        # 可变速度：按键间隔30-120毫秒
        # 约2%错误率，带真实纠正行为
        await username_field.type_text("john.doe@example.com", humanize=True)
        await password_field.type_text("MyC0mpl3xP@ssw0rd!", humanize=True)

asyncio.run(natural_typing())
```

### 不可见字段的快速输入

对于无需真实模拟的字段（如隐藏字段或后端操作），使用`insert_text()`：

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def fast_vs_realistic_input():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com/form')
        
        # 可见字段的真实输入
        username = await tab.find(id="username")
        await username.click()
        await username.type_text("john_doe", interval=0.12)
        
        # 隐藏/后台字段的快速插入
        hidden_field = await tab.find(id="hidden-token")
        await hidden_field.insert_text("very-long-generated-token-12345678")
        
        # 关键字段采用真实输入模拟
        comment = await tab.find(id="comment-box")
        await comment.click()
        await comment.type_text("This looks like human input!", interval=0.15)

asyncio.run(fast_vs_realistic_input())
```

!!! info "高级键盘控制"
    有关全面的键盘控制文档（包括特殊键、组合键、修饰键及完整键位参考表），请参阅**[键盘控制](keyboard-control.md)**。

## 逼真页面滚动

Pydoll提供专用滚动API，在继续执行前等待滚动完成，使您的自动化更加真实可靠。

!!! info "了解滚动模式"
    Pydoll的滚动API提供**三种不同模式**：

    | 模式 | 参数 | 行为 | 使用场景 |
    |------|------|------|----------|
    | **平滑（默认）** | `smooth=True` | CSS动画，可预测 | 一般浏览模拟（默认） |
    | **人性化** | `humanize=True` | 物理引擎：动量、抖动、过冲 | **反机器人规避** |
    | **即时** | `smooth=False` | 立即传送到目标位置 | 速度优先场景 |

    传入`humanize=True`以启用基于物理的人性化滚动来规避机器人检测。

### 基础方向滚动

使用`scroll.by()`方法精确控制页面任意方向的滚动：

```python
import asyncio
from pydoll.browser.chromium import Chrome
from pydoll.constants import ScrollPosition

async def basic_scrolling():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com/long-page')
        
        # 人性化 - 贝塞尔曲线物理引擎
        # 包含：动量、摩擦、抖动、微停顿、过冲
        await tab.scroll.by(ScrollPosition.DOWN, 500, humanize=True)
        await tab.scroll.by(ScrollPosition.UP, 300, humanize=True)

        # CSS动画 - 外观平滑但时序可预测
        await tab.scroll.by(ScrollPosition.DOWN, 500, humanize=False, smooth=True)

        # 即时传送 - 最快但易被检测
        await tab.scroll.by(ScrollPosition.DOWN, 1000, humanize=False, smooth=False)

asyncio.run(basic_scrolling())
```

### 滚动至特定位置

导航至页面顶部或底部，可控制逼真程度：

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def scroll_to_positions():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com/article')
        
        # 阅读文章开头
        await asyncio.sleep(2.0)
        
        # 人性化滚动（物理引擎，反机器人）
        await tab.scroll.to_bottom(humanize=True)
        await asyncio.sleep(1.5)
        await tab.scroll.to_top(humanize=True)

        # CSS平滑滚动（可预测动画）
        await tab.scroll.to_bottom(humanize=False, smooth=True)
        await asyncio.sleep(1.5)
        await tab.scroll.to_top(humanize=False, smooth=True)

asyncio.run(scroll_to_positions())
```

!!! tip "选择正确的模式"
    - **`humanize=True`**：反机器人规避的最佳选择
    - **默认** (`smooth=True`)：适用于演示、截图和一般自动化
    - **`smooth=False`**：隐蔽性不重要时追求最大速度

### 类人滚动模式

Pydoll的滚动引擎使用**三次贝塞尔曲线**模拟人类滚动的物理特性，包括：

- **动量**：初始速度爆发后逐渐减速
- **摩擦**：基于"物理阻力"的自然减速
- **微停顿**：长距离滚动时的短暂停顿，模拟阅读或眼球移动
- **过冲**：偶尔滚动超过目标后回调

使用`humanize=True`时自动启用此行为。

```python
import asyncio
import random
from pydoll.browser.chromium import Chrome
from pydoll.constants import ScrollPosition

async def human_like_scrolling():
    """模拟阅读文章时的自然滚动模式。"""
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com/article')
        
        # 用户从顶部开始阅读
        await asyncio.sleep(random.uniform(2.0, 4.0))
        
        # 阅读时逐步滚动
        # 滚动引擎处理物理效果（加速/减速）
        for _ in range(random.randint(5, 8)):
            # 变化滚动距离（模拟阅读速度）
            scroll_distance = random.randint(300, 600)
            await tab.scroll.by(
                ScrollPosition.DOWN, 
                scroll_distance, 
                humanize=True  # 启用贝塞尔曲线物理
            )
            
            # 停顿"阅读"内容
            await asyncio.sleep(random.uniform(2.0, 5.0))
        
        # 快速滚动查看末尾
        await tab.scroll.to_bottom(humanize=True)
        await asyncio.sleep(random.uniform(1.0, 2.0))
        
        # 滚回顶部重读某处
        await tab.scroll.to_top(humanize=True)

asyncio.run(human_like_scrolling())
```

### 将元素滚动至可见区

使用`scroll_into_view()`确保元素在截取页面屏幕截图前可见：

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def scroll_for_screenshots():
    """截取页面屏幕截图前将元素滚动至可见区。"""
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com/product')
        
        # 截取完整页面屏幕截图前滚动至价格部分
        pricing_section = await tab.find(id="pricing")
        await pricing_section.scroll_into_view()
        await tab.take_screenshot(path="page_with_pricing.png")
        
        # 截图前滚动至评论区
        reviews = await tab.find(class_name="reviews")
        await reviews.scroll_into_view()
        await tab.take_screenshot(path="page_with_reviews.png")
        
        # 滚动至页脚以捕获完整页面状态
        footer = await tab.find(tag_name="footer")
        await footer.scroll_into_view()
        await tab.take_screenshot(path="page_with_footer.png")
        
        # 注意：click()已自动滚动，因此无需：
        # await button.scroll_into_view()  # 多余！
        # await button.click()  # 此操作已将按钮滚动至可见区

asyncio.run(scroll_for_screenshots())
```

### 处理无限滚动内容

实现滚动模式加载延迟加载的内容：

```python
import asyncio
import random
from pydoll.browser.chromium import Chrome
from pydoll.constants import ScrollPosition

async def infinite_scroll_loading():
    """在无限滚动页面上加载内容。"""
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com/feed')
        
        items_loaded = 0
        max_scrolls = 10
        
        for scroll_num in range(max_scrolls):
            # 滚动至底部触发加载
            await tab.scroll.to_bottom(smooth=True)
            
            # 等待内容加载
            await asyncio.sleep(random.uniform(2.0, 3.0))
            
            # 检查是否加载新项目
            items = await tab.find(class_name="feed-item", find_all=True)
            new_count = len(items)
            
            if new_count == items_loaded:
                print("无更多内容可加载")
                break
            
            items_loaded = new_count
            print(f"滚动 {scroll_num + 1}：已加载 {items_loaded} 项")
            
            # 小幅向上滚动（人类行为）
            if random.random() > 0.7:
                await tab.scroll.by(ScrollPosition.UP, 200, smooth=True)
                await asyncio.sleep(random.uniform(0.5, 1.0))

asyncio.run(infinite_scroll_loading())
```

!!! success "自动等待完成"
    不同于立即返回的`execute_script("window.scrollBy(...)")`，`scroll` API使用CDP的`awaitPromise`参数等待浏览器的`scrollend`事件。这确保后续操作仅在滚动完全完成后执行。

## 组合技术实现最高逼真度

### 完整表单填写示例

以下综合示例融合了所有类人交互技术。**这展示了当前手动实现最高逼真度的方案**。未来版本将自动化处理大部分随机化操作：


```python
import asyncio
import random
from pydoll.browser.chromium import Chrome
from pydoll.constants import Key

async def human_like_form_filling():
    """以最大真实感填写表单以规避检测"""
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com/registration')
        
        # 等待片刻（模拟用户阅读页面）
        await asyncio.sleep(random.uniform(1.5, 3.0))
        
        # 以随机打字速度填写名字
        first_name = await tab.find(id="first-name")
        await first_name.click(
            x_offset=random.randint(-5, 5),
            y_offset=random.randint(-5, 5)
        )
        await asyncio.sleep(random.uniform(0.2, 0.5))
        
        # 手动逐字符输入并随机延迟
        # （未来版本将实现自动化）
        name_text = "John"
        for char in name_text:
            await first_name.type_text(char, interval=0)
            await asyncio.sleep(random.uniform(0.08, 0.22))
        
        # 跳转至下一个字段
        await asyncio.sleep(random.uniform(0.3, 0.8))
        await first_name.press_keyboard_key(Key.TAB)
        
        # 填写姓氏
        await asyncio.sleep(random.uniform(0.2, 0.5))
        last_name = await tab.find(id="last-name")
        await last_name.type_text("Doe", interval=random.uniform(0.1, 0.18))
        
        # 跳转至邮箱字段
        await asyncio.sleep(random.uniform(0.4, 1.0))
        await last_name.press_keyboard_key(Key.TAB)
        
        # 填充邮箱时加入真实停顿
        await asyncio.sleep(random.uniform(0.2, 0.5))
        email = await tab.find(id="email")
        
        email_text = "john.doe@example.com"
        for i, char in enumerate(email_text):
            await email.type_text(char, interval=0)
            # 在@和.符号处延长停顿（自然）
            if char in ['@', '.']:
                await asyncio.sleep(random.uniform(0.2, 0.4))
            else:
                await asyncio.sleep(random.uniform(0.08, 0.2))
        
        # 模拟用户检查输入内容
        await asyncio.sleep(random.uniform(1.0, 2.5))
        
        # 带偏移量的条款同意复选框
        terms_checkbox = await tab.find(id="accept-terms")
        await terms_checkbox.click(
            x_offset=random.randint(-3, 3),
            y_offset=random.randint(-3, 3),
            hold_time=random.uniform(0.08, 0.15)
        )
        
        # 提交前暂停（用户审核表单）
        await asyncio.sleep(random.uniform(1.5, 3.0))
        
        # 模拟真实参数点击提交按钮
        submit_button = await tab.find(tag_name="button", type="submit")
        await submit_button.click(
            x_offset=random.randint(-8, 8),
            y_offset=random.randint(-5, 5),
            hold_time=random.uniform(0.1, 0.2)
        )
        
        print("表单已按人类行为提交")

asyncio.run(human_like_form_filling())
```

## 规避检测的最佳实践

!!! tip "当前需手动随机化"
    以下最佳实践代表**Pydoll的当前状态**，您必须手动实现随机化。虽然这需要更多代码，但能让您精细控制行为。未来版本将自动实现这些模式，同时保持同等逼真度。

### 1. 始终添加随机延迟

```python
import asyncio
import random
from pydoll.browser.chromium import Chrome

# 错误示例：可预测的操作时序
await element1.click()
await element2.click()
await element3.click()

# 良好：可变时序（当前必需）
await element1.click()
await asyncio.sleep(random.uniform(0.5, 1.5))
await element2.click()
await asyncio.sleep(random.uniform(0.8, 2.0))
await element3.click()
```

### 2. 变化点击位置

```python
import asyncio
import random
from pydoll.browser.chromium import Chrome

# 错误示例：始终点击中心位置
for button in buttons:
    await button.click()

# 正确示例：随机变化点击位置（当前需手动设置）
for button in buttons:
    await button.click(
        x_offset=random.randint(-10, 10),
        y_offset=random.randint(-10, 10)
    )
```

### 3. 模拟自然用户行为

```python
import asyncio
import random
from pydoll.browser.chromium import Chrome
from pydoll.constants import ScrollPosition

async def natural_user_simulation(tab):
    # 用户到达页面
    await tab.go_to('https://example.com')
    
    # 用户阅读页面内容（1-3秒）
    await asyncio.sleep(random.uniform(1.0, 3.0))
    
    # 用户向下滚动查看更多内容
    await tab.scroll.by(ScrollPosition.DOWN, 300, smooth=True)
    await asyncio.sleep(random.uniform(0.5, 1.5))
    
    # 用户找到并点击按钮
    button = await tab.find(class_name="cta-button")
    await button.click(
        x_offset=random.randint(-5, 5),
        y_offset=random.randint(-5, 5)
    )
    
    # 用户等待内容加载
    await asyncio.sleep(random.uniform(0.8, 1.5))
```

### 4. 组合多种技术

```python
import asyncio
import random
from pydoll.browser.chromium import Chrome

async def advanced_stealth_automation():
    """组合多种技术实现最大隐蔽性"""
    async with Chrome() as browser:
        tab = await browser.start()
        
        # 模拟人类等待页面加载
        await tab.go_to('https://example.com/sensitive-page')
        await asyncio.sleep(random.uniform(2.0, 4.0))
        
        # 模拟真实滚动（当前手动实现）
        # 未来版本将提供带惯性效果的专用滚动方法
        for _ in range(random.randint(2, 4)):
            scroll_amount = random.randint(200, 500)
            await tab.execute_script(f"window.scrollBy(0, {scroll_amount})")
            await asyncio.sleep(random.uniform(0.8, 2.0))
        
        # 超时查找元素（模拟用户搜索）
        target = await tab.find(
            class_name="target-element",
            timeout=random.randint(3, 7)
        )
        
        # 模拟真实点击参数
        await target.click(
            x_offset=random.randint(-12, 12),
            y_offset=random.randint(-8, 8),
            hold_time=random.uniform(0.09, 0.18)
        )
        
        # 人类反应时间
        await asyncio.sleep(random.uniform(0.5, 1.2))

asyncio.run(advanced_stealth_automation())
```

## 性能与逼真度权衡

有时需要在速度与逼真度之间找到平衡：

```python
import asyncio
import random
from pydoll.browser.chromium import Chrome

async def balanced_automation():
    """根据场景选择适当的逼真度级别"""
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com/scraping-target')
        
        # 阶段1：初始交互（高逼真度）
        # 此时检测系统最为活跃
        login_button = await tab.find(text="Login")
        await asyncio.sleep(random.uniform(1.0, 2.0))
        await login_button.click(
            x_offset=random.randint(-5, 5),
            y_offset=random.randint(-5, 5)
        )
        
        await asyncio.sleep(random.uniform(0.5, 1.0))
        
        username = await tab.find(id="username")
        await username.type_text("user@example.com", interval=0.12)
        
        await asyncio.sleep(random.uniform(0.3, 0.7))
        
        password = await tab.find(id="password")
        await password.type_text("password123", interval=0.10)
        
        submit = await tab.find(type="submit")
        await asyncio.sleep(random.uniform(0.8, 1.5))
        await submit.click()
        
        # 阶段2：已认证数据提取（低逼真度，高速度）
        # 成功认证后受审查较少
        await asyncio.sleep(2)
        
        # 快速浏览页面
        items = await tab.find(class_name="data-item", find_all=True)
        
        for item in items:
            # 无偏移量快速点击
            await item.click_using_js()
            await asyncio.sleep(0.3)  # 最小延迟
            
            # 提取数据
            title = await tab.find(class_name="title")
            data = await title.text
            
            # 快速导航
            await tab.execute_script("window.history.back()")
            await asyncio.sleep(0.5)

asyncio.run(balanced_automation())
```

## 监控与调整

测试自动化操作的逼真度：

```python
import asyncio
import random
import time
from pydoll.browser.chromium import Chrome

async def test_interaction_timing():
    """记录时序以确保逼真的行为模式"""
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com/test-page')
        
        # 测量并记录交互时序
        elements = await tab.find(class_name="clickable", find_all=True)
        
        timings = []
        last_time = time.time()
        
        for i, element in enumerate(elements):
            await element.click(
                x_offset=random.randint(-8, 8),
                y_offset=random.randint(-8, 8)
            )
            
            current_time = time.time()
            elapsed = current_time - last_time
            timings.append(elapsed)
            
            print(f"点击 {i+1}: 距上次操作 {elapsed:.3f}秒")
            last_time = current_time
            
            await asyncio.sleep(random.uniform(0.5, 2.0))
        
        # 分析时序分布
        avg_time = sum(timings) / len(timings)
        print(f"\n操作间平均时间: {avg_time:.3f}秒")
        print(f"最小值: {min(timings):.3f}秒, 最大值: {max(timings):.3f}秒")
        
        # 良好：可变时序且平均时间逼真（1-2秒）
        # 不佳：恒定时序或速度不真实（<0.1秒）

asyncio.run(test_interaction_timing())
```

## 了解更多

有关元素交互方法的更多信息：

- **[元素查找](../element-finding.md)**：定位需要交互的元素
- **[WebElement域](../../deep-dive/architecture/webelement-domain.md)**：深入了解WebElement功能
- **[文件操作](file-operations.md)**：上传文件和处理下载

掌握类人交互技术，您的自动化将更可靠、更难检测，并更贴近真实用户行为。


================================================
FILE: docs/zh/features/automation/iframes.md
================================================
# 处理 IFrame

现代网页经常使用 `<iframe>` 嵌入其他文档。旧版本的 Pydoll 需要手动调用 `tab.get_frame()` 把 iframe 转成 `Tab` 并管理 CDP target。**现在不再需要这样做。**  
iframe 现在和其他 `WebElement` 一样：可以直接调用 `find()`、`query()`、`execute_script()`、`inner_html`、`text` 等方法，Pydoll 会自动在正确的浏览上下文中执行（无论是否跨域）。

!!! info "更轻松的心智模型"
    把 iframe 当成页面上的普通 `div`。找到它后，就以它为起点继续查找内部元素。Pydoll 会自动创建隔离执行环境，缓存上下文，并处理多层嵌套。

## 快速入门

### 与页面上的第一个 iframe 交互

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def interact_with_iframe():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com/page-with-iframe')

        iframe = await tab.find(tag_name='iframe', id='content-frame')

        # 以下调用都会在 iframe 内部执行
        title = await iframe.find(tag_name='h1')
        await title.click()

        form = await iframe.find(id='login-form')
        username = await form.find(name='username')
        await username.type_text('john_doe')

asyncio.run(interact_with_iframe())
```

### 多层 iframe

逐层查找即可：

```python
outer = await tab.find(id='outer-frame')
inner = await outer.find(tag_name='iframe')  # 在外层 iframe 内继续查找

submit_button = await inner.find(id='submit')
await submit_button.click()
```

流程始终相同：

1. 找到需要的 iframe 元素。
2. 使用该 `WebElement` 作为新的查找范围。
3. 如果还有内层 iframe，重复以上步骤。

### 在 iframe 中执行 JavaScript

```python
iframe = await tab.find(tag_name='iframe')
result = await iframe.execute_script('return document.title', return_by_value=True)
print(result['result']['result']['value'])
```

Pydoll 会自动在 iframe 的隔离上下文中执行脚本，同样适用于跨域 iframe。

## 为什么这样更好？

- **直观：** DOM 树是什么样子，就怎么编写脚本。
- **无需了解 CDP 细节：** 隔离世界、执行上下文、target 缓存全部由 Pydoll 处理。
- **天然支持嵌套：** 每次查找都以当前元素为范围，多层结构依然清晰。
- **统一 API：** 不再需要在 `Tab` 与 `WebElement` 方法之间切换。

!!! tip "`Tab.get_frame()` 将被移除"
    现在调用 `Tab.get_frame()` 会抛出 `DeprecationWarning`，并将在未来版本删除。请尽快改为直接使用 iframe 元素。

## 常见模式

### 截取 iframe 内部元素的截图

```python
iframe = await tab.find(tag_name='iframe')
chart = await iframe.find(id='sales-chart')
await chart.take_screenshot('chart.png')
```

### 遍历多个 iframe

```python
iframes = await tab.find(tag_name='iframe', find_all=True)
for frame in iframes:
    heading = await frame.find(tag_name='h2')
    print(await heading.text)
```

### 等待 iframe 内容加载

```python
iframe = await tab.find(tag_name='iframe')
await iframe.wait_until(is_visible=True, timeout=10)
banner = await iframe.find(id='promo-banner')
```

## 跨 iframe 选择器

无需手动逐个查找 iframe 再在其中搜索，您可以编写一个**单一选择器**来跨越 iframe 边界。Pydoll 会自动检测 XPath 或 CSS 选择器中的 `iframe` 步骤，将其拆分为片段，并依次遍历 iframe 链。

### CSS 选择器

在 `iframe` 复合选择器后使用任意标准组合器（`>`、空格）：

```python
# 单个 iframe 穿越
button = await tab.query('iframe > .submit-btn')

# iframe 上带属性选择器
button = await tab.query('iframe[src*="checkout"] > #pay-button')

# 嵌套 iframe
element = await tab.query('iframe.outer > iframe.inner > div.content')

# iframe 后的多步查找
link = await tab.query('iframe > nav > a.home-link')

# iframe 在其他元素内部（不在根位置）
button = await tab.query('div > iframe > button.submit')
content = await tab.query('.wrapper iframe > div.content')
```

### XPath 表达式

在 `iframe` 步骤后使用 `/` —— Pydoll 会在 iframe 节点处拆分：

```python
# 单个 iframe 穿越
button = await tab.query('//iframe/body/button[@id="submit"]')

# iframe 在其他元素内部（不在根位置）
div = await tab.query('//div/iframe/div')
item = await tab.query('//div[@class="wrapper"]/iframe/body/div')

# iframe 上带谓词
heading = await tab.query('//iframe[contains(@src, "cloudflare")]//h1')

# 嵌套 iframe
element = await tab.query('//iframe[@id="outer"]//iframe[@id="inner"]//div')
```

### 工作原理

当 Pydoll 遇到类似 `iframe[src*="checkout"] > form > button` 的选择器时：

1. **解析**选择器为片段：`iframe[src*="checkout"]` 和 `form > button`
2. 使用第一个片段**查找** iframe 元素
3. 使用第二个片段**在 iframe 内部搜索**
4. 对于嵌套 iframe，在每个边界重复此过程

这等同于手动方式，但只需一次调用：

```python
# 手动方式（仍然有效）
iframe = await tab.find(tag_name='iframe', src='*checkout*')
button = await iframe.query('form > button')

# 自动方式（相同结果，一行代码）
button = await tab.query('iframe[src*="checkout"] > form > button')
```

### 不进行拆分的情况

只有当 `iframe` 作为**标签名**出现时才会进行拆分。以下选择器保持不变：

- `.iframe > body` —— 类选择器，不是标签
- `#iframe > body` —— ID 选择器
- `div.iframe > body` —— 标签是 `div`，不是 `iframe`
- `[data-type="iframe"] > body` —— 属性选择器
- `iframe` 或 `//iframe` —— iframe 后无内容（没有需要搜索的内容）

### find_all 支持

最后一个片段支持 `find_all=True`，返回最终 iframe 内所有匹配的元素：

```python
# 获取 iframe 内的所有链接
links = await tab.query('iframe > a', find_all=True)
```

## 最佳实践

- **把 iframe 作为作用域：** 在 iframe `WebElement` 上调用 `find`、`query`、`execute_script` 等方法。
- **避免 `tab.find` 查找内部元素：** 它只能访问顶级文档。
- **复用引用：** Pydoll 会缓存 iframe 的上下文，可重复使用。
- **现有工作流保持一致：** 滚动、截图、等待、脚本执行、读取属性等操作与普通元素完全一致。

## 延伸阅读

- **[元素查找](../element-finding.md)** —— 介绍查找范围与链式查询。
- **[截图与 PDF](screenshots-and-pdfs.md)** —— 讲解如何获取视觉输出。
- **[事件系统](../advanced/event-system.md)** —— 以事件驱动方式监听页面变化（包括 iframe）。

在新模型下，iframe 不再是“特殊情况”。把它视为普通 DOM 节点，专注于自动化逻辑，其余复杂度交给 Pydoll 处理。

================================================
FILE: docs/zh/features/automation/keyboard-control.md
================================================
# 键盘控制

键盘 API 提供了在页面级别对键盘输入的完全控制，使您能够模拟真实的输入、执行快捷键和控制复杂的按键序列。与元素级键盘方法不同，键盘 API 在页面上全局操作，为您提供与任何焦点元素交互或触发页面级键盘操作的灵活性。

!!! info "集中式键盘接口"
    所有键盘操作均可通过 `tab.keyboard` 访问，为所有键盘交互提供统一的 API。

!!! warning "重要的 CDP 限制：浏览器 UI 快捷键无法使用"
    **已知问题**：通过 Chrome DevTools Protocol 注入的事件被标记为"不可信"，**不会**触发浏览器 UI 操作或创建用户手势。
    
    **不起作用的功能：**

    - 浏览器快捷键（Ctrl+T、Ctrl+W、Ctrl+N）
    - 开发者工具快捷键（F12、Ctrl+Shift+I）
    - 浏览器导航（Ctrl+Shift+T 重新打开标签）
    - 任何修改浏览器 UI 或窗口的快捷键
    
    **完美工作的功能：**

    - 页面级快捷键（Ctrl+A、Ctrl+C、Ctrl+V、Ctrl+F）
    - 文本选择和操作
    - 表单导航（Tab、Enter、方向键）
    - 输入字段交互
    - 自定义应用快捷键（在 Web 应用中）
    
    **技术原因**：CDP 事件不会创建浏览器安全所需的"用户手势"。参见 [chromium issue #615341](https://bugs.chromium.org/p/chromium/issues/detail?id=615341) 和 [CDP 文档](https://chromedevtools.github.io/devtools-protocol/tot/Input/#method-dispatchKeyEvent)。
    
    对于浏览器级自动化，请直接使用 CDP 浏览器命令（如 `tab.close()`、`browser.new_tab()`），而不是键盘快捷键。

## 快速开始

键盘 API 提供三种主要方法:

```python
from pydoll.browser import Chrome
from pydoll.constants import Key

async with Chrome() as browser:
    tab = await browser.start()
    await tab.go_to('https://example.com')
    
    # 按下并释放一个键
    await tab.keyboard.press(Key.ENTER)
    
    # 执行快捷键组合
    await tab.keyboard.hotkey(Key.CONTROL, Key.S)  # Ctrl+S
    
    # 手动控制
    await tab.keyboard.down(Key.SHIFT)
    await tab.keyboard.press(Key.ARROWRIGHT)
    await tab.keyboard.up(Key.SHIFT)
```

## 核心方法

### Press: 完整的按键操作

`press()` 方法执行完整的按键周期（按下 → 等待 → 释放）:

```python
from pydoll.constants import Key

# 基本按键
await tab.keyboard.press(Key.ENTER)
await tab.keyboard.press(Key.TAB)
await tab.keyboard.press(Key.ESCAPE)

# 带修饰键的按键
await tab.keyboard.press(Key.S, modifiers=2)  # Ctrl+S（手动修饰符）

# 自定义按住时长
await tab.keyboard.press(Key.SPACE, interval=0.5)  # 按住 500 毫秒
```

**参数:**

- `key`: 要按下的键（来自 `Key` 枚举）
- `modifiers` (可选): 修饰符标志（Alt=1, Ctrl=2, Meta=4, Shift=8）
- `interval` (可选): 按住键的时长（秒）（默认: 0.1）

### Down: 按下键而不释放

`down()` 方法按下键但不释放它，对于按住修饰键或创建按键序列很有用:

```python
from pydoll.constants import Key

# 按住 Shift 键的同时按其他键
await tab.keyboard.down(Key.SHIFT)
await tab.keyboard.press(Key.ARROWRIGHT)  # 选择文本
await tab.keyboard.press(Key.ARROWRIGHT)  # 继续选择
await tab.keyboard.up(Key.SHIFT)

# 使用修饰符标志按下
await tab.keyboard.down(Key.A, modifiers=2)  # Ctrl+A（全选）
```

**参数:**

- `key`: 要按下的键
- `modifiers` (可选): 要应用的修饰符标志

### Up: 释放按键

`up()` 方法释放先前按下的键:

```python
from pydoll.constants import Key

# 手动按键序列
await tab.keyboard.down(Key.CONTROL)
await tab.keyboard.down(Key.SHIFT)
await tab.keyboard.press(Key.T)  # Ctrl+Shift+T
await tab.keyboard.up(Key.SHIFT)
await tab.keyboard.up(Key.CONTROL)
```

**参数:**

- `key`: 要释放的键

!!! tip "何时使用每种方法"

    - **`press()`**: 单个按键操作（Enter、Tab、字母）
    - **`hotkey()`**: 键盘快捷键（Ctrl+C、Ctrl+Shift+T）
    - **`down()`/`up()`**: 复杂序列、按住修饰键、自定义时序

## 快捷键：轻松实现键盘快捷方式

`hotkey()` 方法自动检测修饰键并正确执行快捷键:

### 基本快捷键

```python
from pydoll.constants import Key

# 常用快捷键
await tab.keyboard.hotkey(Key.CONTROL, Key.C)  # 复制
await tab.keyboard.hotkey(Key.CONTROL, Key.V)  # 粘贴
await tab.keyboard.hotkey(Key.CONTROL, Key.X)  # 剪切
await tab.keyboard.hotkey(Key.CONTROL, Key.Z)  # 撤销
await tab.keyboard.hotkey(Key.CONTROL, Key.Y)  # 重做
await tab.keyboard.hotkey(Key.CONTROL, Key.A)  # 全选
await tab.keyboard.hotkey(Key.CONTROL, Key.S)  # 保存

```

### 三键组合

```python
from pydoll.constants import Key

# 文本编辑快捷键（这些有效！）
await tab.keyboard.hotkey(Key.CONTROL, Key.SHIFT, Key.ARROWLEFT)  # 向左选择单词
await tab.keyboard.hotkey(Key.CONTROL, Key.SHIFT, Key.ARROWRIGHT)  # 向右选择单词
await tab.keyboard.hotkey(Key.CONTROL, Key.SHIFT, Key.HOME)  # 选择到文档开头
await tab.keyboard.hotkey(Key.CONTROL, Key.SHIFT, Key.END)  # 选择到文档末尾

# 应用特定快捷键（如果 Web 应用支持）
await tab.keyboard.hotkey(Key.CONTROL, Key.SHIFT, Key.Z)  # 在许多应用中重做
await tab.keyboard.hotkey(Key.CONTROL, Key.SHIFT, Key.S)  # 另存为（如果应用支持）
```

### 平台特定快捷键

```python
import sys
from pydoll.constants import Key

# 在 macOS 上使用 Meta（Command），在 Windows/Linux 上使用 Control
modifier = Key.META if sys.platform == 'darwin' else Key.CONTROL

await tab.keyboard.hotkey(modifier, Key.C)  # 复制（平台感知）
await tab.keyboard.hotkey(modifier, Key.V)  # 粘贴（平台感知）
```

### 快捷键工作原理

`hotkey()` 方法智能处理修饰键:

1. **检测修饰键**: 自动识别 Ctrl、Shift、Alt、Meta
2. **计算标志**: 使用按位或组合修饰键（Ctrl=2, Shift=8 → 10）
3. **正确应用**: 按下非修饰键时应用修饰符标志
4. **干净释放**: 按相反顺序释放键

```python
from pydoll.constants import Key

# hotkey(Key.CONTROL, Key.SHIFT, Key.T) 的幕后:
# 1. 检测: modifiers=[CONTROL, SHIFT], keys=[T]
# 2. 计算: modifier_value = 2 | 8 = 10
# 3. 执行: 按下 T，modifiers=10
# 4. 释放: 释放 T
```

!!! tip "修饰符值"
    手动使用 `modifiers` 参数时:

    - Alt = 1
    - Ctrl = 2
    - Meta/Command = 4
    - Shift = 8
    
    组合它们: Ctrl+Shift = 2 + 8 = 10

## 可用按键

`Key` 枚举提供全面的键盘覆盖:

### 字母键 (A-Z)

```python
from pydoll.constants import Key

# 所有字母 A 到 Z
await tab.keyboard.press(Key.A)
await tab.keyboard.press(Key.Z)
```

### 数字键

```python
from pydoll.constants import Key

# 顶部行数字 (0-9)
await tab.keyboard.press(Key.DIGIT0)
await tab.keyboard.press(Key.DIGIT9)

# 数字键盘数字
await tab.keyboard.press(Key.NUMPAD0)
await tab.keyboard.press(Key.NUMPAD9)
```

### 功能键

```python
from pydoll.constants import Key

# F1 到 F12
await tab.keyboard.press(Key.F1)
await tab.keyboard.press(Key.F12)
```

### 导航键

```python
from pydoll.constants import Key

await tab.keyboard.press(Key.ARROWUP)
await tab.keyboard.press(Key.ARROWDOWN)
await tab.keyboard.press(Key.ARROWLEFT)
await tab.keyboard.press(Key.ARROWRIGHT)
await tab.keyboard.press(Key.HOME)
await tab.keyboard.press(Key.END)
await tab.keyboard.press(Key.PAGEUP)
await tab.keyboard.press(Key.PAGEDOWN)
```

### 修饰键

```python
from pydoll.constants import Key

await tab.keyboard.press(Key.CONTROL)
await tab.keyboard.press(Key.SHIFT)
await tab.keyboard.press(Key.ALT)
await tab.keyboard.press(Key.META)  # macOS 上的 Command，Windows 上的 Windows 键
```

### 特殊键

```python
from pydoll.constants import Key

await tab.keyboard.press(Key.ENTER)
await tab.keyboard.press(Key.TAB)
await tab.keyboard.press(Key.SPACE)
await tab.keyboard.press(Key.BACKSPACE)
await tab.keyboard.press(Key.DELETE)
await tab.keyboard.press(Key.ESCAPE)
await tab.keyboard.press(Key.INSERT)
```

## 实用示例

### 表单导航

```python
from pydoll.browser import Chrome
from pydoll.constants import Key

async def fill_form_with_keyboard():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com/form')
        
        # 聚焦第一个字段并输入
        first_field = await tab.find(id='name')
        await first_field.click()
        await first_field.insert_text('张三')
        
        # 使用 Tab 键导航到下一个字段
        await tab.keyboard.press(Key.TAB)
        await tab.keyboard.press(Key.TAB)  # 跳过一个字段
        
        # 在当前焦点字段中输入
        second_field = await tab.find(id='email')
        await second_field.insert_text('zhangsan@example.com')
        
        # 使用 Enter 提交
        await tab.keyboard.press(Key.ENTER)
```

### 文本选择和操作

```python
from pydoll.constants import Key

async def select_and_replace_text():
    # 全选文本
    await tab.keyboard.hotkey(Key.CONTROL, Key.A)
    
    # 复制选中内容
    await tab.keyboard.hotkey(Key.CONTROL, Key.C)
    
    # 移动到末尾
    await tab.keyboard.press(Key.END)
    
    # 逐字选择
    await tab.keyboard.down(Key.CONTROL)
    await tab.keyboard.down(Key.SHIFT)
    await tab.keyboard.press(Key.ARROWLEFT)
    await tab.keyboard.press(Key.ARROWLEFT)
    await tab.keyboard.up(Key.SHIFT)
    await tab.keyboard.up(Key.CONTROL)
    
    # 删除选中内容
    await tab.keyboard.press(Key.DELETE)
```

### 下拉菜单和选择导航

```python
from pydoll.constants import Key

async def navigate_dropdown():
    # 打开下拉菜单
    select = await tab.find(tag_name='select')
    await select.click()
    
    # 使用箭头键导航选项
    await tab.keyboard.press(Key.ARROWDOWN)
    await tab.keyboard.press(Key.ARROWDOWN)
    
    # 使用 Enter 选择
    await tab.keyboard.press(Key.ENTER)
    
    # 或使用 Escape 取消
    await tab.keyboard.press(Key.ESCAPE)
```

### 复杂按键序列

```python
from pydoll.constants import Key
import asyncio

async def complex_editing():
    # 选择行
    await tab.keyboard.press(Key.HOME)  # 移动到开头
    await tab.keyboard.down(Key.SHIFT)
    await tab.keyboard.press(Key.END)  # 选择到末尾
    await tab.keyboard.up(Key.SHIFT)
    
    # 剪切
    await tab.keyboard.hotkey(Key.CONTROL, Key.X)
    
    # 向下移动并粘贴
    await tab.keyboard.press(Key.ARROWDOWN)
    await tab.keyboard.hotkey(Key.CONTROL, Key.V)
    
    # 如果需要，撤销
    await tab.keyboard.hotkey(Key.CONTROL, Key.Z)
```

## 最佳实践

### 1. 添加延迟以提高可靠性

```python
from pydoll.constants import Key
import asyncio

# 好: 等待 UI 更新
await tab.keyboard.hotkey(Key.CONTROL, Key.F)  # 打开查找
await asyncio.sleep(0.2)  # 等待对话框
await tab.keyboard.press(Key.ESCAPE)  # 关闭它

# 差: 没有延迟，可能不起作用
await tab.keyboard.hotkey(Key.CONTROL, Key.F)
await tab.keyboard.press(Key.ESCAPE)  # 可能太快了
```

### 2. 输入前聚焦元素

```python
from pydoll.constants import Key

# 好: 确保元素已聚焦
input_field = await tab.find(id='search')
await input_field.click()  # 聚焦它
await input_field.insert_text('query')

# 差: 键盘输入进入错误元素
await tab.keyboard.press(Key.A)  # 这会去哪里？
```

### 3. 使用平台感知快捷键

```python
import sys
from pydoll.constants import Key

# 好: 平台感知
cmd_key = Key.META if sys.platform == 'darwin' else Key.CONTROL
await tab.keyboard.hotkey(cmd_key, Key.C)

# 差: 硬编码（在 macOS 上不起作用）
await tab.keyboard.hotkey(Key.CONTROL, Key.C)
```

### 4. 清理长序列

```python
from pydoll.constants import Key

# 好: 确保修饰键被释放
try:
    await tab.keyboard.down(Key.SHIFT)
    await tab.keyboard.press(Key.ARROWRIGHT)
    # ... 更多操作
finally:
    await tab.keyboard.up(Key.SHIFT)  # 始终释放

# 差: 错误时修饰键保持按下
await tab.keyboard.down(Key.SHIFT)
await tab.keyboard.press(Key.ARROWRIGHT)
# 这里出错会让 Shift 保持按下！
```

## 按键参考表

### 常用页面级快捷键（这些有效！）

| 操作 | Windows/Linux | macOS | 备注 |
|------|--------------|-------|------|
| 复制 | Ctrl+C | Cmd+C | 有效 |
| 粘贴 | Ctrl+V | Cmd+V | 有效 |
| 剪切 | Ctrl+X | Cmd+X | 有效 |
| 撤销 | Ctrl+Z | Cmd+Z | 有效 |
| 重做 | Ctrl+Y | Cmd+Shift+Z | 有效 |
| 全选 | Ctrl+A | Cmd+A | 有效 |
| 查找 | Ctrl+F | Cmd+F | 仅当 Web 应用实现时 |
| 保存 | Ctrl+S | Cmd+S | 仅当 Web 应用实现时 |
| 刷新 | F5 或 Ctrl+R | Cmd+R | 改用 `await tab.refresh()` |

### 浏览器快捷键（通过 CDP 无法使用）

| 操作 | 快捷键 | 改用 |
|------|--------|------|
| 新标签 | Ctrl+T | `await browser.new_tab()` |
| 关闭标签 | Ctrl+W | `await tab.close()` |
| 重新打开标签 | Ctrl+Shift+T | 手动跟踪标签 |
| 开发者工具 | F12, Ctrl+Shift+I | 已经可以通过 CDP 访问！ |
| 地址栏 | Ctrl+L | `await tab.go_to(url)` |

### 所有可用按键

| 类别 | 按键 |
|------|------|
| **字母** | `Key.A` 到 `Key.Z` (26 个键) |
| **数字** | `Key.DIGIT0` 到 `Key.DIGIT9` (10 个键) |
| **数字键盘** | `Key.NUMPAD0` 到 `Key.NUMPAD9`, `NUMPADMULTIPLY`, `NUMPADADD`, `NUMPADSUBTRACT`, `NUMPADDECIMAL`, `NUMPADDIVIDE` |
| **功能键** | `Key.F1` 到 `Key.F12` (12 个键) |
| **导航** | `ARROWUP`, `ARROWDOWN`, `ARROWLEFT`, `ARROWRIGHT`, `HOME`, `END`, `PAGEUP`, `PAGEDOWN` |
| **修饰键** | `CONTROL`, `SHIFT`, `ALT`, `META` |
| **特殊键** | `ENTER`, `TAB`, `SPACE`, `BACKSPACE`, `DELETE`, `ESCAPE`, `INSERT` |
| **锁定键** | `CAPSLOCK`, `NUMLOCK`, `SCROLLLOCK` |
| **符号** | `SEMICOLON`, `EQUALSIGN`, `COMMA`, `MINUS`, `PERIOD`, `SLASH`, `GRAVEACCENT`, `BRACKETLEFT`, `BACKSLASH`, `BRACKETRIGHT`, `QUOTE` |

### 修饰符标志值

| 修饰符 | 值 | 二进制 | 用法 |
|--------|---|--------|------|
| Alt | 1 | 0001 | `modifiers=1` |
| Ctrl | 2 | 0010 | `modifiers=2` |
| Meta | 4 | 0100 | `modifiers=4` |
| Shift | 8 | 1000 | `modifiers=8` |
| Ctrl+Shift | 10 | 1010 | `modifiers=10` |
| Ctrl+Alt | 3 | 0011 | `modifiers=3` |
| Ctrl+Shift+Alt | 11 | 1011 | `modifiers=11` |

## 从 WebElement 方法迁移

先前在 `WebElement` 上的键盘方法已弃用。以下是如何迁移:

### 旧 vs 新

```python
from pydoll.constants import Key

# 旧（已弃用）
element = await tab.find(id='input')
await element.key_down(Key.A, modifiers=2)
await element.key_up(Key.A)
await element.press_keyboard_key(Key.ENTER)

# 新（推荐）
await tab.keyboard.down(Key.A, modifiers=2)
await tab.keyboard.up(Key.A)
await tab.keyboard.press(Key.ENTER)
```

!!! warning "弃用通知"
    以下 `WebElement` 方法已弃用:

    - `key_down()` → 使用 `tab.keyboard.down()`
    - `key_up()` → 使用 `tab.keyboard.up()`
    - `press_keyboard_key()` → 使用 `tab.keyboard.press()`
    
    这些方法仍然可以工作以保持向后兼容性，但会显示弃用警告。

### 为什么要迁移？

- **集中化**: 所有键盘操作在一个地方
- **更清晰的 API**: 所有键盘操作的一致接口
- **更强大**: 快捷键支持，智能修饰符检测
- **更好的类型支持**: 完整的 IDE 自动完成支持

## 了解更多

有关其他自动化功能:

- **[人性化交互](human-interactions.md)**: 真实的点击、滚动和鼠标移动
- **[表单处理](form-handling.md)**: 完整的表单自动化工作流程
- **[文件操作](file-operations.md)**: 文件上传自动化

键盘 API 消除了键盘自动化的复杂性，为从简单按键到复杂快捷键和序列的所有内容提供了干净、可靠的方法。


================================================
FILE: docs/zh/features/automation/mouse-control.md
================================================
# 鼠标控制

鼠标API提供页面级别的完整鼠标输入控制，支持模拟逼真的光标移动、点击、双击和拖拽操作。当传入`humanize=True`时，鼠标操作使用人性化模拟：路径遵循自然贝塞尔曲线，配合菲茨定律时序、最小急动速度曲线、生理性手抖和过冲修正，使自动化操作几乎无法与人类行为区分。

!!! info "集中式鼠标接口"
    所有鼠标操作均通过`tab.mouse`访问，为所有鼠标交互提供简洁统一的API。

## 快速开始

```python
from pydoll.browser.chromium import Chrome
from pydoll.protocol.input.types import MouseButton

async with Chrome() as browser:
    tab = await browser.start()
    await tab.go_to('https://example.com')

    # 移动光标到指定位置
    await tab.mouse.move(500, 300)

    # 在指定位置点击
    await tab.mouse.click(500, 300)

    # 右键点击
    await tab.mouse.click(500, 300, button=MouseButton.RIGHT)

    # 双击
    await tab.mouse.double_click(500, 300)

    # 从一个位置拖拽到另一个位置
    await tab.mouse.drag(100, 200, 500, 400)
```

## 核心方法

### move: 移动光标

将鼠标光标移动到页面上的指定位置：

```python
# 默认移动（单个CDP事件，无模拟）
await tab.mouse.move(500, 300)

# 人性化移动（自然时序的曲线路径）
await tab.mouse.move(500, 300, humanize=True)
```

**参数：**

- `x`：目标X坐标（CSS像素）
- `y`：目标Y坐标（CSS像素）
- `humanize`（仅关键字）：模拟人类般的曲线移动（默认：`False`）

### click: 在指定位置点击

移动到指定位置并执行鼠标点击：

```python
from pydoll.protocol.input.types import MouseButton

# 左键点击（默认，瞬时）
await tab.mouse.click(500, 300)

# 右键点击
await tab.mouse.click(500, 300, button=MouseButton.RIGHT)

# 通过click_count实现双击
await tab.mouse.click(500, 300, click_count=2)

# 人性化点击，自然移动
await tab.mouse.click(500, 300, humanize=True)
```

**参数：**

- `x`：目标X坐标
- `y`：目标Y坐标
- `button`（仅关键字）：鼠标按钮，可选 `LEFT`、`RIGHT`、`MIDDLE`（默认：`LEFT`）
- `click_count`（仅关键字）：点击次数（默认：`1`）
- `humanize`（仅关键字）：模拟人类般的行为（默认：`False`）

### double_click: 在指定位置双击

等价于`click(x, y, click_count=2)`的便捷方法：

```python
await tab.mouse.double_click(500, 300)
await tab.mouse.double_click(500, 300, humanize=True)
```

### down / up: 底层按钮控制

独立按下或释放鼠标按钮：

```python
# 在当前位置按下左键
await tab.mouse.down()

# 释放左键
await tab.mouse.up()

# 右键
await tab.mouse.down(button=MouseButton.RIGHT)
await tab.mouse.up(button=MouseButton.RIGHT)
```

这些是底层原语，在当前光标位置操作，没有`humanize`参数。

### drag: 拖放

按住鼠标按钮从起点移动到终点：

```python
# 默认拖拽（瞬时）
await tab.mouse.drag(100, 200, 500, 400)

# 人性化拖拽，自然移动
await tab.mouse.drag(100, 200, 500, 400, humanize=True)
```

**参数：**

- `start_x`、`start_y`：起始坐标
- `end_x`、`end_y`：结束坐标
- `humanize`（仅关键字）：模拟人类般的拖拽（默认：`False`）

## 启用人性化

所有鼠标方法默认使用`humanize=False`。要启用带有自然贝塞尔曲线路径和真实时序的人性化模拟，传入`humanize=True`：

```python
# 人性化移动，菲茨定律时序的自然曲线路径
await tab.mouse.move(500, 300, humanize=True)

# 人性化点击：曲线移动+点击前停顿+按下+释放
await tab.mouse.click(500, 300, humanize=True)

# 人性化拖拽，自然曲线和停顿
await tab.mouse.drag(100, 200, 500, 400, humanize=True)
```

当规避检测很重要时推荐使用，例如与采用机器人检测的网站交互时。

## 人性化模式

当传入`humanize=True`时，鼠标模块应用多层逼真效果：

### 贝塞尔曲线路径

鼠标沿自然曲线轨迹移动，而非直线。控制点在起点→终点连线的垂直方向上随机偏移，采用非对称放置（移动初期曲率更大，模拟真实的弹道伸展）。

### 菲茨定律时序

移动持续时间遵循菲茨定律：`MT = a + b × log₂(D/W + 1)`。距离越远所需时间成比例增加，符合人类运动控制行为。

### 最小急动速度曲线

光标遵循钟形速度曲线，起始缓慢，中间加速到峰值速度，然后在末尾减速。这符合最平滑的人类运动轨迹。

### 生理性手抖

每帧添加小幅高斯噪声（σ ≈ 1像素），模拟手部震颤。颤抖幅度与速度成反比，光标缓慢或悬停时颤抖更多，快速弹道运动时颤抖减少。

### 过冲与修正

对于快速长距离移动（约70%概率），光标会超过目标3–12%的距离，然后做一个小的修正子运动回到目标。这符合真实人类运动控制数据。

### 点击前停顿

人性化点击包含点击前停顿（50–200毫秒），模拟按下按钮前的自然稳定时间。

## 自动人性化元素点击

当您使用`element.click(humanize=True)`时，鼠标API会从当前光标位置到元素中心产生逼真的贝塞尔曲线运动后再点击，使元素点击与人类行为无法区分。

```python
# 默认点击：原始CDP按下/释放
button = await tab.find(id='submit')
await button.click()

# 带中心偏移
await button.click(x_offset=10, y_offset=5)

# 人性化点击：贝塞尔曲线运动+点击
await button.click(humanize=True)
```

位置追踪在元素点击之间保持。点击元素A，然后点击元素B，会产生从A到B的自然曲线路径。

## 自定义时序配置

所有人性化参数均可通过`MouseTimingConfig`配置：

```python
from pydoll.interactions.mouse import MouseTimingConfig

config = MouseTimingConfig(
    fitts_a=0.070,              # 菲茨定律截距（秒）
    fitts_b=0.150,              # 菲茨定律斜率（秒/比特）
    frame_interval=0.012,       # mouseMoved事件间的基础间隔
    curvature_min=0.10,         # 最小路径曲率（距离的分数）
    curvature_max=0.30,         # 最大路径曲率
    tremor_amplitude=1.0,       # 颤抖sigma值（像素）
    overshoot_probability=0.70, # 快速移动时过冲的概率
    min_duration=0.08,          # 最小移动持续时间
    max_duration=2.5,           # 最大移动持续时间
)

# 应用到tab的鼠标实例
tab.mouse.timing = config
```

查看`MouseTimingConfig`数据类了解所有可用参数。

## 位置追踪

鼠标API在操作之间追踪光标位置：

```python
# 初始位置为(0, 0)
await tab.mouse.move(100, 200)
# 位置现在是(100, 200)

await tab.mouse.click(300, 400)
# 位置现在是(300, 400)

# 底层方法使用追踪的位置
await tab.mouse.down()   # 在(300, 400)按下
await tab.mouse.up()     # 在(300, 400)释放
```

!!! note "位置状态"
    鼠标位置在内部追踪。`WebElement.click()`在可用时自动使用`tab.mouse`，因此位置追踪在元素点击之间保持一致。

## 调试模式

启用调试模式以在页面上可视化鼠标移动。激活后，彩色点将绘制在透明覆盖画布上：

- **蓝色点**：移动过程中的光标路径
- **红色点**：点击位置

```python
# 通过属性在运行时启用
tab.mouse.debug = True

# 现在所有移动都会绘制彩色点
await tab.mouse.click(500, 300)

# 完成后禁用
tab.mouse.debug = False
```

这对于调整时序参数和验证路径是否自然很有用。

## 实用示例

### 以逼真移动点击按钮

```python
async def click_button_naturally(tab):
    # 传入 humanize=True 后，element.click() 会通过 tab.mouse 进行人性化移动
    button = await tab.find(id='submit')
    await button.click(humanize=True)
```

### 拖动滑块

```python
async def drag_slider(tab):
    slider = await tab.find(css_selector='.slider-handle')
    bounds = await slider.get_bounds_using_js()

    start_x = bounds['x'] + bounds['width'] / 2
    start_y = bounds['y'] + bounds['height'] / 2
    end_x = start_x + 200  # 向右拖拽200像素

    await tab.mouse.drag(start_x, start_y, end_x, start_y)
```

### 悬停在元素上

```python
async def hover_menu(tab):
    menu = await tab.find(css_selector='.dropdown-trigger')
    bounds = await menu.get_bounds_using_js()

    await tab.mouse.move(
        bounds['x'] + bounds['width'] / 2,
        bounds['y'] + bounds['height'] / 2,
    )
    # 菜单现在应通过CSS :hover可见
```

## 了解更多

- **[类人交互](human-interactions.md)**：所有人性化交互的概述
- **[键盘控制](keyboard-control.md)**：逼真的键盘模拟


================================================
FILE: docs/zh/features/automation/screenshots-and-pdfs.md
================================================
# 截图与PDF

Pydoll通过直接使用Chrome DevTools Protocol命令提供强大的截图和PDF生成功能。可以捕获完整页面、特定元素或生成具有精细控制的PDF。

## 截图

### 基础页面截图

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def take_page_screenshot():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com')
        
        # 保存截图到文件
        await tab.take_screenshot('page.png', quality=100)

asyncio.run(take_page_screenshot())
```

### 支持的格式

Pydoll基于文件扩展名支持三种图像格式：

```python
# PNG格式（无损，文件较大）
await tab.take_screenshot('screenshot.png', quality=100)

# JPEG格式（有损，文件较小）
await tab.take_screenshot('screenshot.jpeg', quality=85)

# WebP格式（现代、高效）
await tab.take_screenshot('screenshot.webp', quality=90)
```

!!! info "格式检测"
    图像格式由文件扩展名自动确定。使用不支持的扩展名会引发`InvalidFileExtension`异常。
    
    JPEG格式同时支持`.jpg`和`.jpeg`（`.jpg`会自动在内部标准化为`.jpeg`以匹配CDP要求）。

### 截图参数

| 参数 | 类型 | 默认值 | 描述 |
|-----------|------|---------|-------------|
| `path` | `Optional[str]` | `None` | 保存截图的文件路径。如果`as_base64=False`则为必需。 |
| `quality` | `int` | `100` | 图像质量（0-100）。值越高质量越好，文件越大。 |
| `beyond_viewport` | `bool` | `False` | 捕获整个可滚动页面，而不仅仅是可见区域。 |
| `as_base64` | `bool` | `False` | 返回base64编码的字符串而不是保存到文件。 |

### 完整页面截图

捕获超出可见视口的内容：

```python
async def full_page_screenshot():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com/long-page')
        
        # 捕获整个页面，包括折叠下方的内容
        await tab.take_screenshot(
            'full-page.png',
            beyond_viewport=True,
            quality=90
        )
```

!!! warning "性能注意"
    在非常长的页面上使用`beyond_viewport=True`可能会消耗大量内存并需要更长的处理时间。

### Base64截图

获取截图的base64字符串用于嵌入或通过API发送：

```python
async def base64_screenshot():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com')
        
        # 获取截图的base64字符串
        screenshot_base64 = await tab.take_screenshot(
            as_base64=True
        )
        
        # 在HTML img标签中使用
        html = f'<img src="data:image/png;base64,{screenshot_base64}" />'
        
        # 或通过API发送
        import aiohttp
        async with aiohttp.ClientSession() as session:
            await session.post(
                'https://api.example.com/upload',
                json={'image': screenshot_base64}
            )
```

### 元素截图

捕获特定元素而非整个页面：

```python
async def element_screenshot():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com')
        
        # 截取特定元素（PNG）
        header = await tab.find(tag_name='header')
        await header.take_screenshot('header.png', quality=100)
        
        # 截取表单（JPEG）
        form = await tab.find(id='login-form')
        await form.take_screenshot('login-form.jpeg', quality=85)
        
        # 截取图表或图形（WebP）
        chart = await tab.find(class_name='data-visualization')
        await chart.take_screenshot('chart.webp', quality=90)
```

!!! info "格式检测"
    图像格式自动从文件扩展名（`.png`、`.jpeg`/`.jpg`或`.webp`）检测。使用不支持的扩展名会引发`InvalidFileExtension`异常。

!!! tip "自动滚动"
    捕获元素截图时，Pydoll会在截图前自动将元素滚动到视图中。

### 元素截图 vs 页面截图

| 功能 | `tab.take_screenshot()` | `element.take_screenshot()` |
|---------|------------------------|----------------------------|
| **范围** | 整个视口或页面 | 仅特定元素 |
| **格式支持** | PNG, JPEG, WebP | PNG, JPEG, WebP |
| **超出视口** | ✅ 支持 | ❌ 不适用 |
| **Base64输出** | ✅ 支持 | ✅ 支持 |
| **自动滚动** | ❌ 不适用 | ✅ 是 |
| **使用场景** | 完整页面捕获 | 组件隔离、测试 |


## PDF生成

### 基础PDF导出

将页面转换为打印质量的PDF输出：

```python
import asyncio
from pathlib import Path
from pydoll.browser.chromium import Chrome

async def generate_pdf():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com/document')
        
        # 使用Path生成PDF
        await tab.print_to_pdf(Path('document.pdf'))
        
        # 或使用字符串
        await tab.print_to_pdf('document.pdf')

asyncio.run(generate_pdf())
```

### PDF参数

| 参数 | 类型 | 默认值 | 描述 |
|-----------|------|---------|-------------|
| `path` | `Optional[str \| Path]` | `None` | 保存PDF的文件路径。如果`as_base64=False`则为必需。 |
| `landscape` | `bool` | `False` | 使用横向方向（相对于纵向）。 |
| `display_header_footer` | `bool` | `False` | 包含浏览器生成的页眉/页脚，带有标题、URL、页码。 |
| `print_background` | `bool` | `True` | 包含背景图形和颜色。 |
| `scale` | `float` | `1.0` | 页面缩放因子（0.1-2.0）。用于放大/缩小效果。 |
| `as_base64` | `bool` | `False` | 返回base64编码的字符串而不是保存到文件。 |

!!! tip "Path vs 字符串"
    虽然推荐使用`pathlib`的`Path`对象作为最佳实践以获得更好的路径处理和跨平台兼容性，但如果您愿意，也可以使用普通字符串。

### 高级PDF选项

```python
import asyncio
from pathlib import Path
from pydoll.browser.chromium import Chrome

async def advanced_pdf():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com/report')
        
        # 带页眉/页脚的横向PDF
        await tab.print_to_pdf(
            Path('report-landscape.pdf'),
            landscape=True,
            display_header_footer=True,
            print_background=True,
            scale=0.9
        )
        
        # 无背景的纵向PDF（节省墨水）
        await tab.print_to_pdf(
            Path('report-ink-friendly.pdf'),
            landscape=False,
            print_background=False,
            scale=1.0
        )

asyncio.run(advanced_pdf())
```

### PDF缩放因子

控制PDF输出的缩放级别：

```python
import asyncio
from pathlib import Path
from pydoll.browser.chromium import Chrome

async def scaled_pdfs():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com/content')
        
        # 缩小内容以在每页上容纳更多
        await tab.print_to_pdf(Path('compact.pdf'), scale=0.7)
        
        # 正常缩放
        await tab.print_to_pdf(Path('normal.pdf'), scale=1.0)
        
        # 放大内容（页数更少）
        await tab.print_to_pdf(Path('large.pdf'), scale=1.5)

asyncio.run(scaled_pdfs())
```

!!! warning "缩放限制"
    `scale`参数接受`0.1`到`2.0`之间的值。超出此范围的值可能产生意外结果。

### Base64 PDF

生成PDF的base64字符串用于API传输：

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def base64_pdf():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com/invoice')
        
        # 获取PDF的base64（无需路径）
        pdf_base64 = await tab.print_to_pdf(as_base64=True)
        
        # 通过API发送
        import aiohttp
        async with aiohttp.ClientSession() as session:
            await session.post(
                'https://api.example.com/invoices',
                json={'pdf': pdf_base64}
            )

asyncio.run(base64_pdf())
```


!!! info "CDP参考"
    有关这些命令的完整CDP文档，请参阅：
    
    - [Page.captureScreenshot](https://chromedevtools.github.io/devtools-protocol/tot/Page/#method-captureScreenshot)
    - [Page.printToPDF](https://chromedevtools.github.io/devtools-protocol/tot/Page/#method-printToPDF)

### 错误处理

```python
from pydoll.exceptions import (
    InvalidFileExtension,
    MissingScreenshotPath,
    TopLevelTargetRequired
)

async def safe_screenshot():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com')
        
        try:
            # 缺少路径且as_base64=False
            await tab.take_screenshot()
        except MissingScreenshotPath:
            print("错误：必须提供路径或设置as_base64=True")
        
        try:
            # 无效的扩展名
            await tab.take_screenshot('image.bmp')
        except InvalidFileExtension as e:
            print(f"错误：{e}")
        
        # IFrame截图限制
        iframe_element = await tab.find(tag_name='iframe')

        # 仍然无效：顶层截图不会包含 iframe 内容
        # await tab.take_screenshot('frame.png')

        # 选择 iframe 内部的元素进行截图
        content = await iframe_element.find(id='content')
        await content.take_screenshot('iframe-content.png')
```

## 页面打包导出

将整个页面及其所有资源（CSS、JS、图片、字体）保存为 `.zip` 压缩包，支持离线查看。

### 基本用法

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def save_page():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com')

        # 将页面和资源保存为独立文件
        await tab.save_bundle('page.zip')

asyncio.run(save_page())
```

生成的 zip 包含一个 `index.html`，所有 URL 已被重写为引用 `assets/` 目录下的本地文件。

### 内联模式

使用 data URI、`<style>` 和 `<script>` 标签将所有内容直接嵌入到单个 `index.html` 中：

```python
# zip 中只包含一个自包含的 HTML 文件
await tab.save_bundle('page-inline.zip', inline_assets=True)
```

### 参数

| 参数 | 类型 | 默认值 | 描述 |
|------|------|--------|------|
| `path` | `str \| Path` | *（必填）* | 目标路径，必须以 `.zip` 结尾。 |
| `inline_assets` | `bool` | `False` | 将所有资源内联嵌入，而非保存为独立文件。 |

!!! info "打包包含的内容"
    打包包括以下类型的资源：Document、Stylesheet、Script、Image、Font 和 Media。加载失败、已取消或使用 `data:` URI 的资源会被自动跳过。

## 了解更多

有关截图和PDF如何与Pydoll架构集成的更多信息：

- **[深入探讨：CDP](../../deep-dive/fundamentals/cdp.md)**：理解Chrome DevTools Protocol命令
- **[API参考：Tab](../../api/browser/tab.md#take_screenshot)**：完整的方法签名和参数
- **[API参考：WebElement](../../api/elements/web_element.md#take_screenshot)**：元素特定的截图能力

截图和PDF是自动化、测试和文档编制的必备工具。Pydoll的直接CDP集成提供专业级输出和精细控制。


================================================
FILE: docs/zh/features/browser-management/contexts.md
================================================
# 浏览器上下文

浏览器上下文是Pydoll在单个浏览器进程内创建完全隔离的浏览环境的解决方案。可以将它们视为独立的"隐私窗口"，但具有完全的编程控制，每个上下文维护自己的Cookie、存储、缓存和认证状态。

## 快速入门

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def basic_context_example():
    async with Chrome() as browser:
        # 在默认上下文中启动浏览器并创建初始标签页
        initial_tab = await browser.start()
        await initial_tab.go_to('https://example.com')
        
        # 创建隔离的上下文
        context_id = await browser.create_browser_context()
        
        # 在隔离上下文中创建新标签页
        isolated_tab = await browser.new_tab('https://example.com', browser_context_id=context_id)
        
        # 两个标签页完全隔离 - 不同的Cookie、存储等
        await initial_tab.execute_script("localStorage.setItem('user', 'Alice')")
        await isolated_tab.execute_script("localStorage.setItem('user', 'Bob')")
        
        # 验证隔离
        user_default = await initial_tab.execute_script("return localStorage.getItem('user')")
        user_isolated = await isolated_tab.execute_script("return localStorage.getItem('user')")
        
        print(f"默认上下文: {user_default}")  # Alice
        print(f"隔离上下文: {user_isolated}")  # Bob

asyncio.run(basic_context_example())
```

## 什么是浏览器上下文？

浏览器上下文是单个浏览器进程内的隔离浏览环境。每个上下文维护完全独立的：

| 组件 | 描述 | 隔离级别 |
|-----------|-------------|-----------------|
| **Cookie** | HTTP Cookie和会话数据 | ✓ 完全隔离 |
| **本地存储** | `localStorage`和`sessionStorage` | ✓ 完全隔离 |
| **IndexedDB** | 客户端数据库 | ✓ 完全隔离 |
| **缓存** | HTTP缓存和资源 | ✓ 完全隔离 |
| **权限** | 地理位置、通知、摄像头等 | ✓ 完全隔离 |
| **认证** | 登录会话和认证令牌 | ✓ 完全隔离 |
| **Service Workers** | 后台脚本 | ✓ 完全隔离 |

```mermaid
graph LR
    Browser[浏览器进程] --> Default[默认上下文]
    Browser --> Context1[上下文1]
    Browser --> Context2[上下文2]
    
    Default --> T1[标签A]
    Default --> T2[标签B]
    Context1 --> T3[标签C]
    Context2 --> T4[标签D]
```

## 为什么使用浏览器上下文？

### 1. 多账户测试

同时测试不同的用户账户而不产生干扰：

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def perform_login(tab, email, password):
    """
    辅助函数：导航到登录页面
    并提交账户凭据。
    """
    print(f"尝试使用以下账户登录：{email}...")
    await tab.go_to('https://app.example.com/login')

    # 查找元素
    email_field = await tab.find(id='email')
    password_field = await tab.find(id='password')
    login_btn = await tab.find(id='login-btn')

    # 填写凭据并点击
    await email_field.type_text(email)
    await password_field.type_text(password)
    await login_btn.click()

    # 等待登录处理
    await asyncio.sleep(2)
    print(f"{email} 登录成功。")


async def multi_account_test():
    """
    使用隔离的浏览器上下文
    测试同时登录的主脚本。
    """
    accounts = [
        {"email": "user1@example.com", "password": "pass1"},
        {"email": "user2@example.com", "password": "pass2"},
        {"email": "admin@example.com", "password": "admin_pass"}
    ]

    # 此列表将存储每个活动用户会话的信息
    user_sessions = []

    async with Chrome() as browser:
        first_account = accounts[0]
        initial_tab = await browser.start()
        await perform_login(initial_tab, first_account['email'], first_account['password'])
        user_sessions.append({
            "email": first_account['email'],
            "tab": initial_tab,
            "context_id": None  # 'None' 表示默认浏览器上下文
        })

        # 遍历其余账户
        for account in accounts[1:]:
            context_id = await browser.create_browser_context()
            new_tab = await browser.new_tab(browser_context_id=context_id)
            await perform_login(new_tab, account['email'], account['password'])

            # 将新会话信息添加到列表
            user_sessions.append({
                "email": account['email'],
                "tab": new_tab,
                "context_id": context_id
            })

        print("\n--- 验证所有活动会话 ---")
        for session in user_sessions:
            tab = session["tab"]
            email = session["email"]
            await tab.go_to('https://app.example.com/dashboard')
            username = await tab.find(class_name='username')
            username_text = await username.text
            print(f"[账户：{email}] -> 登录为：{username_text}")
            await asyncio.sleep(0.5)

        print("\n--- 清理上下文 ---")
        for session in user_sessions:
            # 仅关闭我们创建的上下文（非None）
            if session["context_id"] is not None:
                print(f"关闭上下文：{session['email']}")
                await session["tab"].close()
                await browser.delete_browser_context(session["context_id"])
        
        # 默认上下文（None）由
        # 'async with Chrome() as browser' 自动关闭

asyncio.run(multi_account_test())
```

### 2. 使用上下文特定代理的地理位置测试

每个上下文可以拥有自己的代理配置：

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def geo_location_testing():
    async with Chrome() as browser:
        # 启动浏览器并使用初始标签页进行第一个测试（默认上下文，无代理）
        initial_tab = await browser.start()
        await initial_tab.go_to('https://api.ipify.org')
        await asyncio.sleep(2)
        default_ip = await initial_tab.execute_script('return document.body.textContent')
        print(f"默认IP（无代理）：{default_ip}")
        
        # 带美国代理的美国上下文
        us_context = await browser.create_browser_context(
            proxy_server='http://us-proxy.example.com:8080'
        )
        us_tab = await browser.new_tab('https://api.ipify.org', browser_context_id=us_context)
        await asyncio.sleep(2)
        us_ip = await us_tab.execute_script('return document.body.textContent')
        print(f"美国IP：{us_ip}")
        
        # 带欧盟代理的欧盟上下文
        eu_context = await browser.create_browser_context(
            proxy_server='http://eu-proxy.example.com:8080'
        )
        eu_tab = await browser.new_tab('https://api.ipify.org', browser_context_id=eu_context)
        await asyncio.sleep(2)
        eu_ip = await eu_tab.execute_script('return document.body.textContent')
        print(f"欧盟IP：{eu_ip}")
        
        # 清理（跳过初始标签页）
        await us_tab.close()
        await eu_tab.close()
        await browser.delete_browser_context(us_context)
        await browser.delete_browser_context(eu_context)

asyncio.run(geo_location_testing())
```

!!! tip "代理认证"
    Pydoll自动处理上下文的代理认证。只需在URL中包含凭据：
    ```python
    context_id = await browser.create_browser_context(
        proxy_server='http://username:password@proxy.example.com:8080'
    )
    ```
    凭据会从发送的CDP命令中剔除，仅在浏览器要求认证时才使用。

### 3. A/B测试

并行比较不同的用户体验：

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def ab_testing():
    async with Chrome() as browser:
        # 启动浏览器并创建初始标签页（默认上下文中的对照组）
        initial_tab = await browser.start()
        await initial_tab.go_to('https://example.com')
        await initial_tab.execute_script("localStorage.setItem('experiment', 'control')")
        
        # 隔离上下文中的实验组
        context_b = await browser.create_browser_context()
        tab_b = await browser.new_tab('https://example.com', browser_context_id=context_b)
        await tab_b.execute_script("localStorage.setItem('experiment', 'treatment')")
        
        # 将两者导航到功能页面
        await initial_tab.go_to('https://example.com/feature')
        await tab_b.go_to('https://example.com/feature')
        
        # 比较结果
        result_a = await initial_tab.find(class_name='experiment-result')
        result_b = await tab_b.find(class_name='experiment-result')
        
        print(f"对照组结果：{await result_a.text}")
        print(f"实验组结果：{await result_b.text}")
        
        # 清理
        await tab_b.close()
        await browser.delete_browser_context(context_b)

asyncio.run(ab_testing())
```

### 4. 并行网页抓取

使用不同配置抓取多个网站：

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def parallel_scraping():
    websites = [
        {'url': 'https://news.ycombinator.com', 'selector': '.storylink'},
        {'url': 'https://reddit.com/r/python', 'selector': '.title'},
        {'url': 'https://github.com/trending', 'selector': '.h3'},
    ]
    
    async with Chrome() as browser:
        # 启动浏览器并获取初始标签页
        initial_tab = await browser.start()
        
        # 为其余网站创建上下文（第一个使用默认上下文）
        contexts = [None] + [await browser.create_browser_context() for _ in websites[1:]]
        
        # 创建标签页（为第一个网站重用初始标签页）
        tabs = [initial_tab] + [
            await browser.new_tab(browser_context_id=ctx) for ctx in contexts[1:]
        ]
        
        async def scrape_site(tab, site, context_id):
            """在给定的标签页和上下文内抓取单个网站"""
            try:
                await tab.go_to(site['url'])
                await asyncio.sleep(3)
                
                # 使用CSS选择器提取标题
                elements = await tab.query(site['selector'], find_all=True)
                titles = [await elem.text for elem in elements[:5]]
                
                return {'url': site['url'], 'titles': titles}
            finally:
                # 清理上下文（跳过初始标签页的默认上下文）
                if context_id is not None:
                    await tab.close()
                    await browser.delete_browser_context(context_id)
        
        # 并发抓取所有网站
        results = await asyncio.gather(*[
            scrape_site(tab, site, ctx) for tab, site, ctx in zip(tabs, websites, contexts)
        ])
        
        # 显示结果
        for result in results:
            print(f"\n{result['url']}:")
            for i, title in enumerate(result['titles'], 1):
                print(f"  {i}. {title}")

asyncio.run(parallel_scraping())
```

## 理解上下文性能

### 上下文是轻量级的

!!! info "性能特征"
    创建浏览器上下文比启动新的浏览器进程**快得多，也更轻量**：
    
    - **上下文创建**：约50-100毫秒，内存开销最小
    - **新浏览器进程**：约2-5秒，基础内存50-150 MB
    
    对于10个隔离环境：

    - **1个浏览器中的10个上下文**：约500毫秒启动，总计约500 MB
    - **10个独立浏览器**：约30秒启动，总计约1-1.5 GB

```python
import asyncio
import time
from pydoll.browser.chromium import Chrome

async def benchmark_contexts_vs_browsers():
    # 基准测试：仅测量上下文创建耗时（不含浏览器启动时间）
    async with Chrome() as browser:
        # 启动浏览器（此示例中未使用初始标签页）
        await browser.start()
        
        # 浏览器启动完成后再开始计时
        start = time.time()
        
        contexts = []
        for i in range(10):
            context_id = await browser.create_browser_context()
            contexts.append(context_id)
        
        print(f"创建10个上下文耗时：{time.time() - start:.2f}秒")
        
        # 清理
        for context_id in contexts:
            await browser.delete_browser_context(context_id)

asyncio.run(benchmark_contexts_vs_browsers())
```

### 无头模式 vs 有头模式：窗口行为

!!! warning "重要：有头模式中的上下文窗口"
    在**有头模式**（可见的浏览器UI）下运行时，有一个重要的行为需要理解：
    
    **在新上下文中创建的第一个标签页将打开一个新的操作系统窗口。**
    
    - 这是因为上下文需要一个"宿主窗口"来渲染其第一个页面
    - 该上下文中的后续标签页可以作为该窗口内的标签页打开
    - 这是CDP/Chromium的限制，而非Pydoll的设计选择
    
    **在无头模式下**，这不重要——不会创建窗口，一切都在后台运行。

```python
import asyncio
from pydoll.browser.chromium import Chrome
from pydoll.browser.options import ChromiumOptions

async def demonstrate_window_behavior():
    # 有头模式 - 将看到窗口
    options_headed = ChromiumOptions()
    options_headed.headless = False
    
    async with Chrome(options=options_headed) as browser:
        # 启动浏览器并创建初始标签页（在默认上下文中打开第一个窗口）
        initial_tab = await browser.start()
        await initial_tab.go_to('https://example.com')
        
        # 创建新上下文 - 第一个标签页将打开一个新窗口
        context = await browser.create_browser_context()
        tab2 = await browser.new_tab('https://github.com', browser_context_id=context)
        
        # 同一上下文中的第二个标签页 - 在现有窗口中作为标签页打开
        tab3 = await browser.new_tab('https://google.com', browser_context_id=context)
        
        await asyncio.sleep(10)  # 观察窗口
        
        await tab2.close()
        await tab3.close()
        await browser.delete_browser_context(context)

# 无头模式 - 无窗口，上下文不可见但仍然隔离
async def headless_contexts():
    options = ChromiumOptions()
    options.headless = True  # 无可见窗口
    
    async with Chrome(options=options) as browser:
        # 在默认上下文中启动浏览器并创建初始标签页
        initial_tab = await browser.start()
        await initial_tab.go_to('https://example.com/page0')
        
        # 再创建4个上下文 - 未打开窗口，全部在后台
        contexts = []
        for i in range(1, 5):
            context_id = await browser.create_browser_context()
            tab = await browser.new_tab(f'https://example.com/page{i}', browser_context_id=context_id)
            contexts.append((context_id, tab))
        
        print(f"创建了{len(contexts) + 1}个隔离上下文（1个默认 + {len(contexts)}个自定义，不可见）")
        
        # 清理
        for context_id, tab in contexts:
            await tab.close()
            await browser.delete_browser_context(context_id)

asyncio.run(headless_contexts())
```

!!! tip "最佳实践：对上下文使用无头模式"
    为了在多个上下文中实现最大效率：
    
    - **开发/调试**：使用有头模式查看发生的情况
    - **生产/CI/CD**：使用无头模式以获得更快、更轻量的执行
    - **多个上下文**：强烈建议使用无头模式以避免窗口管理的复杂性

## 上下文管理

### 创建上下文

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def create_context_example():
    async with Chrome() as browser:
        await browser.start()
        
        # 创建基本上下文
        context_id = await browser.create_browser_context()
        print(f"已创建上下文：{context_id}")
        
        # 创建带代理的上下文
        proxied_context = await browser.create_browser_context(
            proxy_server='http://proxy.example.com:8080',
            proxy_bypass_list='localhost,127.0.0.1'
        )
        print(f"已创建代理上下文：{proxied_context}")
        
        # 创建带认证代理的上下文
        auth_context = await browser.create_browser_context(
            proxy_server='http://user:pass@proxy.example.com:8080'
        )
        print(f"已创建认证上下文：{auth_context}")

asyncio.run(create_context_example())
```

### 列出上下文

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def list_contexts():
    async with Chrome() as browser:
        await browser.start()
        
        # 获取所有上下文（包括默认上下文）
        contexts = await browser.get_browser_contexts()
        print(f"初始上下文：{len(contexts)}")  # 通常为1（默认）
        
        # 创建额外的上下文
        context1 = await browser.create_browser_context()
        context2 = await browser.create_browser_context()
        
        # 再次列出
        contexts = await browser.get_browser_contexts()
        print(f"创建2个新上下文后：{len(contexts)}")  # 总计3个
        
        for i, context_id in enumerate(contexts):
            print(f"  上下文 {i+1}：{context_id}")
        
        # 清理
        await browser.delete_browser_context(context1)
        await browser.delete_browser_context(context2)

asyncio.run(list_contexts())
```

### 删除上下文

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def delete_context_example():
    async with Chrome() as browser:
        await browser.start()
        
        # 创建带标签页的上下文
        context_id = await browser.create_browser_context()
        tab1 = await browser.new_tab('https://example.com', browser_context_id=context_id)
        tab2 = await browser.new_tab('https://github.com', browser_context_id=context_id)
        
        print(f"已创建上下文 {context_id}，包含2个标签页")
        
        # 删除上下文会自动关闭其所有标签页
        await browser.delete_browser_context(context_id)
        print("上下文已删除（所有标签页自动关闭）")

asyncio.run(delete_context_example())
```

!!! warning "删除上下文会关闭所有标签页"
    删除浏览器上下文时，**属于该上下文的所有标签页会自动关闭**。这是一次清理多个标签页的高效方法，但请确保您已保存了任何重要数据。

## 默认上下文

每个浏览器都以包含初始标签页的**默认上下文**开始：

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def default_context_example():
    """Show that the default context and a custom context keep separate storage.

    Both tabs load the same origin on purpose: localStorage is already
    separated per origin, so only a same-origin comparison demonstrates that
    the separation comes from the browser context.
    """
    async with Chrome() as browser:
        # start() returns the initial tab, which lives in the default context
        initial_tab = await browser.start()

        # A tab created without browser_context_id uses the default context
        default_tab = await browser.new_tab('https://example.com')

        # Custom context with a tab on the SAME origin as default_tab
        custom_context = await browser.create_browser_context()
        custom_tab = await browser.new_tab('https://example.com', browser_context_id=custom_context)

        # Write a different value under the same key in each context
        await default_tab.execute_script("localStorage.setItem('type', 'default')")
        await custom_tab.execute_script("localStorage.setItem('type', 'custom')")

        # Read the values back: each context only sees what it wrote itself
        default_type = await default_tab.execute_script("return localStorage.getItem('type')")
        custom_type = await custom_tab.execute_script("return localStorage.getItem('type')")

        print(f"默认上下文：{default_type}")  # 'default'
        print(f"自定义上下文：{custom_type}")    # 'custom'

        # Only the custom context is deleted here
        await browser.delete_browser_context(custom_context)

asyncio.run(default_context_example())
```

!!! info "您无法删除默认上下文"
    默认浏览器上下文是永久性的，无法删除。它在整个浏览器会话期间存在。只有使用`create_browser_context()`创建的自定义上下文可以被删除。

## 高级模式

### 用于可重用隔离的上下文池

```python
import asyncio
from pydoll.browser.chromium import Chrome

class ContextPool:
    """Fixed-size pool of reusable browser contexts.

    Contexts are created once by ``initialize()`` and handed out by
    ``acquire()``. When every context is busy, ``acquire()`` waits for a
    ``release()`` instead of failing, so more tasks than contexts can share
    the pool (for example under ``asyncio.gather``).
    """

    def __init__(self, browser, size=5):
        self.browser = browser
        self.size = size
        self.contexts = []    # every context id owned by the pool
        self.in_use = set()   # context ids currently handed out
        self._idle = None     # asyncio.Queue of free ids, built in initialize()

    async def initialize(self):
        """Create ``size`` browser contexts and mark all of them as idle."""
        # Built here, inside the running event loop, rather than in __init__.
        self._idle = asyncio.Queue()
        for _ in range(self.size):
            context_id = await self.browser.create_browser_context()
            self.contexts.append(context_id)
            self._idle.put_nowait(context_id)
        print(f"上下文池已初始化，包含 {self.size} 个上下文")

    async def acquire(self):
        """Return an idle context id, waiting until one is released if needed.

        Raises:
            Exception: if the pool owns no contexts (not initialized, size 0,
                or already cleaned up), because waiting could never succeed.
        """
        if not self.contexts:
            raise Exception("池中没有可用的上下文")
        context_id = await self._idle.get()
        self.in_use.add(context_id)
        return context_id

    def release(self, context_id):
        """Hand a context back to the pool.

        Ids that are not currently in use are ignored, so a double release
        cannot put the same context into the idle queue twice.
        """
        if context_id in self.in_use:
            self.in_use.discard(context_id)
            self._idle.put_nowait(context_id)

    async def cleanup(self):
        """Delete every context owned by the pool and reset its state."""
        for context_id in self.contexts:
            await self.browser.delete_browser_context(context_id)
        # Forget the deleted ids so a second cleanup() does not delete again.
        self.contexts.clear()
        self.in_use.clear()
        self._idle = None

async def use_context_pool():
    async with Chrome() as browser:
        await browser.start()
        
        # 创建池
        pool = ContextPool(browser, size=3)
        await pool.initialize()
        
        # 从池中使用上下文
        async def scrape_with_pool(url):
            context_id = await pool.acquire()
            try:
                tab = await browser.new_tab(url, browser_context_id=context_id)
                await asyncio.sleep(2)
                title = await tab.execute_script('return document.title')
                await tab.close()
                return title
            finally:
                pool.release(context_id)
        
        # 使用池抓取多个URL
        urls = [f'https://example.com/page{i}' for i in range(10)]
        results = await asyncio.gather(*[scrape_with_pool(url) for url in urls])
        
        for i, title in enumerate(results):
            print(f"{urls[i]}: {title}")
        
        # 清理
        await pool.cleanup()

asyncio.run(use_context_pool())
```

### 每个上下文的配置管理器

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def context_config_manager():
    async with Chrome() as browser:
        await browser.start()
        
        # 为不同场景定义配置
        configs = {
            'us_user': {
                'proxy': 'http://us-proxy.example.com:8080',
                'user_agent': 'Mozilla/5.0 (Windows NT 10.0; Win64; x64)'
            },
            'eu_user': {
                'proxy': 'http://eu-proxy.example.com:8080',
                'user_agent': 'Mozilla/5.0 (X11; Linux x86_64)'
            },
            'mobile_user': {
                'proxy': None,
                'user_agent': 'Mozilla/5.0 (iPhone; CPU iPhone OS 14_0 like Mac OS X)'
            }
        }
        
        contexts = {}
        
        # 为每个配置创建上下文
        for name, config in configs.items():
            if config['proxy']:
                context_id = await browser.create_browser_context(
                    proxy_server=config['proxy']
                )
            else:
                context_id = await browser.create_browser_context()
            
            # 创建标签页并设置用户代理
            tab = await browser.new_tab(browser_context_id=context_id)
            # 注意：用户代理将通过CDP或选项设置，此处简化
            
            contexts[name] = {'context_id': context_id, 'tab': tab}
        
        # 为不同场景使用不同上下文
        for name, data in contexts.items():
            tab = data['tab']
            await tab.go_to('https://httpbin.org/headers')
            await asyncio.sleep(2)
            print(f"\n{name} 配置已激活")
        
        # 清理
        for data in contexts.values():
            await data['tab'].close()
            await browser.delete_browser_context(data['context_id'])

asyncio.run(context_config_manager())
```

## 最佳实践

1. **对多个上下文使用无头模式**以避免窗口管理的复杂性
2. **使用完毕后始终删除上下文**以防止内存泄漏
3. **将相关操作分组在同一上下文中**以获得更好的组织
4. **优先使用上下文而非多个浏览器进程**以获得更好的性能
5. **使用上下文池**用于需要许多短期隔离环境的场景
6. **在删除上下文前关闭标签页**以获得更干净的清理（虽然不是严格要求）

## 另请参阅

- **[多标签管理](tabs.md)** - 管理上下文中的多个标签页
- **[深入探讨：Browser域](../../deep-dive/architecture/browser-domain.md)** - 上下文的架构细节
- **[网络：HTTP请求](../network/http-requests.md)** - 浏览器上下文请求继承上下文状态
- **[核心概念](../core-concepts.md)** - 理解Pydoll的架构

浏览器上下文是Pydoll创建复杂自动化工作流的最强大功能之一。通过理解它们的工作方式——特别是有头模式下的窗口行为及其轻量级特性——您可以构建高效、可扩展的自动化，轻松处理复杂的多环境场景。


================================================
FILE: docs/zh/features/browser-management/cookies-sessions.md
================================================
# Cookie 与会话管理

有效管理 Cookie 和会话对于真实的浏览器自动化至关重要。网站使用 Cookie 来跟踪身份验证、偏好设置和用户行为，并期望浏览器能相应地表现。

## 为什么 Cookie 对自动化很重要

Cookie 不仅仅是存储的数据，它们还是浏览器活动的指纹：

- **身份验证**：会话 Cookie 在请求之间维护登录状态
- **跟踪防护**：反机器人系统分析 Cookie 模式
- **真实行为**：没有 Cookie 的浏览器看起来很可疑
- **会话持久性**：重用 Cookie 可以节省重复登录的时间

!!! warning "Cookie 悖论"
    - **太干净**：没有 Cookie 或历史记录的浏览器看起来像机器人
    - **太陈旧**：使用相同的会话数周会触发安全警报
    - **最佳点**：新鲜的 Cookie 配合偶尔的轮换和真实的活动模式

## 快速入门

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def basic_cookie_management():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com')
        
        # 设置 Cookie（使用简单的字典）
        cookies = [
            {
                'name': 'session_id',
                'value': 'abc123xyz',
                'domain': 'example.com',
                'path': '/',
                'secure': True,
                'httpOnly': True
            }
        ]
        await tab.set_cookies(cookies)
        
        # 获取所有 Cookie
        all_cookies = await browser.get_cookies()
        print(f"总 Cookie 数: {len(all_cookies)}")
        
        # 删除所有 Cookie
        await tab.delete_all_cookies()

asyncio.run(basic_cookie_management())
```

## 理解 Cookie 类型

!!! info "TypedDict：实践中使用常规字典"
    在本文档中，您会看到对 `CookieParam` 和 `Cookie` 的引用。这些是 **TypedDict** 类型，它们只是带有类型提示的常规 Python 字典，用于 IDE 自动完成和类型检查。
    
    **实际上，您使用常规字典：**
    ```python
    # 这是您实际编写的：
    cookie = {'name': 'session', 'value': 'abc123', 'domain': 'example.com'}
    
    # 类型注释只是为了您的 IDE：
    from pydoll.protocol.network.types import CookieParam
    cookie: CookieParam = {'name': 'session', 'value': 'abc123'}
    ```
    
    下面的所有示例为简单起见都使用普通字典。

### Cookie 结构

`Cookie` 类型（从浏览器检索）包含完整的 Cookie 信息：

```python
{
    "name": str,           # Cookie 名称
    "value": str,          # Cookie 值
    "domain": str,         # Cookie 有效的域
    "path": str,           # Cookie 有效的路径
    "expires": float,      # Unix 时间戳（0 = 会话 Cookie）
    "size": int,           # 大小（字节）
    "httpOnly": bool,      # 仅通过 HTTP 访问（不是 JavaScript）
    "secure": bool,        # 仅通过 HTTPS 发送
    "session": bool,       # 如果浏览器关闭时过期则为 True
    "sameSite": str,       # "Strict"、"Lax" 或 "None"
    "priority": str,       # "Low"、"Medium" 或 "High"
    "sourceScheme": str,   # "Unset"、"NonSecure" 或 "Secure"
    "sourcePort": int,     # 设置 Cookie 的端口
}
```

### CookieParam 结构

当**设置** Cookie 时，使用字典（只有 `name` 和 `value` 是必需的）：

```python
# 仅包含必需字段的简单 Cookie
cookie = {
    'name': 'user_token',
    'value': 'token_value'
}

# 包含所有可选字段的完整 Cookie
cookie = {
    'name': 'user_token',       # 必需
    'value': 'token_value',     # 必需
    'domain': 'example.com',    # 可选：默认为当前页面域
    'path': '/',                # 可选：默认为 /
    'secure': True,             # 可选：仅 HTTPS
    'httpOnly': True,           # 可选：无 JS 访问
    'sameSite': 'Lax',          # 可选：'Strict'、'Lax' 或 'None'
    'expires': 1735689600,      # 可选：Unix 时间戳
    'priority': 'High',         # 可选：'Low'、'Medium' 或 'High'
}
```

!!! info "可选字段默认行为"
    当您省略可选字段时：
    
    - `domain`：使用当前页面的域
    - `path`：默认为 `/`
    - `secure`：默认为 `False`
    - `httpOnly`：默认为 `False`
    - `sameSite`：浏览器的默认值（通常为 `Lax`）
    - `expires`：会话 Cookie（浏览器关闭时删除）

## Cookie 管理操作

### 设置 Cookie

#### 一次设置多个 Cookie

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def set_multiple_cookies():
    """Set several cookies with different attributes in a single call."""
    import time  # local import keeps this snippet self-contained

    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com')

        # Compute the expiry relative to "now": a hard-coded timestamp
        # eventually lies in the past, and browsers discard cookies whose
        # expiry has already passed.
        expires_at = int(time.time()) + 30 * 24 * 60 * 60  # 30 days from now

        cookies = [
            {
                'name': 'session_id',
                'value': 'xyz789',
                'domain': 'example.com',
                'secure': True,
                'httpOnly': True,
                'sameSite': 'Strict'
            },
            {
                'name': 'preferences',
                'value': 'dark_mode=true',
                'domain': 'example.com',
                'path': '/settings'
            },
            {
                'name': 'analytics',
                'value': 'tracking_id_12345',
                'domain': 'example.com',
                'expires': expires_at  # persistent cookie with a fixed lifetime
            }
        ]

        await tab.set_cookies(cookies)
        print(f"设置了 {len(cookies)} 个 Cookie")

asyncio.run(set_multiple_cookies())
```

#### 在特定上下文中设置 Cookie

```python
# 在特定浏览器上下文中设置 Cookie
context_id = await browser.create_browser_context()
await browser.set_cookies(cookies, browser_context_id=context_id)
```

!!! tip "标签页与浏览器方法设置 Cookie"
    - `tab.set_cookies(cookies)`：在标签页的浏览器上下文中设置 Cookie（便捷快捷方式）
    - `browser.set_cookies(cookies, browser_context_id=...)`：使用显式上下文控制设置 Cookie
    
    两种方法都将 Cookie 添加到**整个上下文**，而不仅仅是当前页面。Cookie 将可用于该上下文中的所有标签页。

### 检索 Cookie

#### 获取所有 Cookie（上下文范围）

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def get_cookies_example():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://github.com')
        
        # 等待页面设置 Cookie
        await asyncio.sleep(2)
        
        # 选项 1：通过标签页获取 Cookie（当前上下文的快捷方式）
        cookies = await tab.get_cookies()
        
        # 选项 2：通过浏览器获取 Cookie（显式上下文控制）
        # cookies = await browser.get_cookies()  # 对于默认上下文与 tab.get_cookies() 相同
        
        print(f"找到 {len(cookies)} 个 Cookie：")
        for cookie in cookies:
            print(f"  - {cookie['name']}: {cookie['value'][:20]}...")
            print(f"    域: {cookie['domain']}, 安全: {cookie['secure']}")

asyncio.run(get_cookies_example())
```

!!! tip "标签页与浏览器方法"
    - `tab.get_cookies()`：从标签页的浏览器上下文返回 Cookie（便捷快捷方式）
    - `browser.get_cookies()`：从默认上下文返回 Cookie（或指定 `browser_context_id`）
    
    两种方法都返回上下文中的**所有 Cookie**，而不仅仅是当前页面域的 Cookie。

!!! warning "隐身模式限制"
    `browser.get_cookies()` 在原生隐身模式（`--incognito` 标志）下**不起作用**。这是 Chrome DevTools Protocol 的限制，`Storage.getCookies` 无法在原生隐身模式下访问 Cookie。
    
    **解决方法：** 改用 `tab.get_cookies()`，它使用 `Network.getCookies` 并在隐身模式下正常工作。

#### 从特定上下文获取 Cookie

```python
# 从特定浏览器上下文获取 Cookie
context_id = await browser.create_browser_context()
cookies = await browser.get_cookies(browser_context_id=context_id)
```

### 删除 Cookie

#### 删除所有 Cookie

```python
# 从当前标签页的上下文删除所有 Cookie
await tab.delete_all_cookies()

# 从特定上下文删除所有 Cookie
await browser.delete_all_cookies(browser_context_id=context_id)
```

!!! warning "Cookie 立即删除"
    当您删除 Cookie 时，它们会立即从浏览器中移除。网站可能直到下一次请求或页面重新加载才会检测到这一点。

## 实际用例

### 1. 持久登录会话

跨脚本运行重用身份验证 Cookie：

```python
import asyncio
import json
from pathlib import Path
from pydoll.browser.chromium import Chrome

COOKIE_FILE = Path('cookies.json')

async def save_cookies_after_login():
    """登录并保存 Cookie 供将来使用。"""
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com/login')
        
        # 执行登录（简化）
        email = await tab.find(id='email')
        password = await tab.find(id='password')
        await email.type_text('user@example.com')
        await password.type_text('secret')
        
        login_btn = await tab.find(id='login')
        await login_btn.click()
        await asyncio.sleep(3)
        
        # 保存 Cookie
        cookies = await browser.get_cookies()
        COOKIE_FILE.write_text(json.dumps(cookies, indent=2))
        print(f"已将 {len(cookies)} 个 Cookie 保存到 {COOKIE_FILE}")

async def reuse_saved_cookies():
    """加载保存的 Cookie 以跳过登录。"""
    if not COOKIE_FILE.exists():
        print("未找到保存的 Cookie。请先运行 save_cookies_after_login()。")
        return
    
    # 从文件加载 Cookie
    saved_cookies = json.loads(COOKIE_FILE.read_text())
    
    # 转换为简化格式（仅必需字段）
    # 注意：get_cookies() 返回详细的 Cookie 对象，带有只读字段
    # （size、session、sourceScheme 等）。set_cookies() 期望 CookieParam
    # 格式，仅包含可设置的字段。
    cookies_to_set = [
        {
            'name': c['name'],
            'value': c['value'],
            'domain': c['domain'],
            'path': c.get('path', '/'),
            'secure': c.get('secure', False),
            'httpOnly': c.get('httpOnly', False)
        }
        for c in saved_cookies
    ]
    
    async with Chrome() as browser:
        tab = await browser.start()
        
        # 在导航之前设置 Cookie
        await tab.set_cookies(cookies_to_set)
        print(f"从文件加载了 {len(cookies_to_set)} 个 Cookie")
        
        # 导航 - 应该已经登录
        await tab.go_to('https://example.com/dashboard')
        await asyncio.sleep(2)
        
        # 验证登录
        try:
            username = await tab.find(class_name='username')
            print(f"登录为: {await username.text}")
        except Exception:
            print("登录失败 - Cookie 可能已过期")

# 首次运行：登录并保存 Cookie
# asyncio.run(save_cookies_after_login())

# 后续运行：重用 Cookie
asyncio.run(reuse_saved_cookies())
```

!!! note "需要重新格式化 Cookie"
    `get_cookies()` 返回**详细的 `Cookie` 对象**，带有只读属性如 `size`、`session`、`sourceScheme` 和 `sourcePort`。使用 `set_cookies()` 时，您必须提供 **`CookieParam` 格式**，仅包含可设置的字段（`name`、`value`、`domain`、`path`、`secure`、`httpOnly`、`sameSite`、`expires`、`priority`）。
    
    上面示例中的重新格式化步骤是**必不可少的**。将原始 `Cookie` 对象传递给 `set_cookies()` 可能会导致错误或意外行为。

!!! tip "Cookie 过期"
    始终检查保存的 Cookie 是否已过期。会话 Cookie（`session=True`）在浏览器关闭时过期，而持久性 Cookie 有一个您可以验证的 `expires` 时间戳。

### 2. 使用隔离 Cookie 进行多账户测试

每个浏览器上下文维护单独的 Cookie：

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def test_multiple_accounts():
    accounts = [
        {'email': 'user1@example.com', 'cookie_value': 'session_user1'},
        {'email': 'user2@example.com', 'cookie_value': 'session_user2'},
    ]
    
    async with Chrome() as browser:
        initial_tab = await browser.start()
        
        # 默认上下文中的第一个账户
        cookies_user1 = [{
            'name': 'session',
            'value': accounts[0]['cookie_value'],
            'domain': 'example.com',
            'secure': True,
            'httpOnly': True
        }]
        await initial_tab.set_cookies(cookies_user1)
        await initial_tab.go_to('https://example.com/dashboard')
        
        # 隔离上下文中的第二个账户
        context2 = await browser.create_browser_context()
        tab2 = await browser.new_tab(browser_context_id=context2)
        
        cookies_user2 = [{
            'name': 'session',
            'value': accounts[1]['cookie_value'],
            'domain': 'example.com',
            'secure': True,
            'httpOnly': True
        }]
        await browser.set_cookies(cookies_user2, browser_context_id=context2)
        await tab2.go_to('https://example.com/dashboard')
        
        # 两个用户使用不同的会话同时登录
        print("用户 1 和用户 2 使用隔离的 Cookie 登录")
        
        await asyncio.sleep(5)
        
        # 清理
        await tab2.close()
        await browser.delete_browser_context(context2)

asyncio.run(test_multiple_accounts())
```

### 3. 长时间运行脚本的 Cookie 轮换

定期刷新 Cookie 以避免检测：

```python
import asyncio
import time
from pydoll.browser.chromium import Chrome

async def scrape_with_cookie_rotation():
    urls = [f'https://example.com/page{i}' for i in range(100)]
    
    async with Chrome() as browser:
        tab = await browser.start()
        
        # 最初登录
        await tab.go_to('https://example.com/login')
        # ... 执行登录 ...
        await asyncio.sleep(2)
        
        last_rotation = time.time()
        rotation_interval = 600  # 每 10 分钟轮换一次
        
        for url in urls:
            # 检查是否是轮换 Cookie 的时候
            if time.time() - last_rotation > rotation_interval:
                print("轮换会话...")
                
                # 删除旧 Cookie
                await tab.delete_all_cookies()
                
                # 重新登录或加载新 Cookie
                await tab.go_to('https://example.com/login')
                # ... 再次执行登录 ...
                
                last_rotation = time.time()
            
            # 抓取页面
            await tab.go_to(url)
            await asyncio.sleep(2)
            # ... 提取数据 ...

asyncio.run(scrape_with_cookie_rotation())
```

!!! tip "轮换频率"
    理想的轮换频率取决于您的用例：
    
    - **高安全性网站**：每 5-15 分钟轮换一次
    - **普通网站**：每 30-60 分钟轮换一次
    - **低风险抓取**：每几小时轮换一次


## Cookie 属性参考

| 属性 | 类型 | 描述 | 默认值 |
|-----------|------|-------------|---------|
| `name` | `str` | Cookie 名称 | *必需* |
| `value` | `str` | Cookie 值 | *必需* |
| `domain` | `str` | Cookie 有效的域 | 当前页面域 |
| `path` | `str` | Cookie 有效的路径 | `/` |
| `secure` | `bool` | 仅通过 HTTPS 发送 | `False` |
| `httpOnly` | `bool` | 无法通过 JavaScript 访问 | `False` |
| `sameSite` | `CookieSameSite` | CSRF 保护：`Strict`、`Lax`、`None` | 浏览器默认（`Lax`）|
| `expires` | `float` | Unix 时间戳；省略时为会话 Cookie（读取到的会话 Cookie 该值为 `-1`）| 省略（会话）|
| `priority` | `CookiePriority` | Cookie 优先级：`Low`、`Medium`、`High` | `Medium` |

### SameSite 值

```python
# 在您的 Cookie 字典中直接使用字符串值：

'sameSite': 'Strict'  # 仅为同站点请求发送 Cookie
'sameSite': 'Lax'     # 为顶级导航发送 Cookie（默认）
'sameSite': 'None'    # 为所有请求发送 Cookie（需要 secure=True）

# 或使用枚举获得 IDE 自动完成：
from pydoll.protocol.network.types import CookieSameSite

cookie = {
    'name': 'session',
    'value': 'xyz',
    'sameSite': CookieSameSite.STRICT  # IDE 将自动完成：STRICT、LAX、NONE
}
```

### Priority 值

```python
# 直接使用字符串值：

'priority': 'Low'     # 低优先级（需要空间时首先删除）
'priority': 'Medium'  # 中优先级（默认）
'priority': 'High'    # 高优先级（最后删除）

# 或使用枚举：
from pydoll.protocol.network.types import CookiePriority

cookie = {
    'name': 'session',
    'value': 'xyz',
    'priority': CookiePriority.HIGH  # IDE 将自动完成：LOW、MEDIUM、HIGH
}
```

## 常见模式

### 临时 Cookie 的上下文管理器

```python
from contextlib import asynccontextmanager

@asynccontextmanager
async def temporary_cookies(browser, tab, cookies):
    """Use ``cookies`` inside the ``async with`` body, then restore the old ones.

    Args:
        browser: object whose ``get_cookies()`` returns the cookies to restore.
        tab: object used to delete and set cookies; it is also the value
            yielded to the ``async with`` body.
        cookies: cookies to install for the duration of the body.

    The restore step keeps every settable attribute of the saved cookies, not
    only name/value/domain/path, so flags such as ``secure``/``httpOnly`` and
    the expiry of persistent cookies survive the round trip.
    """
    # Optional attributes that may be sent back when setting a cookie.
    # Read-only ones (size, session, sourceScheme, sourcePort) are left out.
    optional_fields = ('secure', 'httpOnly', 'sameSite', 'priority')

    # Snapshot the cookies before touching anything
    original_cookies = await browser.get_cookies()

    try:
        # Replace the current cookies with the temporary set
        await tab.delete_all_cookies()
        await tab.set_cookies(cookies)
        yield tab
    finally:
        # Runs even if the body raised, so the original cookies always return
        await tab.delete_all_cookies()
        cookies_to_restore = []
        for c in original_cookies:
            restored = {
                'name': c['name'],
                'value': c['value'],
                'domain': c['domain'],
                'path': c.get('path', '/'),
            }
            restored.update({key: c[key] for key in optional_fields if key in c})
            # Session cookies have no real expiry (presumably reported as a
            # non-positive value such as -1); sending that back would recreate
            # them as already-expired cookies, so only a real expiry is kept.
            if not c.get('session') and c.get('expires', 0) > 0:
                restored['expires'] = c['expires']
            cookies_to_restore.append(restored)
        await tab.set_cookies(cookies_to_restore)

# 使用
async with temporary_cookies(browser, tab, test_cookies):
    await tab.go_to('https://example.com')
    # ... 使用临时 Cookie 执行操作 ...
# 原始 Cookie 自动恢复
```

!!! tip "使用公共 API"
    此上下文管理器接受 `browser` 和 `tab` 作为参数以使用公共 API。由于 `tab` 不将其父 `browser` 作为公共属性公开，因此显式传递它是访问浏览器级方法的推荐方法。

### Cookie 指纹比较

```python
def cookie_fingerprint(cookies):
    """Summarize a list of cookie dicts as a small, comparable fingerprint.

    Returns a dict with the cookie count, the set of domains, the sorted
    cookie names, and how many cookies have a truthy ``secure`` / ``httpOnly``
    flag.
    """
    total = len(cookies)
    domains = {cookie['domain'] for cookie in cookies}
    names = sorted(cookie['name'] for cookie in cookies)
    secure_total = len([cookie for cookie in cookies if cookie.get('secure')])
    http_only_total = len([cookie for cookie in cookies if cookie.get('httpOnly')])

    fingerprint = {}
    fingerprint['count'] = total
    fingerprint['domains'] = domains
    fingerprint['names'] = names
    fingerprint['secure_count'] = secure_total
    fingerprint['httponly_count'] = http_only_total
    return fingerprint

# 比较 Cookie 状态
before = await browser.get_cookies()
await tab.go_to('https://example.com')
after = await browser.get_cookies()

print(f"之前: {cookie_fingerprint(before)}")
print(f"之后: {cookie_fingerprint(after)}")
```

## 安全注意事项

!!! danger "切勿硬编码敏感 Cookie"
    始终从安全存储（环境变量、加密文件、密钥管理器）加载身份验证 Cookie。
    
    ```python
    # ❌ 不好 - 在代码中硬编码
    cookies = [{'name': 'session', 'value': 'abc123secret'}]
    
    # ✅ 好 - 从环境加载
    import os
    cookies = [{
        'name': 'session',
        'value': os.getenv('SESSION_COOKIE'),
        'domain': os.getenv('COOKIE_DOMAIN')
    }]
    ```

!!! warning "Cookie 盗窃保护"
    将 Cookie 保存到磁盘时：
    
    - 使用加密存储（例如，`cryptography` 库）
    - 设置限制性文件权限
    - 切勿将 Cookie 文件提交到版本控制
    - 定期轮换 Cookie

## 最佳实践总结

1. **从真实 Cookie 开始** - 不要在完全干净的浏览器中运行自动化
2. **定期轮换会话** - 避免长时间使用相同的 Cookie
3. **尊重 Cookie 安全属性** - 适当使用 `secure`、`httpOnly`、`sameSite`
4. **保存和重用身份验证 Cookie** - 适当时跳过重复登录
5. **隔离多账户测试的上下文** - 每个上下文都有独立的 Cookie
6. **监控 Cookie 演变** - 真实浏览自然会积累 Cookie
7. **清理过期的 Cookie** - 重用前删除无效 Cookie
8. **使用安全存储** - 加密保存的 Cookie，切勿硬编码密钥

## 另请参阅

- **[浏览器上下文](contexts.md)** - 隔离的 Cookie 环境
- **[HTTP 请求](../network/http-requests.md)** - 浏览器上下文请求自动继承 Cookie
- **[类人交互](../automation/human-interactions.md)** - 将 Cookie 与真实行为结合
- **[API 参考：存储命令](../../api/commands/storage.md)** - 完整的 CDP Cookie 方法

有效的 Cookie 管理是真实浏览器自动化的基础。通过平衡新鲜度与持久性并尊重安全属性，您可以构建表现得像真实用户一样的自动化，同时保持高效和可维护性。


================================================
FILE: docs/zh/features/browser-management/tabs.md
================================================
# 多标签页管理

Pydoll 提供了强大的多标签页功能，可以实现跨多个浏览器标签页同时进行复杂的自动化工作流。理解 Pydoll 中标签页的工作原理对于构建健壮、可扩展的自动化至关重要。

## 理解 Pydoll 中的标签页

在 Pydoll 中，`Tab` 实例代表单个浏览器标签页（或窗口），并提供所有页面自动化操作的主要接口。每个标签页维护自己的：

- **独立执行上下文**：JavaScript、DOM 和页面状态
- **隔离的事件处理器**：在一个标签页上注册的回调不会影响其他标签页
- **独立的网络监控**：每个标签页可以跟踪自己的网络活动
- **唯一的 CDP 连接**：与浏览器的直接 WebSocket 通信

```mermaid
graph LR
    Browser[浏览器实例] --> Tab1[标签页 1]
    Browser --> Tab2[标签页 2]
    Browser --> Tab3[...]
    
    Tab1 --> Features1[独立<br/>上下文]
    Tab2 --> Features2[独立<br/>上下文]
```

| 标签页组件 | 描述 | 独立性 |
|-----------|------|--------|
| **执行上下文** | JavaScript 运行时、DOM、页面状态 | ✓ 每个标签页都有自己的 |
| **事件处理器** | CDP 事件的注册回调 | ✓ 每个标签页隔离 |
| **网络监控** | HTTP 请求、响应、时序 | ✓ 单独跟踪 |
| **CDP 连接** | WebSocket 通信通道 | ✓ 直接连接 |

### 什么是浏览器标签页？

浏览器标签页在技术上是一个 **CDP 目标**——它拥有自己独立的浏览上下文，其中包括：

- 文档对象模型（DOM）
- JavaScript 执行环境
- 网络连接池
- Cookie 存储（与同一上下文中的其他标签页共享）
- 事件循环和渲染引擎

每个标签页都有浏览器分配的唯一 `target_id`，Pydoll 使用它来正确路由命令和事件。

## 标签页实例管理

Pydoll 的 `Browser` 类根据每个标签页的 `target_id` 维护一个 Tab 实例注册表。这确保对同一浏览器标签页的多个引用始终返回相同的 Tab 对象。Browser 将这些实例存储在内部的 `_tabs_opened` 字典中。

| 优势 | 描述 |
|------|------|
| **资源效率** | 每个浏览器标签页一个 Tab 实例，无重复 |
| **状态一致** | 所有引用共享相同的事件处理器和状态 |
| **内存安全** | 防止与同一目标建立多个 WebSocket 连接 |
| **可预测的行为** | 一个引用的变化会影响所有引用 |

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def tab_registry_demonstration():
    async with Chrome() as browser:
        # 启动浏览器并获取初始标签页
        tab1 = await browser.start()

        # 通过不同方法获取同一标签页
        # 注意：get_opened_tabs() 以相反顺序返回标签页（最新的在前）
        # 所以初始标签页（最旧的）在最后
        opened_tabs = await browser.get_opened_tabs()
        tab2 = opened_tabs[-1]  # 初始标签页是最旧的，所以在最后

        # 两个引用指向同一对象
        # 因为 Browser 从其注册表返回相同的实例
        print(f"Same instance? {tab1 is tab2}")  # True
        print(f"Same target ID? {tab1._target_id == tab2._target_id}")  # True

        # 在一个引用上注册事件会影响另一个
        await tab1.enable_network_events()
        print(f"Network events on tab2? {tab2.network_events_enabled}")  # True

        # Browser 在内部维护注册表
        print(f"Tab registered in browser? {tab1._target_id in browser._tabs_opened}")  # True

asyncio.run(tab_registry_demonstration())
```

!!! info "Browser 管理的注册表"
    Browser 类管理一个以 `target_id` 为键的 `_tabs_opened` 字典。当你请求一个标签页（通过 `new_tab()` 或 `get_opened_tabs()`）时，Browser 会先检查该注册表。如果已经存在对应的 Tab，就复用该实例；否则创建新的并缓存。（IFrame 现在作为普通元素处理，不再注册为独立的 Tab。）

## 创建和管理标签页

### 启动浏览器

启动浏览器时，Pydoll 自动为初始浏览器标签页创建并返回一个 Tab 实例：

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def start_browser():
    async with Chrome() as browser:
        # 自动创建初始标签页
        tab = await browser.start()
        
        print(f"Tab created with target ID: {tab._target_id}")
        await tab.go_to('https://example.com')
        
        title = await tab.execute_script('return document.title')
        print(f"Page title: {title}")

asyncio.run(start_browser())
```

### 以编程方式创建额外的标签页

使用 `browser.new_tab()` 完全控制创建额外的标签页：

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def create_multiple_tabs():
    async with Chrome() as browser:
        # 从初始标签页开始
        main_tab = await browser.start()
        
        # 创建带有特定 URL 的额外标签页
        search_tab = await browser.new_tab('https://google.com')
        docs_tab = await browser.new_tab('https://docs.python.org')
        news_tab = await browser.new_tab('https://news.ycombinator.com')
        
        # 每个标签页可以独立控制
        await search_tab.find(name='q')  # Google 搜索框
        await docs_tab.find(id='search-field')  # Python 文档搜索
        await news_tab.find(class_name='storylink', find_all=True)  # HN 故事
        
        # 获取所有打开的标签页
        all_tabs = await browser.get_opened_tabs()
        print(f"Total tabs: {len(all_tabs)}")  # 4（初始 + 3 个新的）
        
        # 完成后关闭特定标签页
        await search_tab.close()
        await docs_tab.close()
        await news_tab.close()

asyncio.run(create_multiple_tabs())
```

!!! tip "URL 参数可选"
    你可以创建不指定 URL 的标签页：`await browser.new_tab()`。标签页将打开空白页面（`about:blank`），准备导航。

### 处理用户打开的标签页

当用户点击带有 `target="_blank"` 的链接或使用"在新标签页中打开"时，Pydoll 可以检测并管理这些标签页：

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def handle_user_tabs():
    """Detect and drive a tab that the page itself opened (target="_blank")."""
    async with Chrome() as browser:
        main_tab = await browser.start()
        await main_tab.go_to('https://example.com')

        # Snapshot the tabs that exist before the click
        initial_tabs = await browser.get_opened_tabs()
        print(f"Initial tabs: {len(initial_tabs)}")

        # Click a link that opens in a new tab (target="_blank")
        external_link = await main_tab.find(text='Open in New Tab')
        await external_link.click()

        # Give the browser time to open the new tab
        await asyncio.sleep(2)

        current_tabs = await browser.get_opened_tabs()
        print(f"Current tabs: {len(current_tabs)}")

        # Keep only the tabs that were not open before the click.
        # get_opened_tabs() lists the newest tab first, so current_tabs[-1]
        # would be the oldest (initial) tab. Comparing against the snapshot
        # avoids relying on list order; it works because the browser returns
        # the same Tab instance for the same target.
        new_tabs = [tab for tab in current_tabs if tab not in initial_tabs]
        if new_tabs:
            new_tab = new_tabs[0]

            # Work with the newly opened tab
            url = await new_tab.current_url
            print(f"New tab URL: {url}")

            await new_tab.go_to('https://different-site.com')
            title = await new_tab.execute_script('return document.title')
            print(f"New tab title: {title}")

            # Close it once done
            await new_tab.close()

asyncio.run(handle_user_tabs())
```

### 列出所有打开的标签页

使用 `browser.get_opened_tabs()` 检索所有当前打开的标签页：

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def list_tabs():
    async with Chrome() as browser:
        # 使用 start() 返回的初始标签页
        initial_tab = await browser.start()
        await initial_tab.go_to('https://example.com')
        
        # 再打开几个标签页
        await browser.new_tab('https://github.com')
        await browser.new_tab('https://stackoverflow.com')
        await browser.new_tab('https://reddit.com')
        
        # 获取所有标签页
        all_tabs = await browser.get_opened_tabs()
        
        # 检查每个标签页
        for i, tab in enumerate(all_tabs, 1):
            url = await tab.current_url
            title = await tab.execute_script('return document.title')
            print(f"Tab {i}: {title} - {url}")

asyncio.run(list_tabs())
```

## 并发标签页操作

Pydoll 的异步架构支持跨多个标签页的强大并发工作流：

### 并行数据收集

同时处理多个页面以获得最大效率：

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def scrape_page(tab, url):
    """在给定标签页中抓取单个页面。"""
    await tab.go_to(url)
    title = await tab.execute_script('return document.title')
    articles = await tab.find(class_name='article', find_all=True)
    content = [await article.text for article in articles[:5]]

    return {
        'url': url,
        'title': title,
        'articles_count': len(articles),
        'sample_content': content
    }

async def concurrent_scraping():
    urls = [
        'https://example.com/page1',
        'https://example.com/page2',
        'https://example.com/page3',
        'https://example.com/page4',
    ]

    async with Chrome() as browser:
        # 启动浏览器并打开第一个标签页
        initial_tab = await browser.start()
        # 为每个 URL 创建一个标签页
        tabs = [initial_tab] + [await browser.new_tab() for _ in urls[1:]]

        # 并发运行所有爬虫
        results = await asyncio.gather(*[
            scrape_page(tab, url) for tab, url in zip(tabs, urls)
        ])

        # 显示结果
        for result in results:
            print(f"\n{result['title']}")
            print(f"  URL: {result['url']}")
            print(f"  Articles: {result['articles_count']}")
            if result['sample_content']:
                print(f"  Sample: {result['sample_content'][0][:100]}...")

asyncio.run(concurrent_scraping())
```

!!! tip "性能提升"
    与顺序处理相比，并发抓取可以将总执行时间缩短到原来的 1/5 至 1/10，对于页面加载这类 I/O 密集型任务尤其明显。

### 协调多标签页工作流

编排需要多个标签页交互的复杂工作流：

```python
import asyncio
from pydoll.browser.chromium import Chrome
from pydoll.protocol.network.events import NetworkEvent, RequestWillBeSentEvent

async def multi_tab_workflow():
    async with Chrome() as browser:
        # 使用初始标签页进行登录
        login_tab = await browser.start()
        await login_tab.go_to('https://app.example.com/login')
        await asyncio.sleep(2)
        
        username = await login_tab.find(id='username')
        password = await login_tab.find(id='password')
        
        await username.type_text('admin@example.com')
        await password.type_text('secure_password')
        
        login_btn = await login_tab.find(id='login')
        await login_btn.click()
        await asyncio.sleep(3)
        
        # 标签页 2：导航到数据导出页面
        export_tab = await browser.new_tab('https://app.example.com/export')
        await asyncio.sleep(2)
        
        export_btn = await export_tab.find(text='Export Data')
        await export_btn.click()
        
        # 标签页 3：在仪表板中监控 API 调用
        monitor_tab = await browser.new_tab('https://app.example.com/dashboard')
        await monitor_tab.enable_network_events()
        
        # 跟踪 API 调用
        api_calls = []
        async def track_api(event: RequestWillBeSentEvent):
            url = event['params']['request']['url']
            if '/api/' in url:
                api_calls.append(url)
        
        await monitor_tab.on(NetworkEvent.REQUEST_WILL_BE_SENT, track_api)
        await asyncio.sleep(5)
        
        print(f"Tracked {len(api_calls)} API calls:")
        for call in api_calls[:10]:
            print(f"  - {call}")
        
        # 清理
        await login_tab.close()
        await export_tab.close()
        await monitor_tab.close()

asyncio.run(multi_tab_workflow())
```

## 标签页生命周期和清理

### 显式标签页关闭

完成后始终关闭标签页以释放浏览器资源：

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def explicit_cleanup():
    async with Chrome() as browser:
        initial_tab = await browser.start()
        
        # 为不同任务创建标签页
        tab1 = await browser.new_tab('https://example.com')
        tab2 = await browser.new_tab('https://example.org')
        
        # 使用标签页进行工作
        await tab1.go_to('https://different-site.com')
        await tab2.take_screenshot('/tmp/screenshot.png')
        
        # 显式关闭标签页
        await tab1.close()
        await tab2.close()
        
        # 验证标签页已关闭
        remaining = await browser.get_opened_tabs()
        print(f"Remaining tabs: {len(remaining)}")  # 应该是 1（初始）

asyncio.run(explicit_cleanup())
```

!!! warning "内存泄漏"
    在长时间运行的自动化中不关闭标签页可能导致内存耗尽。每个标签页消耗浏览器资源（内存、文件句柄、网络连接）。

### 使用上下文管理器自动清理

虽然 Pydoll 没有提供内置的标签页上下文管理器，但你可以创建自己的：

```python
import asyncio
from contextlib import asynccontextmanager
from pydoll.browser.chromium import Chrome

@asynccontextmanager
async def managed_tab(browser, url=None):
    """用于自动清理标签页的上下文管理器。"""
    tab = await browser.new_tab(url)
    try:
        yield tab
    finally:
        await tab.close()

async def auto_cleanup_example():
    async with Chrome() as browser:
        initial_tab = await browser.start()
        
        # 退出上下文时标签页自动关闭
        async with managed_tab(browser, 'https://example.com') as tab:
            title = await tab.execute_script('return document.title')
            print(f"Title: {title}")
            
            await tab.take_screenshot('/tmp/page.png')
        # 标签页在这里自动关闭
        
        tabs = await browser.get_opened_tabs()
        print(f"Tabs after context exit: {len(tabs)}")  # 1（仅 initial_tab）

asyncio.run(auto_cleanup_example())
```

### 浏览器清理

浏览器关闭时，所有标签页会自动关闭：

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def browser_cleanup():
    # 使用上下文管理器 - 自动清理
    async with Chrome() as browser:
        initial_tab = await browser.start()
        
        # 创建多个标签页
        await browser.new_tab('https://example.com')
        await browser.new_tab('https://github.com')
        await browser.new_tab('https://stackoverflow.com')
        
        tabs = await browser.get_opened_tabs()
        print(f"Tabs open: {len(tabs)}")  # 4（初始 + 3 个新的）
    
    # 浏览器退出时所有标签页自动关闭
    print("Browser closed, all tabs cleaned up")

asyncio.run(browser_cleanup())
```

## 标签页状态管理

### 检查标签页状态

查询标签页当前状态的各个方面：

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def check_tab_state():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com')
        
        # 检查当前 URL
        url = await tab.current_url
        print(f"Current URL: {url}")
        
        # 检查页面源代码
        source = await tab.page_source
        print(f"Page source length: {len(source)} characters")
        
        # 检查已启用的事件域
        print(f"Page events enabled: {tab.page_events_enabled}")
        print(f"Network events enabled: {tab.network_events_enabled}")
        print(f"DOM events enabled: {tab.dom_events_enabled}")
        
        # 启用事件并再次检查
        await tab.enable_network_events()
        print(f"Network events enabled: {tab.network_events_enabled}")  # True

asyncio.run(check_tab_state())
```

### 标签页标识

每个标签页都有唯一标识符：

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def tab_identification():
    async with Chrome() as browser:
        tab1 = await browser.start()
        tab2 = await browser.new_tab()
        
        # Target ID - 浏览器分配的唯一标识符
        print(f"Tab 1 target ID: {tab1._target_id}")
        print(f"Tab 2 target ID: {tab2._target_id}")
        
        # 连接详情
        print(f"Tab 1 connection port: {tab1._connection_port}")
        print(f"Tab 2 connection port: {tab2._connection_port}")
        
        # 浏览器上下文 ID（默认上下文通常为 None）
        print(f"Tab 1 context ID: {tab1._browser_context_id}")
        print(f"Tab 2 context ID: {tab2._browser_context_id}")

asyncio.run(tab_identification())
```

## 高级标签页功能

### 将标签页置于前台

使特定标签页可见（置于前台）：

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def bring_to_front():
    async with Chrome() as browser:
        tab1 = await browser.start()
        tab2 = await browser.new_tab('https://github.com')
        tab3 = await browser.new_tab('https://stackoverflow.com')
        
        # tab3 当前在前台（最后创建的）
        await asyncio.sleep(2)
        
        # 将 tab1 置于前台
        await tab1.bring_to_front()
        print("Tab 1 brought to front")
        
        await asyncio.sleep(2)
        
        # 将 tab2 置于前台
        await tab2.bring_to_front()
        print("Tab 2 brought to front")

asyncio.run(bring_to_front())
```

### 标签页特定的网络监控

每个标签页可以独立监控自己的网络活动：

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def tab_network_monitoring():
    async with Chrome() as browser:
        # 使用初始标签页进行监控导航
        tab1 = await browser.start()
        await tab1.go_to('https://example.com')
        
        # 创建第二个标签页不进行监控
        tab2 = await browser.new_tab('https://github.com')
        
        # 仅在 tab1 上启用网络监控
        await tab1.enable_network_events()
        
        # 导航两个标签页
        await tab1.go_to('https://example.com/page1')
        await tab2.go_to('https://github.com/explore')
        
        await asyncio.sleep(3)
        
        # 仅从 tab1 获取网络日志
        tab1_logs = await tab1.get_network_logs()
        print(f"Tab 1 network requests: {len(tab1_logs)}")
        
        # tab2 没有网络监控
        print(f"Tab 2 network events enabled: {tab2.network_events_enabled}")  # False

asyncio.run(tab_network_monitoring())
```

### 标签页特定的事件处理器

在不同标签页上注册不同的事件处理器：

```python
import asyncio
from pydoll.browser.chromium import Chrome
from pydoll.protocol.page.events import PageEvent

async def tab_specific_events():
    async with Chrome() as browser:
        # 使用初始标签页作为第一个标签页
        tab1 = await browser.start()
        tab2 = await browser.new_tab()
        
        # 在两个标签页上启用页面事件
        await tab1.enable_page_events()
        await tab2.enable_page_events()
        
        # 为每个标签页使用不同的处理器
        async def tab1_handler(event):
            print("Tab 1 loaded!")
        
        async def tab2_handler(event):
            print("Tab 2 loaded!")
        
        await tab1.on(PageEvent.LOAD_EVENT_FIRED, tab1_handler)
        await tab2.on(PageEvent.LOAD_EVENT_FIRED, tab2_handler)
        
        # 导航两个标签页
        await tab1.go_to('https://example.com')
        await tab2.go_to('https://github.com')
        
        await asyncio.sleep(2)

asyncio.run(tab_specific_events())
```

## 性能考虑

| 场景 | 资源影响 | 建议 |
|------|---------|------|
| **1-5 个标签页** | 低 | 直接管理，无需特殊处理 |
| **5-20 个标签页** | 中等 | 使用信号量限制并发 |
| **20-50 个标签页** | 高 | 批处理，积极关闭标签页 |
| **50+ 个标签页** | 非常高 | 考虑顺序处理或多个浏览器 |

### 内存使用

每个标签页大约消耗：

- **基础内存**：50-100 MB
- **启用网络事件**：+10-20 MB
- **启用 DOM 事件**：+20-50 MB
- **复杂页面（SPA）**：+100-300 MB

20 个启用网络监控的标签页：约 1.5-3 GB 内存。

## 常见模式

### 使用单个标签页的顺序处理

```python
async def sequential_pattern():
    async with Chrome() as browser:
        tab = await browser.start()
        
        for url in urls:
            await tab.go_to(url)
            # 提取数据
            await tab.clear_callbacks()  # 清理事件

asyncio.run(sequential_pattern())
```

### 使用多个标签页的并行处理

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def parallel_pattern():
    urls = [
        'https://example.com/page1',
        'https://example.com/page2',
        'https://example.com/page3',
        'https://example.com/page4',
    ]

    async with Chrome() as browser:
        # 启动浏览器并获取初始标签页
        initial_tab = await browser.start()
        # 为每个 URL 创建一个标签页（为第一个重用初始标签页）
        tabs = [initial_tab] + [await browser.new_tab() for _ in urls[1:]]

        async def process_page(tab, url):
            """在给定标签页中处理单个页面。"""
            try:
                await tab.go_to(url)
                await asyncio.sleep(2)
                title = await tab.execute_script('return document.title')
                print(f"[{url}] {title}")
            finally:
                if tab is not initial_tab:
                    await tab.close()

        # 并发运行所有标签页
        await asyncio.gather(*[
            process_page(tab, url) for tab, url in zip(tabs, urls)
        ])

asyncio.run(parallel_pattern())
```

### 工作池模式

```python
async def worker_pool_pattern():
    async with Chrome() as browser:
        # 使用初始标签页作为第一个工作者
        initial_tab = await browser.start()
        
        # 创建额外的工作者标签页（总共 5 个工作者：1 个初始 + 4 个新的）
        workers = [initial_tab] + [await browser.new_tab() for _ in range(4)]
        
        # 在所有工作者之间分配工作
        for url in urls:
            worker = workers[urls.index(url) % len(workers)]
            await worker.go_to(url)
            # 处理...
        
        # 清理所有工作者（包括初始标签页）
        for worker in workers:
            await worker.close()

asyncio.run(worker_pool_pattern())
```

!!! tip "重用初始标签页"
    始终使用 `browser.start()` 返回的标签页，而不是让它空闲。这可以节省浏览器资源并提高性能。在上面的示例中，初始标签页被重用作为第一个工作者或批处理中的第一个 URL。

## 另请参阅

- **[浏览器上下文](contexts.md)** - 隔离的浏览器会话
- **[Cookie 和会话](cookies-sessions.md)** - 跨标签页管理 cookie
- **[事件系统](../advanced/event-system.md)** - 标签页特定的事件处理
- **[并发抓取](../../features.md#concurrent-scraping)** - 实际示例

Pydoll 中的多标签页管理为构建可扩展、高效的浏览器自动化提供了基础。通过理解标签页生命周期、单例模式和最佳实践，你可以创建健壮的自动化工作流，轻松处理复杂的多页面场景。


================================================
FILE: docs/zh/features/configuration/browser-options.md
================================================
# 浏览器选项 (ChromiumOptions)

`ChromiumOptions` 是自定义浏览器行为的核心配置入口。它控制从命令行参数和二进制文件位置到页面加载状态和内容偏好的所有内容。

!!! info "相关文档"
    - **[浏览器偏好设置](browser-preferences.md)** - 深入了解 Chromium 的内部偏好系统
    - **[浏览器管理](../browser-management/tabs.md)** - 使用浏览器实例和标签页
    - **[上下文](../browser-management/contexts.md)** - 隔离的浏览上下文

## 快速入门

```python
import asyncio
from pydoll.browser.chromium import Chrome
from pydoll.browser.options import ChromiumOptions
from pydoll.constants import PageLoadState

async def main():
    # 创建并配置选项
    options = ChromiumOptions()
    
    # 基本配置
    options.headless = True
    options.start_timeout = 15
    options.page_load_state = PageLoadState.INTERACTIVE
    
    # 添加命令行参数
    options.add_argument('--disable-gpu')
    options.add_argument('--window-size=1920,1080')
    
    # 常见设置的辅助方法
    options.block_notifications = True
    options.block_popups = True
    options.set_default_download_directory('/tmp/downloads')
    
    # 使用配置的选项
    async with Chrome(options=options) as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com')

asyncio.run(main())
```

## 核心属性

### 命令行参数

Chromium 支持数百个控制浏览器行为的命令行开关。使用 `add_argument()` 直接将标志传递给浏览器进程。

```python
options = ChromiumOptions()

# 添加单个参数
options.add_argument('--disable-blink-features=AutomationControlled')

# 添加带值的参数
options.add_argument('--window-size=1920,1080')
options.add_argument('--user-agent=Mozilla/5.0 ...')

# 如需要可删除参数
options.remove_argument('--window-size=1920,1080')

# 获取所有参数
all_args = options.arguments
```

!!! tip "参数格式"
    - 以 `--` 开头的参数是标志：`--headless`、`--disable-gpu`
    - 带 `=` 的参数有值：`--window-size=1920,1080`
    - 有些接受多个值：`--disable-features=Feature1,Feature2`

**请参阅下面的[命令行参数参考](#命令行参数参考)获取完整列表。**

### 二进制文件位置

指定自定义浏览器可执行文件而不是使用系统默认值：

```python
options = ChromiumOptions()

# Linux
options.binary_location = '/opt/google/chrome-beta/chrome'

# macOS
options.binary_location = '/Applications/Google Chrome Canary.app/Contents/MacOS/Google Chrome Canary'

# Windows
options.binary_location = r'C:\Program Files\Google\Chrome Beta\Application\chrome.exe'
```

!!! info "何时设置二进制位置"
    - 测试不同的 Chrome 版本（Stable、Beta、Canary）
    - 使用 Chromium 而不是 Chrome
    - 使用便携式浏览器安装
    - 运行特定构建进行调试

### 启动超时

控制 Pydoll 等待浏览器启动和响应的时间：

```python
options = ChromiumOptions()
options.start_timeout = 20  # 秒（默认：10）
```

!!! warning "超时注意事项"
    - **太低**：浏览器可能无法完全初始化，导致启动失败
    - **太高**：挂起会阻塞您的自动化更长时间
    - **推荐**：大多数情况下 10-15 秒，慢速系统或大型浏览器配置文件 20-30 秒

### 无头模式

在没有可见 UI 的情况下运行浏览器：

```python
options = ChromiumOptions()
options.headless = True  # 自动添加 --headless 参数

# 或手动添加参数（以下两种写法二选一）
options.add_argument('--headless')
options.add_argument('--headless=new')  # 新的无头模式（Chrome 109+）
```

| 模式 | 参数 | 描述 |
|------|----------|-------------|
| **有头** | (无) | 可见的浏览器窗口（默认）|
| **经典无头** | `--headless` | 旧版无头模式 |
| **新无头** | `--headless=new` | 现代无头（Chrome 109+，更好的兼容性）|

!!! tip "新无头模式"
    `--headless=new` 模式（Chrome 109+）提供更好的现代 Web 功能兼容性，更难检测。在生产自动化中使用它。

### 页面加载状态

控制 `tab.go_to()` 何时认为页面"已加载"：

```python
from pydoll.constants import PageLoadState

options = ChromiumOptions()
options.page_load_state = PageLoadState.INTERACTIVE  # 或 PageLoadState.COMPLETE
```

| 状态 | 导航完成时 | 用例 |
|-------|---------------------------|----------|
| `COMPLETE`（默认）| 触发 `load` 事件，所有资源已加载 | 等待图像、字体、脚本 |
| `INTERACTIVE` | 触发 `DOMContentLoaded`，DOM 就绪 | 更快的导航，立即与 DOM 交互 |

```python
import asyncio
from pydoll.browser.chromium import Chrome
from pydoll.browser.options import ChromiumOptions
from pydoll.constants import PageLoadState

async def compare_load_states():
    # 完整模式 - 等待所有内容
    options_complete = ChromiumOptions()
    options_complete.page_load_state = PageLoadState.COMPLETE
    
    async with Chrome(options=options_complete) as browser:
        tab = await browser.start()
        
        import time
        start = time.time()
        await tab.go_to('https://example.com')
        complete_time = time.time() - start
        print(f"COMPLETE 模式: {complete_time:.2f}s")
    
    # 交互模式 - DOM 就绪就足够了
    options_interactive = ChromiumOptions()
    options_interactive.page_load_state = PageLoadState.INTERACTIVE
    
    async with Chrome(options=options_interactive) as browser:
        tab = await browser.start()
        
        start = time.time()
        await tab.go_to('https://example.com')
        interactive_time = time.time() - start
        print(f"INTERACTIVE 模式: {interactive_time:.2f}s")

asyncio.run(compare_load_states())
```

!!! tip "何时使用 INTERACTIVE"
    在以下情况使用 `INTERACTIVE`：
    
    - 只需要访问 DOM，不需要图像/字体
    - 抓取文本内容和结构
    - 速度至关重要
    - 页面有许多加载缓慢的资源
    
    在以下情况坚持使用 `COMPLETE`（默认）：
    
    - 截图（需要加载图像）
    - 等待 JavaScript 重型应用完全初始化
    - 测试页面加载性能

## 命令行参数参考

Chromium 支持数百个命令行开关。以下是自动化最有用的参数，按类别组织。

!!! info "完整参考"
    所有 Chromium 开关的完整列表：[Peter Beverloo 的 Chromium 命令行开关](https://peter.sh/experiments/chromium-command-line-switches/)

### 性能和资源管理

优化浏览器性能以加快自动化：

```python
options = ChromiumOptions()

# 禁用 GPU 加速（无头、Docker、CI/CD）
options.add_argument('--disable-gpu')
options.add_argument('--disable-software-rasterizer')

# 减少内存使用
options.add_argument('--disable-dev-shm-usage')  # Docker：克服 /dev/shm 大小限制
options.add_argument('--disable-extensions')
options.add_argument('--disable-background-networking')

# 禁用不必要的功能
options.add_argument('--disable-sync')  # Google 账户同步
options.add_argument('--disable-translate')
options.add_argument('--disable-background-timer-throttling')
options.add_argument('--disable-backgrounding-occluded-windows')
options.add_argument('--disable-renderer-backgrounding')

# 网络优化
options.add_argument('--disable-features=NetworkPrediction')
options.add_argument('--dns-prefetch-disable')

# 窗口和渲染
options.add_argument('--window-size=1920,1080')
options.add_argument('--window-position=0,0')
options.add_argument('--force-device-scale-factor=1')
```

| 参数 | 效果 | 何时使用 |
|----------|--------|-------------|
| `--disable-gpu` | 无 GPU 加速 | 无头、Docker、没有 GPU 的服务器 |
| `--disable-dev-shm-usage` | 使用 `/tmp` 而不是 `/dev/shm` | 共享内存小的 Docker 容器 |
| `--disable-extensions` | 不加载任何扩展 | 用于自动化的干净、快速的浏览器 |
| `--window-size=W,H` | 设置初始窗口尺寸 | 截图、一致的视口 |
| `--force-device-scale-factor=1` | 禁用高 DPI 缩放 | 跨系统一致渲染 |

### 隐蔽和指纹识别

使用这些命令行参数使您的自动化更难被检测：

| 参数 | 目的 | 示例 |
|----------|---------|---------|
| `--disable-blink-features=AutomationControlled` | 删除 `navigator.webdriver` 标志 | 隐蔽性必不可少 |
| `--user-agent=...` | 设置真实、常见的用户代理 | 匹配目标区域/设备 |
| `--use-gl=swiftshader` | 软件 WebGL 渲染器 | 避免独特的 GPU 指纹 |
| `--force-webrtc-ip-handling-policy=...` | 防止 WebRTC IP 泄露 | 使用 `disable_non_proxied_udp` |
| `--lang=en-US` | 设置浏览器语言 | 匹配目标区域 |
| `--accept-lang=en-US,en;q=0.9` | Accept-Language 标头 | 真实的语言偏好 |
| `--tz=America/New_York` | 设置时区 | 匹配目标区域 |
| `--no-first-run` | 跳过首次运行向导 | 更干净的自动化 |
| `--no-default-browser-check` | 跳过默认浏览器提示 | 避免 UI 中断 |
| `--disable-reading-from-canvas` | Canvas 指纹识别缓解 | 减少独特性 |
| `--disable-features=AudioServiceOutOfProcess` | 音频指纹识别缓解 | 减少独特性 |

!!! warning "检测军备竞赛"
    没有单一技术能保证不可检测性。结合多种策略：
    
    1. **命令行参数**（此表）
    2. **浏览器偏好设置** - [浏览器偏好设置 - 隐蔽和指纹识别](browser-preferences.md#stealth-fingerprinting)
    3. **类人交互** - [类人交互](../automation/human-interactions.md)
    4. **良好的 IP 声誉** - 使用历史干净的住宅代理

### 安全和隐私

控制安全功能和隐私设置：

```python
options = ChromiumOptions()

# 沙箱（仅在 Docker/CI 中禁用）
options.add_argument('--no-sandbox')  # 安全风险 - 仅在受控环境中使用
options.add_argument('--disable-setuid-sandbox')

# HTTPS/SSL
options.add_argument('--ignore-certificate-errors')  # 忽略 SSL 错误
options.add_argument('--ignore-ssl-errors')
options.add_argument('--allow-insecure-localhost')

# 隐私
options.add_argument('--disable-features=Translate')
options.add_argument('--disable-sync')
options.add_argument('--incognito')  # 在隐身模式下打开

# 权限自动授予（用于测试）
options.add_argument('--use-fake-ui-for-media-stream')  # 自动授予摄像头/麦克风
options.add_argument('--use-fake-device-for-media-stream')  # 使用假设备
```

!!! danger "沙箱警告"
    **`--no-sandbox` 是安全风险！** 仅在以下情况使用：
    
    - 在 Docker 容器中运行（沙箱与容器隔离冲突）
    - 具有受限权限的 CI/CD 环境
    - 您完全信任正在加载的内容
    
    **永远不要**在以下情况使用 `--no-sandbox`：
    
    - 访问不受信任的网站
    - 运行用户提交的代码
    - 在具有外部输入的生产环境中

| 参数 | 效果 | 安全影响 |
|----------|--------|-----------------|
| `--no-sandbox` | 禁用 Chrome 沙箱 | **高风险** - 允许代码执行 |
| `--ignore-certificate-errors` | 跳过 SSL 验证 | **中等风险** - 可能发生 MITM 攻击 |
| `--incognito` | 隐私浏览模式 | 更安全 - 没有持久状态 |

### 调试和开发

用于调试自动化和开发的工具：

```python
options = ChromiumOptions()

# DevTools
options.add_argument('--auto-open-devtools-for-tabs')

# 日志记录
options.add_argument('--enable-logging')
options.add_argument('--v=1')  # 详细级别（0-3）
options.add_argument('--log-level=0')  # 0=INFO, 1=WARNING, 2=ERROR

# 崩溃处理
options.add_argument('--disable-crash-reporter')
options.add_argument('--no-crash-upload')

# 启用实验性功能
options.add_argument('--enable-features=NetworkService,NetworkServiceInProcess')
options.add_argument('--enable-experimental-web-platform-features')

# JavaScript 调试
options.add_argument('--js-flags=--expose-gc')  # 公开垃圾收集器
```

!!! tip "远程调试"
    Pydoll 自动管理远程调试端口。要访问 Chrome DevTools：
    
    ```python
    async with Chrome() as browser:
        tab = await browser.start()
        
        # 获取调试端口
        port = browser._connection_port
        print(f"DevTools 可用于: http://localhost:{port}")
        
        # 在浏览器中打开此 URL 以访问 DevTools
    ```
    
    **不要**使用 `--remote-debugging-port` 参数 - 它会与 Pydoll 的内部管理冲突！

### 显示和渲染

控制浏览器如何渲染内容：

```python
options = ChromiumOptions()

# 视口和窗口
options.add_argument('--window-size=1920,1080')
options.add_argument('--window-position=0,0')
options.add_argument('--start-maximized')
options.add_argument('--start-fullscreen')

# 高 DPI 显示器
options.add_argument('--force-device-scale-factor=1')
options.add_argument('--high-dpi-support=1')

# 颜色和渲染
options.add_argument('--force-color-profile=srgb')
options.add_argument('--disable-accelerated-2d-canvas')
options.add_argument('--disable-accelerated-video-decode')

# 字体渲染
options.add_argument('--font-render-hinting=none')
options.add_argument('--disable-font-subpixel-positioning')

# 动画
options.add_argument('--disable-animations')
options.add_argument('--wm-window-animations-disabled')
```

| 参数 | 效果 | 用例 |
|----------|--------|----------|
| `--window-size=W,H` | 设置窗口尺寸 | 截图、一致的视口 |
| `--start-maximized` | 打开最大化窗口 | UI 测试、全屏捕获 |
| `--force-device-scale-factor=1` | 禁用 DPI 缩放 | 跨系统一致渲染 |
| `--disable-animations` | 无 CSS/UI 动画 | 更快的测试、减少不稳定 |

### 代理配置

为所有网络流量配置代理：

```python
options = ChromiumOptions()

# HTTP/HTTPS 代理
options.add_argument('--proxy-server=http://proxy.example.com:8080')

# 认证代理
options.add_argument('--proxy-server=http://user:pass@proxy.example.com:8080')

# SOCKS 代理
options.add_argument('--proxy-server=socks5://proxy.example.com:1080')

# 为特定主机绕过代理
options.add_argument('--proxy-bypass-list=localhost,127.0.0.1,*.local')

# 代理自动配置（PAC）文件
options.add_argument('--proxy-pac-url=http://proxy.example.com/proxy.pac')
```

!!! info "代理身份验证"
    对于需要身份验证的代理，当使用带凭据的 `--proxy-server` 参数时，Pydoll 会自动处理身份验证挑战。
    
    请参阅 **[请求拦截](../network/interception.md)** 了解 Fetch 域与代理的交互详情。

## 辅助方法

`ChromiumOptions` 为常见配置任务提供便捷方法：

### 下载管理

```python
options = ChromiumOptions()

# 设置下载目录
options.set_default_download_directory('/home/user/downloads')

# 提示下载位置
options.prompt_for_download = True  # 询问用户保存位置
options.prompt_for_download = False  # 静默下载（默认）

# 允许多个自动下载
options.allow_automatic_downloads = True  # 无需提示即允许
options.allow_automatic_downloads = False  # 阻止或询问（默认）
```

### 内容阻止

```python
options = ChromiumOptions()

# 阻止弹出窗口
options.block_popups = True  # 阻止（在大多数情况下为默认）
options.block_popups = False  # 允许

# 阻止通知
options.block_notifications = True  # 阻止请求
options.block_notifications = False  # 允许网站询问
```

### 隐私控制

```python
options = ChromiumOptions()

# 密码管理器
options.password_manager_enabled = False  # 禁用保存密码提示
options.password_manager_enabled = True  # 启用（默认）

# WebRTC 泄露保护（防止通过 WebRTC 暴露真实 IP）
options.webrtc_leak_protection = True  # 添加 --force-webrtc-ip-handling-policy=disable_non_proxied_udp
options.webrtc_leak_protection = False  # 禁用（默认）
```

!!! tip "WebRTC 泄露保护"
    即使使用代理，WebRTC 也可能泄露您的真实 IP 地址。启用 `webrtc_leak_protection` 以阻止非代理的 UDP 连接，防止 STUN 请求绕过您的代理。在使用代理进行匿名时，这是**必不可少的**。详情请参阅 **[网络基础 - WebRTC](../../deep-dive/network/network-fundamentals.md#webrtc-和-ip-泄露)**。

### 文件处理

```python
options = ChromiumOptions()

# PDF 行为
options.open_pdf_externally = True  # 下载 PDF 而不是查看
options.open_pdf_externally = False  # 在浏览器中查看（默认）
```

### 国际化

```python
options = ChromiumOptions()

# 接受语言（影响 Accept-Language 请求标头）
options.set_accept_languages('en-US,en;q=0.9,pt-BR;q=0.8')
```

## 完整配置示例

### 快速抓取配置

针对速度和资源效率进行优化：

```python
import asyncio
from pydoll.browser.chromium import Chrome
from pydoll.browser.options import ChromiumOptions
from pydoll.constants import PageLoadState

def create_fast_scraping_options() -> ChromiumOptions:
    """用于 Web 抓取的超快配置。"""
    options = ChromiumOptions()
    
    # 无头模式以提高速度
    options.headless = True
    
    # 更快的页面加载（DOM 就绪足以进行抓取）
    options.page_load_state = PageLoadState.INTERACTIVE
    
    # 禁用不必要的功能
    options.add_argument('--disable-extensions')
    options.add_argument('--disable-gpu')
    options.add_argument('--disable-dev-shm-usage')
    options.add_argument('--disable-background-networking')
    options.add_argument('--disable-sync')
    options.add_argument('--disable-translate')
    
    # 阻止减慢加载速度的内容
    options.block_notifications = True
    options.block_popups = True
    
    # 禁用图像以实现更快的加载（如果不需要）
    options.add_argument('--blink-settings=imagesEnabled=false')
    
    # 网络优化
    options.add_argument('--disable-features=NetworkPrediction')
    options.add_argument('--dns-prefetch-disable')
    
    return options

async def fast_scraping_example():
    options = create_fast_scraping_options()
    
    async with Chrome(options=options) as browser:
        tab = await browser.start()
        
        # 极快的导航和抓取
        urls = ['https://example.com', 'https://example.org', 'https://example.net']
        
        for url in urls:
            await tab.go_to(url)
            title = await tab.execute_script('return document.title')
            print(f"{url}: {title}")

asyncio.run(fast_scraping_example())
```

### 完整隐蔽配置

为了最大的不可检测性，将命令行参数与浏览器偏好设置相结合：

```python
import asyncio
from pydoll.browser.chromium import Chrome
from pydoll.browser.options import ChromiumOptions

def create_full_stealth_options() -> ChromiumOptions:
    """结合参数和偏好设置的完整隐蔽配置。"""
    options = ChromiumOptions()
    
    # ===== 命令行参数 =====
    
    # 核心隐蔽
    options.add_argument('--disable-blink-features=AutomationControlled')
    options.add_argument('--disable-features=IsolateOrigins,site-per-process')
    
    # 用户代理（使用最新的、常见的）
    options.add_argument('--user-agent=Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/130.0.0.0 Safari/537.36')
    
    # 语言和区域
    options.add_argument('--lang=en-US')
    options.add_argument('--accept-lang=en-US,en;q=0.9')
    
    # WebGL（软件渲染器以避免独特的 GPU 签名）
    options.add_argument('--use-gl=swiftshader')
    options.add_argument('--disable-features=WebGLDraftExtensions')
    
    # WebRTC IP 泄露防护
    options.webrtc_leak_protection = True

    # 权限和首次运行
    options.add_argument('--no-first-run')
    options.add_argument('--no-default-browser-check')
    
    # 窗口大小（常见分辨率）
    options.add_argument('--window-size=1920,1080')
    
    # ===== 浏览器偏好设置 =====
    # 有关全面的浏览器偏好设置配置，请参阅：
    # https://pydoll.tech/docs/features/configuration/browser-preferences/#stealth-fingerprinting
    
    return options

async def stealth_automation_example():
    options = create_full_stealth_options()
    
    async with Chrome(options=options) as browser:
        tab = await browser.start()
        
        # 在机器人检测网站上测试
        await tab.go_to('https://bot.sannysoft.com')
        await asyncio.sleep(5)
        
        # 您的自动化在这里...

asyncio.run(stealth_automation_example())
```

!!! warning "用户代理一致性至关重要"
    设置 `--user-agent` 只会更改 **HTTP 标头**，但检测系统还会检查 `navigator.userAgent`、`navigator.platform`、`navigator.vendor` 和其他 JavaScript 属性。**这些值之间的不一致是强烈的机器人指标。**
    
    例如，如果您的 HTTP User-Agent 说"Windows"但 `navigator.platform` 说"Linux"，您将立即被标记。
    
    **解决方案**：您还必须通过 CDP 覆盖 JavaScript 属性以保持一致性。请参阅 **[浏览器指纹识别 - 用户代理一致性](../../deep-dive/fingerprinting/browser-fingerprinting.md#user-agent-consistency)** 获取详细说明和使用 `Page.addScriptToEvaluateOnNewDocument` 的实现。
    
    这就是为什么全面的隐蔽需要命令行参数**和**浏览器偏好设置配置。

!!! tip "完整隐蔽策略"
    命令行参数只是解决方案的一部分。为了最大的隐蔽性：
    
    1. **使用上述参数**（navigator.webdriver、WebGL、WebRTC）
    2. **配置浏览器偏好设置** - 请参阅[浏览器偏好设置 - 隐蔽和指纹识别](browser-preferences.md#stealth-fingerprinting)
    3. **类人交互** - 请参阅[类人交互](../automation/human-interactions.md)
    4. **良好的代理/IP 声誉** - 使用住宅代理

### Docker/CI 配置

用于容器化环境：

```python
import asyncio
from pydoll.browser.chromium import Chrome
from pydoll.browser.options import ChromiumOptions
from pydoll.constants import PageLoadState

def create_docker_options() -> ChromiumOptions:
    """用于 Docker 容器和 CI/CD 的配置。"""
    options = ChromiumOptions()
    
    # Docker 所需
    options.headless = True
    options.add_argument('--no-sandbox')  # 沙箱与容器隔离冲突
    options.add_argument('--disable-dev-shm-usage')  # 克服 /dev/shm 大小限制
    
    # 稳定性
    options.add_argument('--disable-gpu')
    options.add_argument('--disable-software-rasterizer')
    
    # 内存优化
    options.add_argument('--disable-extensions')
    options.add_argument('--disable-background-networking')
    
    # 为 CI 更快的页面加载
    options.page_load_state = PageLoadState.INTERACTIVE
    
    # 为慢速 CI 运行器增加超时
    options.start_timeout = 20
    
    # 崩溃处理
    options.add_argument('--disable-crash-reporter')
    
    return options

async def ci_testing_example():
    options = create_docker_options()
    
    async with Chrome(options=options) as browser:
        tab = await browser.start()
        
        # 运行您的测试...
        await tab.go_to('https://example.com')
        assert await tab.execute_script('return document.title') == 'Example Domain'

asyncio.run(ci_testing_example())
```

## 故障排除

### 浏览器无法启动

```python
# 增加超时
options.start_timeout = 30

# 检查二进制位置
options.binary_location = '/path/to/chrome'

# Docker/CI 问题
options.add_argument('--no-sandbox')
options.add_argument('--disable-dev-shm-usage')
```

### 性能慢

```python
# 如果不需要则禁用 GPU
options.add_argument('--disable-gpu')

# 禁用图像
options.add_argument('--blink-settings=imagesEnabled=false')

# 使用 INTERACTIVE 加载状态
options.page_load_state = PageLoadState.INTERACTIVE

# 禁用不必要的功能
options.add_argument('--disable-extensions')
options.add_argument('--disable-background-networking')
```

### Docker 中的内存问题

```python
# Docker 必需
options.add_argument('--disable-dev-shm-usage')

# 减少内存占用
options.add_argument('--disable-extensions')
options.add_argument('--disable-gpu')
options.add_argument('--single-process')  # 最后手段（可能不稳定）
```

## 进一步阅读

- **[浏览器偏好设置](browser-preferences.md)** - Chromium 的内部偏好系统
- **[隐蔽自动化](../automation/human-interactions.md)** - 类人交互
- **[上下文](../browser-management/contexts.md)** - 隔离的浏览上下文
- **[网络拦截](../network/interception.md)** - 请求/响应操作

!!! tip "实验是关键"
    浏览器配置高度依赖于您的具体用例。从这里的示例开始，然后根据您的需求进行调整。使用 `browser._connection_port` 访问 DevTools 并检查浏览器内部发生的情况。


================================================
FILE: docs/zh/features/configuration/browser-preferences.md
================================================
# 自定义浏览器首选项

Pydoll 最强大的功能之一是直接访问 Chromium 的内部首选项系统。与传统的浏览器自动化工具只公开有限的选项不同，Pydoll 为您提供与扩展程序和企业管理员相同级别的控制权，允许您配置 Chromium 源代码中提供的**任何**浏览器设置。

## 为什么浏览器首选项很重要

浏览器首选项控制 Chromium 行为的方方面面：

- **性能**：禁用不需要的功能以加快页面加载速度
- **隐私**：控制浏览器收集和发送的数据
- **自动化**：删除破坏工作流程的用户提示和确认
- **隐身**：创建逼真的浏览器指纹以避免检测
- **企业**：应用通常只能通过组策略获得的策略

!!! info "直接访问的力量"
    大多数自动化工具只公开 10-20 个常见设置。Pydoll 为您提供**数百个**首选项的访问权限，从下载行为到搜索建议，从网络预测到插件管理。如果 Chromium 可以做到，您就可以配置它。

## 快速开始

```python
import asyncio
from pydoll.browser.chromium import Chrome
from pydoll.browser.options import ChromiumOptions

async def preferences_example():
    options = ChromiumOptions()
    
    # 使用字典设置首选项
    options.browser_preferences = {
        'download': {
            'default_directory': '/tmp/downloads',
            'prompt_for_download': False
        },
        'profile': {
            'default_content_setting_values': {
                'notifications': 2  # 阻止通知
            }
        }
    }
    
    async with Chrome(options=options) as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com')
        
        # 下载自动保存到 /tmp/downloads
        # 不会出现通知提示

asyncio.run(preferences_example())
```

## 了解浏览器首选项

### 什么是首选项？

Chromium 将所有用户可配置的设置存储在一个名为 `Preferences` 的 JSON 文件中，该文件位于浏览器的用户数据目录中。此文件包含**所有内容**，从您的主页 URL 到图像是否自动加载。

**典型位置：**

- **Linux**: `~/.config/google-chrome/Default/Preferences`
- **macOS**: `~/Library/Application Support/Google/Chrome/Default/Preferences`
- **Windows**: `%LOCALAPPDATA%\Google\Chrome\User Data\Default\Preferences`

### 首选项文件结构

首选项文件是一个嵌套的 JSON 对象：

```json
{
  "download": {
    "default_directory": "/home/user/Downloads",
    "prompt_for_download": true
  },
  "profile": {
    "default_content_setting_values": {
      "notifications": 1,
      "popups": 0
    },
    "password_manager_enabled": true
  },
  "search": {
    "suggest_enabled": true
  },
  "net": {
    "network_prediction_options": 1
  }
}
```

Chromium 源代码中的每个点分隔的首选项名称都映射到嵌套的 JSON 路径：

- `download.default_directory` → `{'download': {'default_directory': ...}}`
- `profile.password_manager_enabled` → `{'profile': {'password_manager_enabled': ...}}`

### Chromium 如何使用首选项

当 Chromium 启动时：

1. **读取**磁盘上的首选项文件
2. **应用**这些设置来配置浏览器行为
3. 当用户通过 UI 更改设置时**更新**该文件
4. **回退**到默认值（如果缺少首选项）

Pydoll 通过在浏览器启动前预填充首选项文件来拦截步骤 1，确保您的自定义设置从第一次页面加载开始就被应用。

## 在 Pydoll 中的工作原理

### 设置首选项

使用 `browser_preferences` 属性设置任何首选项：

```python
from pydoll.browser.options import ChromiumOptions

options = ChromiumOptions()

# 直接赋值 - 与现有首选项合并
options.browser_preferences = {
    'download': {'default_directory': '/tmp'},
    'intl': {'accept_languages': 'pt-BR,en-US'}
}

# 多次赋值会合并，而不是替换
options.browser_preferences = {
    'profile': {'password_manager_enabled': False}
}

# 现在两组首选项都处于活动状态
```

!!! warning "首选项是合并的，而不是替换的"
    当您多次设置 `browser_preferences` 时，新首选项会与现有首选项**合并**。只有您设置的特定键会被更新；其他所有内容都会保留。
    
    ```python
    options.browser_preferences = {'download': {'prompt': False}}
    options.browser_preferences = {'profile': {'password_manager_enabled': False}}
    
    # 结果：两个首选项都已设置
    # {'download': {'prompt': False}, 'profile': {'password_manager_enabled': False}}
    ```

### 嵌套路径语法

首选项使用嵌套字典，镜像 Chromium 的点表示法：

```python
# Chromium 源代码常量：
# const char kDownloadDefaultDirectory[] = "download.default_directory";

# 转换为 Python 字典：
options.browser_preferences = {
    'download': {
        'default_directory': '/path/to/downloads'
    }
}
```

嵌套越深，首选项越具体：

```python
# 顶层：profile
# 第二层：default_content_setting_values  
# 第三层：notifications

options.browser_preferences = {
    'profile': {
        'default_content_setting_values': {
            'notifications': 2,  # 阻止
            'geolocation': 2,    # 阻止
            'media_stream': 2    # 阻止
        }
    }
}
```

## 实际用例

### 1. 性能优化

禁用资源密集型功能以实现更快的自动化：

```python
import asyncio
from pydoll.browser.chromium import Chrome
from pydoll.browser.options import ChromiumOptions

async def performance_optimized_browser():
    options = ChromiumOptions()
    options.browser_preferences = {
        # 禁用网络预测和预取
        'net': {
            'network_prediction_options': 2  # 2 = 从不预测
        },
        # 禁用图像加载
        'profile': {
            'default_content_setting_values': {
                'images': 2  # 2 = 阻止，1 = 允许
            }
        },
        # 禁用插件
        'webkit': {
            'webprefs': {
                'plugins_enabled': False
            }
        },
        # 禁用拼写检查
        'browser': {
            'enable_spellchecking': False
        }
    }
    
    async with Chrome(options=options) as browser:
        tab = await browser.start()
        
        # 在没有图像和不必要功能的情况下，页面加载速度提高 3-5 倍
        await tab.go_to('https://example.com')
        print("快速加载完成！")

asyncio.run(performance_optimized_browser())
```

!!! tip "性能影响"
    仅禁用图像就可以将图像密集型网站的页面加载时间减少 50-70%。结合禁用预取、拼写检查和插件，可实现最大速度。

### 2. 隐私与反跟踪

创建注重隐私的浏览器配置：

```python
import asyncio
from pydoll.browser.chromium import Chrome
from pydoll.browser.options import ChromiumOptions

async def privacy_focused_browser():
    options = ChromiumOptions()
    options.browser_preferences = {
        # 启用请勿跟踪
        'enable_do_not_track': True,
        
        # 禁用引荐来源
        'enable_referrers': False,
        
        # 禁用安全浏览（将 URL 发送到 Google）
        'safebrowsing': {
            'enabled': False
        },
        
        # 禁用密码管理器并阻止第三方 cookie
        # （同一字典中 'profile' 键只能出现一次；重复的键会被后者静默覆盖）
        'profile': {
            'password_manager_enabled': False,
            'block_third_party_cookies': True,
            'cookie_controls_mode': 1
        },
        
        # 禁用自动填充
        'autofill': {
            'enabled': False,
            'profile_enabled': False
        },
        
        # 禁用搜索建议（将查询发送到搜索引擎）
        'search': {
            'suggest_enabled': False
        },
        
        # 禁用遥测和指标
        'user_experience_metrics': {
            'reporting_enabled': False
        }
    }
    
    async with Chrome(options=options) as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com')
        print("注重隐私的浏览器已准备就绪！")

asyncio.run(privacy_focused_browser())
```

### 3. 静默下载

自动化文件下载，无需用户交互：

```python
import asyncio
from pathlib import Path
from pydoll.browser.chromium import Chrome
from pydoll.browser.options import ChromiumOptions

async def silent_download_automation():
    download_dir = Path.home() / 'automation_downloads'
    download_dir.mkdir(exist_ok=True)
    
    options = ChromiumOptions()
    options.browser_preferences = {
        'download': {
            'default_directory': str(download_dir),
            'prompt_for_download': False,
            'directory_upgrade': True
        },
        'profile': {
            'default_content_setting_values': {
                'automatic_downloads': 1  # 1 = 允许，2 = 阻止
            }
        },
        # 始终下载 PDF 而不是在查看器中打开
        'plugins': {
            'always_open_pdf_externally': True
        }
    }
    
    async with Chrome(options=options) as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com/downloads')
        
        # 点击下载链接 - 文件自动保存
        download_link = await tab.find(text='Download Report')
        await download_link.click()
        
        await asyncio.sleep(3)
        print(f"文件已下载到：{download_dir}")

asyncio.run(silent_download_automation())
```

### 4. 阻止侵入性 UI 元素

删除破坏自动化的弹出窗口、通知和提示：

```python
import asyncio
from pydoll.browser.chromium import Chrome
from pydoll.browser.options import ChromiumOptions

async def clean_ui_browser():
    options = ChromiumOptions()
    options.browser_preferences = {
        'profile': {
            'default_content_setting_values': {
                'notifications': 2,      # 阻止通知
                'popups': 0,             # 阻止弹出窗口
                'geolocation': 2,        # 阻止位置请求
                'media_stream': 2,       # 阻止摄像头/麦克风访问
                'media_stream_mic': 2,   # 阻止麦克风
                'media_stream_camera': 2 # 阻止摄像头
            }
        },
        # 禁用翻译提示
        'translate': {
            'enabled': False
        },
        # 禁用保存密码提示
        'credentials_enable_service': False,
        
        # 将 DevTools 设为独立窗口（undocked）；注意：此首选项不会移除“Chrome 正在被自动化软件控制”信息栏
        'devtools': {
            'preferences': {
                'currentDockState': '"undocked"'
            }
        }
    }
    
    async with Chrome(options=options) as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com')
        # 没有弹出窗口，没有提示，干净的自动化！

asyncio.run(clean_ui_browser())
```

### 5. 国际化与本地化

配置语言和区域设置首选项：

```python
import asyncio
from pydoll.browser.chromium import Chrome
from pydoll.browser.options import ChromiumOptions

async def localized_browser():
    options = ChromiumOptions()
    options.browser_preferences = {
        # 接受语言（优先顺序）
        'intl': {
            'accept_languages': 'pt-BR,pt,en-US,en'
        },
        
        # 拼写检查语言
        'spellcheck': {
            'dictionaries': ['pt-BR', 'en-US']
        },
        
        # 翻译设置
        'translate': {
            'enabled': True
        },
        'translate_blocked_languages': ['en'],  # 不提供翻译英语
        
        # 默认字符编码
        'default_charset': 'UTF-8'
    }
    
    async with Chrome(options=options) as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com')
        # 为巴西葡萄牙语配置的浏览器

asyncio.run(localized_browser())
```

## 辅助方法

对于常见场景，Pydoll 提供便利方法：

```python
from pydoll.browser.options import ChromiumOptions

options = ChromiumOptions()

# 下载管理
options.set_default_download_directory('/tmp/downloads')
options.prompt_for_download = False
options.allow_automatic_downloads = True
options.open_pdf_externally = True

# 内容阻止
options.block_notifications = True
options.block_popups = True

# 隐私
options.password_manager_enabled = False

# 国际化
options.set_accept_languages('pt-BR,en-US,en')
```

这些方法是为您设置正确嵌套首选项的快捷方式：

```python
# 这个辅助方法：
options.set_default_download_directory('/tmp')

# 等同于：
options.browser_preferences = {
    'download': {
        'default_directory': '/tmp'
    }
}
```

!!! tip "将辅助方法与直接首选项结合使用"
    使用辅助方法处理常见设置，使用 `browser_preferences` 处理高级配置：
    
    ```python
    # 从辅助方法开始
    options.block_notifications = True
    options.prompt_for_download = False
    
    # 添加高级首选项
    options.browser_preferences = {
        'net': {'network_prediction_options': 2},
        'webkit': {'webprefs': {'plugins_enabled': False}}
    }
    ```

## 在 Chromium 源代码中查找首选项

### 源代码参考

Chromium 在 `pref_names.cc` 中定义所有首选项常量：

**官方源代码**：[chromium/src/+/main/chrome/common/pref_names.cc](https://chromium.googlesource.com/chromium/src/+/main/chrome/common/pref_names.cc)

### 阅读源代码

首选项常量使用点表示法，直接映射到嵌套字典：

```cpp
// 来自 Chromium 源代码 (pref_names.cc)：
const char kDownloadDefaultDirectory[] = "download.default_directory";
const char kPromptForDownload[] = "download.prompt_for_download";
const char kSafeBrowsingEnabled[] = "safebrowsing.enabled";
const char kBlockThirdPartyCookies[] = "profile.block_third_party_cookies";
```

**转换为 Python：**

```python
options.browser_preferences = {
    'download': {
        'default_directory': '/path/to/dir',
        'prompt_for_download': False
    },
    'safebrowsing': {
        'enabled': False
    },
    'profile': {
        'block_third_party_cookies': True
    }
}
```

### 发现过程

1. **搜索源代码**：访问 [pref_names.cc](https://chromium.googlesource.com/chromium/src/+/main/chrome/common/pref_names.cc)
2. **找到您的首选项**：搜索关键字（例如 "download"、"password"、"notification"）
3. **记录常量名称**：例如 `kDownloadDefaultDirectory[] = "download.default_directory"`
4. **转换为字典**：按点分割并创建嵌套结构

**示例 - 查找通知首选项：**

```cpp
// 在 pref_names.cc 中搜索 "notification"：
const char kPushMessagingAppIdentifierMap[] = 
    "gcm.push_messaging_application_id_map";
const char kDefaultNotificationsSetting[] = 
    "profile.default_content_setting_values.notifications";
```

```python
# 变成：
options.browser_preferences = {
    'profile': {
        'default_content_setting_values': {
            'notifications': 2  # 2 = 阻止，1 = 允许，0 = 询问
        }
    }
}
```

### 常见首选项模式

| 类别 | 示例常量 | Python 字典路径 |
|----------|-----------------|------------------|
| 下载 | `download.default_directory` | `{'download': {'default_directory': ...}}` |
| 内容设置 | `profile.default_content_setting_values.X` | `{'profile': {'default_content_setting_values': {'X': ...}}}` |
| 网络 | `net.network_prediction_options` | `{'net': {'network_prediction_options': ...}}` |
| 隐私 | `safebrowsing.enabled` | `{'safebrowsing': {'enabled': ...}}` |
| 会话 | `session.restore_on_startup` | `{'session': {'restore_on_startup': ...}}` |

!!! warning "未记录的首选项"
    并非所有首选项都有文档。有些是：
    
    - **实验性**：可能在未来的 Chromium 版本中更改或删除
    - **内部**：由 Chromium 的内部系统使用
    - **平台特定**：仅在某些操作系统上工作
    
    在依赖未记录的首选项之前，请彻底测试。

## 有用的首选项参考

以下是从 Chromium 的 `pref_names.cc` 中精选的有趣且有用的首选项列表：

### 内容与媒体设置

```python
options.browser_preferences = {
    'profile': {
        'default_content_setting_values': {
            # 内容控制 (0=询问，1=允许，2=阻止)
            'cookies': 1,                    # 允许 cookie
            'images': 1,                     # 允许图像（2 为阻止）
            'javascript': 1,                 # 允许 JavaScript（2 为阻止）
            'plugins': 2,                    # 阻止插件（Flash 等）
            'popups': 0,                     # 阻止弹出窗口
            'geolocation': 2,                # 阻止位置请求
            'notifications': 2,              # 阻止通知
            'media_stream': 2,               # 阻止摄像头/麦克风
            'media_stream_mic': 2,           # 仅阻止麦克风
            'media_stream_camera': 2,        # 仅阻止摄像头
            'automatic_downloads': 1,        # 允许自动下载
            'midi_sysex': 2,                 # 阻止 MIDI 访问
            'clipboard': 1,                  # 允许剪贴板访问
            'sensors': 2,                    # 阻止运动传感器
            'usb_guard': 2,                  # 阻止 USB 设备访问
            'serial_guard': 2,               # 阻止串行端口访问
            'bluetooth_guard': 2,            # 阻止蓝牙
            'file_system_write_guard': 2,    # 阻止文件系统写入
        }
    }
}
```

### 网络与性能

```python
options.browser_preferences = {
    'net': {
        # 网络预测：0=始终，1=仅 WiFi，2=从不
        'network_prediction_options': 2,
        
        # 快速检查服务器可达性
        'quick_check_enabled': False
    },
    
    # DNS 预取
    'dns_prefetching': {
        'enabled': False  # 禁用以减少网络流量
    },
    
    # 预连接到搜索结果
    'search': {
        'suggest_enabled': False,           # 禁用搜索建议
        'instant_enabled': False            # 禁用即时结果
    },
    
    # 备用错误页面
    'alternate_error_pages': {
        'enabled': False  # 不建议 404 的替代方案
    }
}
```

### 下载首选项

```python
options.browser_preferences = {
    'download': {
        'default_directory': '/path/to/downloads',
        'prompt_for_download': False,
        'directory_upgrade': True,
        'extensions_to_open': '',           # 自动打开的文件类型
        'open_pdf_externally': True,        # 不使用内部 PDF 查看器
    },
    
    'download_bubble': {
        'partial_view_enabled': True        # 显示下载进度气泡
    },
    
    'safebrowsing': {
        'enabled': False  # 禁用安全浏览下载警告
    }
}
```

### 隐私与安全

```python
options.browser_preferences = {
    # 请勿跟踪
    'enable_do_not_track': True,
    
    # 引荐来源
    'enable_referrers': False,
    
    # 安全浏览
    'safebrowsing': {
        'enabled': False,                   # 禁用安全浏览
        'enhanced': False                   # 禁用增强保护
    },
    
    # 隐私沙盒（Google 的 cookie 替代品）
    'privacy_sandbox': {
        'apis_enabled': False,
        'topics_enabled': False,
        'fledge_enabled': False
    },
    
    # 第三方 cookie
    'profile': {
        'block_third_party_cookies': True,
        'cookie_controls_mode': 1,          # 0=关闭，1=阻止第三方 cookie，2=仅在隐身模式下阻止
        
        # 内容设置
        'default_content_setting_values': {
            'cookies': 1,
            'third_party_cookie_blocking_enabled': True
        }
    },
    
    # WebRTC（可能泄露真实 IP）
    'webrtc': {
        'ip_handling_policy': 'default_public_interface_only',
        'multiple_routes_enabled': False,
        'nonproxied_udp_enabled': False
    }
}
```

### 自动填充与密码

```python
options.browser_preferences = {
    'autofill': {
        'enabled': False,                   # 禁用表单自动填充
        'profile_enabled': False,           # 禁用地址自动填充
        'credit_card_enabled': False,       # 禁用信用卡自动填充
        'credit_card_fido_auth_enabled': False
    },
    
    'profile': {
        'password_manager_enabled': False,
        'password_manager_leak_detection': False
    },
    
    'credentials_enable_service': False,
    'credentials_enable_autosignin': False
}
```

### 浏览器行为与 UI

```python
import time

options.browser_preferences = {
    # 主页和启动
    'homepage': 'https://www.google.com',
    'homepage_is_newtabpage': False,
    'newtab_page_location_override': 'https://www.google.com',
    
    'session': {
        'restore_on_startup': 1,            # 0=主页（已弃用），1=恢复上次会话，4=特定 URL，5=新标签页
        'startup_urls': ['https://www.google.com'],
        'session_data_status': 3            # 会话数据状态（内部）
    },
    
    # 欢迎页面和窗口
    'browser': {
        'has_seen_welcome_page': True,      # 跳过欢迎屏幕
        'window_placement': {
            'bottom': 1032,                 # 窗口底部位置
            'left': 2247,                   # 窗口左侧位置
            'right': 3192,                  # 窗口右侧位置
            'top': 31,                      # 窗口顶部位置
            'maximized': False,             # 窗口最大化
            'work_area_bottom': 1080,       # 屏幕工作区底部
            'work_area_left': 1920,         # 屏幕工作区左侧
            'work_area_right': 3840,        # 屏幕工作区右侧
            'work_area_top': 0              # 屏幕工作区顶部
        }
    },
    
    # 扩展
    'extensions': {
        'ui': {
            'developer_mode': False
        },
        'alerts': {
            'initialized': True
        },
        'theme': {
            'system_theme': 2               # 0=默认，1=浅色，2=深色
        },
        'last_chrome_version': '130.0.6723.91'  # 必须与您的版本匹配
    },
    
    # 翻译
    'translate': {
        'enabled': False                    # 禁用翻译提示
    },
    'translate_blocked_languages': ['en'],  # 从不翻译英语
    'translate_site_blacklist': [],         # 旧版（使用 blocklist_with_time）
    
    # 书签
    'bookmark_bar': {
        'show_on_all_tabs': False
    },
    
    # 标签页
    'tabs': {
        'new_tab_position': 0               # 0=右侧，1=当前之后
    },
    'pinned_tabs': [],                      # 固定标签页 URL 列表
    
    # 新标签页（Chrome 格式的时间戳）
    'NewTabPage': {
        'PrevNavigationTime': str(int(time.time() * 1000000) + 11644473600000000)  # Chrome 时间戳
    },
    'ntp': {
        'num_personal_suggestions': 6       # 建议数量（0-10）
    },
    
    # 工具栏自定义
    'toolbar': {
        'pinned_chrome_labs_migration_complete': True
    }
}
```

!!! info "Chrome 时间戳格式"
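    Chrome 使用与 Windows FILETIME 相同的纪元（1601 年 1 月 1 日 UTC），但以**微秒**为单位计数（FILETIME 本身以 100 纳秒为单位）。常量 `11644473600000000` 是 1601 年纪元与 Unix 纪元（1970 年 1 月 1 日）之间相差的微秒数。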
    
    转换 Python 时间戳：
    ```python
    import time
    chrome_time = int(time.time() * 1000000) + 11644473600000000
    ```

### 拼写与语言

```python
options.browser_preferences = {
    'browser': {
        'enable_spellchecking': False       # 禁用拼写检查
    },
    
    'spellcheck': {
        'dictionaries': ['en-US', 'pt-BR'], # 拼写检查语言
        'dictionary': '',                   # 旧版首选项（保持为空）
        'use_spelling_service': False       # 不发送到 Google
    },
    
    'intl': {
        'accept_languages': 'pt-BR,pt,en-US,en',
        'selected_languages': 'pt-BR,pt,en-US,en'  # 明确选择的
    },
    
    # 翻译行为和历史
    'translate': {
        'enabled': True
    },
    'translate_accepted_count': {
        'pt-BR': 0,
        'es': 5                             # 接受了 5 次西班牙语翻译
    },
    'translate_denied_count_for_language': {
        'en': 10                            # 从不翻译英语
    },
    'translate_ignored_count_for_language': {
        'en': 1
    },
    'translate_site_blocklist_with_time': {},  # 从不翻译的网站
    
    # 无障碍字幕语言
    'accessibility': {
        'captions': {
            'live_caption_language': 'pt-BR'
        }
    },
    
    # 语言模型计数器（使用统计）
    'language_model_counters': {
        'en': 2,                            # 英语单词计数
        'pt': 10                            # 葡萄牙语单词计数
    }
}
```

!!! info "语言模型计数器"
    这些计数器跟踪 Chrome 机器学习模型的语言使用统计信息：
    
    - 用于预测用户语言偏好
    - 影响搜索建议和自动完成
    - 更高的计数表示更频繁的使用
    - 真实值：偶尔使用 0-1000，大量使用 1000+

### 无障碍

```python
options.browser_preferences = {
    'accessibility': {
        'image_labels_enabled': False       # 不从 Google 获取图像标签
    },
    
    # 字体设置
    'webkit': {
        'webprefs': {
            'default_font_size': 16,
            'default_fixed_font_size': 13,
            'minimum_font_size': 0,
            'minimum_logical_font_size': 6,
            'fonts': {
                'standard': {
                    'Zyyy': 'Arial'
                },
                'serif': {
                    'Zyyy': 'Times New Roman'
                }
            }
        }
    }
}
```

### 媒体与音频

```python
options.browser_preferences = {
    # 音频
    'audio': {
        'mute_enabled': False               # 启动时音频开/关
    },
    
    # 自动播放
    'media': {
        'autoplay_policy': 0,               # 0=允许，1=用户手势，2=文档用户激活
        'video_fullscreen_orientation_lock': False
    },
    
    # WebGL
    'webkit': {
        'webprefs': {
            'webgl_enabled': True,          # 启用/禁用 WebGL
            'webgl2_enabled': True
        }
    }
}
```

### 打印

```python
options.browser_preferences = {
    'printing': {
        'print_preview_sticky_settings': {
            'appState': '{\"version\":2,\"recentDestinations\":[{\"id\":\"Save as PDF\",\"origin\":\"local\"}],\"marginsType\":3,\"customMargins\":{\"marginTop\":63,\"marginRight\":192,\"marginBottom\":240,\"marginLeft\":260}}'
        }
    },
    
    'savefile': {
        'default_directory': '/tmp'         # PDF 的默认保存位置
    }
}
```

!!! tip "打印 appState 格式"
    `appState` 是一个 JSON 编码的字符串。为了更容易操作：
    
    ```python
    import json
    
    app_state = {
        'version': 2,
        'recentDestinations': [{
            'id': 'Save as PDF',
            'origin': 'local'
        }],
        'marginsType': 3,                   # 0=默认，1=无边距，2=最小，3=自定义
        'customMargins': {
            'marginTop': 63,
            'marginRight': 192,
            'marginBottom': 240,
            'marginLeft': 260
        },
        'isHeaderFooterEnabled': False,
        'scaling': '100',
        'scalingType': 3,                   # 0=默认，1=适合页面，2=适合纸张，3=自定义
        'isColorEnabled': True,
        'isDuplexEnabled': False,
        'isCssBackgroundEnabled': True,
        'dpi': {
            'horizontal_dpi': 300,
            'vertical_dpi': 300,
            'is_default': True
        },
        'mediaSize': {
            'name': 'ISO_A4',
            'width_microns': 210000,
            'height_microns': 297000,
            'custom_display_name': 'A4',
            'is_default': True
        }
    }
    
    # 转换为字符串用于 appState
    options.browser_preferences = {
        'printing': {
            'print_preview_sticky_settings': {
                'appState': json.dumps(app_state)
            }
        }
    }
    ```

### WebRTC 与点对点

```python
options.browser_preferences = {
    'webrtc': {
        # IP 处理策略
        'ip_handling_policy': 'default_public_interface_only',
        
        # UDP 传输选项
        'udp_port_range': '10000-10100',    # 限制 UDP 端口范围
        
        # 禁用点对点
        'multiple_routes_enabled': False,
        'nonproxied_udp_enabled': False,
        
        # 文本日志收集
        'text_log_collection_allowed': False
    }
}
```

### 站点隔离与安全

```python
options.browser_preferences = {
    # 站点隔离
    'site_isolation': {
        'isolate_origins': '',              # 要隔离的逗号分隔的源
        'site_per_process': True            # 完整站点隔离
    },
    
    # 混合内容
    'mixed_content': {
        'auto_upgrade_enabled': True        # 将 HTTP 升级到 HTTPS
    },
    
    # SSL/TLS
    'ssl': {
        'rev_checking': {
            'enabled': True                 # 检查证书吊销
        }
    }
}
```

### 安装与国家元数据

```python
import uuid
from pydoll.browser.options import ChromiumOptions

options = ChromiumOptions()
options.browser_preferences = {
    # 安装时的国家 ID（影响默认设置和语言环境）
    'countryid_at_install': 16978,          # 因国家而异（例如，巴西为 16978）
    
    # 默认应用安装状态
    'default_apps_install_state': 3,        # 0=未安装，1=已安装，3=已迁移
    
    # 企业配置文件 GUID（用于托管浏览器）
    'enterprise_profile_guid': str(uuid.uuid4()),
    
    # 默认搜索提供商
    'default_search_provider': {
        'guid': ''                          # 空表示默认（Google）
    }
}
```

!!! info "国家 ID 值"
    `countryid_at_install` 是一个数字代码，表示首次安装 Chrome 的国家。它由两个字母的 ISO 3166-1 国家代码计算得出：`(ord(c1) << 8) | ord(c2)`。
    
    - **16978**：巴西 (BR)
    - **21843**：美国 (US)
    - **18242**：英国 (GB)
    - **17477**：德国 (DE)
    - **19024**：日本 (JP)
    - 还有许多其他...
    
    这会影响默认语言、货币和区域设置。为了实现逼真的指纹识别，请将其与目标区域匹配。

### 实验性功能

```python
options.browser_preferences = {
    # Chrome Labs 实验
    'browser': {
        'labs': {
            'enabled': False
        }
    },
    
    # 预加载
    'preload': {
        'enabled': False                    # 禁用页面预加载
    },
    
    # 平滑滚动
    'smooth_scrolling': {
        'enabled': True
    },
    
    # 硬件加速
    'hardware_acceleration_mode': {
        'enabled': True                     # 禁用以提高无头性能
    }
}
```

### DevTools 与开发者选项

```python
options.browser_preferences = {
    'devtools': {
        'preferences': {
            # DevTools 外观
            'currentDockState': '"right"',              # "bottom"、"right"、"undocked"
            'uiTheme': '"dark"',                        # "dark"、"light"、"system"
            
            # 控制台设置
            'consoleTimestampsEnabled': 'true',
            'preserveConsoleLog': 'true',
            
            # 网络面板
            'network.disableCache': 'false',
            'network.color-code-resource-types': 'true',
            'network-panel-split-view-state': '{"vertical":{"size":0}}',
            
            # 源映射
            'cssSourceMapsEnabled': 'true',
            'jsSourceMapsEnabled': 'true',
            
            # 元素面板
            'elements.styles.sidebar.width': '{"vertical":{"size":0,"showMode":"OnlyMain"}}',
            
            # 检查器版本控制
            'inspectorVersion': '37',
            
            # 选定的面板
            'panel-selected-tab': '"network"',          # 最后打开的面板
            
            # 请求信息展开的类别
            'request-info-general-category-expanded': 'true',
            'request-info-request-headers-category-expanded': 'true',
            'request-info-response-headers-category-expanded': 'true'
        },
        'synced_preferences_sync_disabled': {
            'adorner-settings': '[{"adorner":"grid","isEnabled":true},{"adorner":"flex","isEnabled":true}]',
            'syncedInspectorVersion': '37'
        }
    },
    
    # GCM（Google Cloud Messaging）
    'gcm': {
        'product_category_for_subtypes': 'com.chrome.linux'  # com.chrome.windows、com.chrome.macos
    }
}
```

!!! tip "DevTools 首选项格式"
    DevTools 首选项使用独特的格式，其中布尔值和字符串值存储为 **JSON 编码的字符串**（例如 `'true'` 而不是 `True`，`'"dark"'` 而不是 `'dark'`）。这是因为 DevTools 设置直接序列化为 JSON。
    
    对于复杂对象，双重编码：
    ```python
    import json
    
    # 创建对象
    split_view = {'vertical': {'size': 0}}
    
    # 为 DevTools 双重编码
    devtools_value = json.dumps(json.dumps(split_view))
    # 结果：'"{\\"vertical\\":{\\"size\\":0}}"'
    ```

### 同步与登录控制

```python
import time
from pydoll.browser.options import ChromiumOptions

options = ChromiumOptions()
options.browser_preferences = {
    'signin': {
        'allowed': True,                        # 允许登录 Google
        'cookie_clear_on_exit_migration_notice_complete': True
    },
    
    'sync': {
        'data_type_status_for_sync_to_signin': {
            'bookmarks': False,
            'history': False,
            'passwords': False,
            'preferences': False
        },
        'encryption_bootstrap_token_per_account_migration_done': True,
        'passwords_per_account_pref_migration_done': True,
        'feature_status_for_sync_to_signin': 5
    },
    
    # Google 服务
    'google': {
        'services': {
            'signin_scoped_device_id': '<your-device-id>'  # 生成唯一 ID
        }
    },
    
    # GAIA（Google 帐户基础架构）
    'gaia_cookie': {
        'changed_time': str(int(time.time())),
        'hash': '',
        'last_list_accounts_data': '[]'
    }
}
```

### 优化与性能跟踪

```python
import time
from pydoll.browser.options import ChromiumOptions

options = ChromiumOptions()
options.browser_preferences = {
    # 优化指南（Google 的性能提示）
    'optimization_guide': {
        'hintsfetcher': {
            'hosts_successfully_fetched': {}
        },
        'predictionmodelfetcher': {
            'last_fetch_attempt': str(int(time.time())),
            'last_fetch_success': str(int(time.time()))
        },
        'previously_registered_optimization_types': {}
    },
    
    # 历史群集（分组相关浏览）
    'history_clusters': {
        'all_cache': {
            'all_keywords': {},
            'all_timestamp': str(int(time.time()))
        },
        'last_selected_tab': 0,
        'short_cache': {
            'short_keywords': {},
            'short_timestamp': '0'
        }
    },
    
    # 域多样性指标
    'domain_diversity': {
        'last_reporting_timestamp': str(int(time.time()))
    },
    
    # 分段平台（用户行为分析）
    'segmentation_platform': {
        'device_switcher_util': {
            'result': {
                'labels': ['NotSynced']
            }
        },
        'last_db_compaction_time': str(int(time.time()))
    },
    
    # 零建议（地址栏预测）
    'zerosuggest': {
        'cachedresults': '',
        'cachedresults_with_url': {}
    }
}
```

!!! info "性能跟踪首选项"
    这些首选项通常由 Chrome 用于跟踪和优化性能。对于自动化，您可以将它们留空或设置真实值以使其看起来更像正常浏览器。

### 会话事件与崩溃处理

Chrome 跟踪会话历史以进行恢复和遥测：

```python
import time
from pydoll.browser.options import ChromiumOptions

options = ChromiumOptions()
options.browser_preferences = {
    'sessions': {
        'event_log': [
            {
                'crashed': False,
                'time': str(int(time.time() * 1000000) + 11644473600000000),
                'type': 0                   # 0=会话开始
            },
            {
                'crashed': False,
                'did_schedule_command': True,
                'first_session_service': True,
                'tab_count': 1,
                'time': str(int(time.time() * 1000000) + 11644473600000000),
                'type': 2,                  # 2=会话数据已保存
                'window_count': 1
            }
        ],
        'session_data_status': 3            # 0=未知，1=无数据，2=部分数据，3=完整数据
    },
    
    # 配置文件退出类型（对指纹识别很重要）
    'profile': {
        'exit_type': 'Crashed'              # 'Normal'、'Crashed'、'SessionEnded'
    }
}
```

!!! warning "崩溃与正常"
    大多数真实浏览器**偶尔会崩溃**。始终显示 `'Normal'` 退出是可疑的。
    
    **真实策略**：为约 10-20% 的配置文件设置 `'Crashed'` 以模拟正常用户体验。具有讽刺意味的是，偶尔出现"崩溃"会使您的自动化看起来更像人类。

!!! tip "会话事件类型"
    - **类型 0**：会话开始
    - **类型 1**：会话正常结束
    - **类型 2**：会话数据已保存（标签页、窗口）
    - **类型 3**：会话已恢复
    
    `event_log` 会随着时间的推移建立浏览器会话的历史记录。

## 隐身与指纹识别

创建逼真的浏览器指纹对于避免机器人检测系统至关重要。本节涵盖基本和高级技术。

### 快速隐身设置

对于大多数用例，这种简单的配置提供了良好的反检测：

```python
import asyncio
import time
from pydoll.browser.chromium import Chrome
from pydoll.browser.options import ChromiumOptions

async def quick_stealth():
    options = ChromiumOptions()
    
    # 模拟 60 天前的浏览器
    fake_timestamp = int(time.time()) - (60 * 24 * 60 * 60)
    
    options.browser_preferences = {
        # 虚假使用历史
        'profile': {
            'last_engagement_time': fake_timestamp,
            'exited_cleanly': True,
            'exit_type': 'Normal'
        },
        
        # 真实主页
        'homepage': 'https://www.google.com',
        'session': {
            'restore_on_startup': 1,
            'startup_urls': ['https://www.google.com']
        },
        
        # 启用真实用户拥有的功能
        'enable_do_not_track': False,  # 大多数用户不启用此功能
        'safebrowsing': {'enabled': True},
        'autofill': {'enabled': True},
        'search': {'suggest_enabled': True},
        'dns_prefetching': {'enabled': True}
    }
    
    async with Chrome(options=options) as browser:
        tab = await browser.start()
        await tab.go_to('https://bot-detection-site.com')
        print("隐身模式已激活！")

asyncio.run(quick_stealth())
```

!!! tip "关键隐身原则"
    **启用，而不是禁用**：真实用户启用了安全浏览、自动填充和搜索建议。禁用所有内容看起来可疑。
    
    **老化您的配置文件**：全新安装是一个危险信号。模拟已使用数周或数月的浏览器。
    
    **匹配大多数**：使用 90% 的用户拥有的默认设置，而不是注重隐私的配置。

### 高级指纹识别

为了实现最大的真实性，模拟详细的浏览器使用历史：

```python
import time
from pydoll.browser.chromium import Chrome
from pydoll.browser.options import ChromiumOptions

def create_realistic_browser() -> ChromiumOptions:
    """创建具有全面指纹识别抵抗力的浏览器。"""
    options = ChromiumOptions()
    
    # 时间戳
    current_time = int(time.time())
    install_time = current_time - (90 * 24 * 60 * 60)  # 90 天前
    last_use = current_time - (3 * 60 * 60)            # 3 小时前
    
    options.browser_preferences = {
        # 配置文件元数据（对指纹识别至关重要）
        'profile': {
            'created_by_version': '130.0.6723.91',      # 必须与您的 Chrome 版本匹配
            'creation_time': str(install_time),
            'last_engagement_time': str(last_use),
            'exit_type': 'Crashed',                     # 'Normal'、'Crashed'、'SessionEnded'
            'name': 'Pessoa 1',                         # 真实的配置文件名称
            'avatar_index': 26,                         # 0-26 可用头像
            
            # 真实的内容设置
            'default_content_setting_values': {
                'cookies': 1,
                'images': 1,
                'javascript': 1,
                'popups': 0,
                'notifications': 2,
                'geolocation': 0,           # 询问（不阻止）
                'media_stream': 0           # 询问（真实）
            },
            
            'password_manager_enabled': False,
            'cookie_controls_mode': 0,
            'content_settings': {
                'pref_version': 1,
                'enable_quiet_permission_ui': {
                    'notifications': False
                },
                'enable_quiet_permission_ui_enabling_method': {
                    'notifications': 1
                }
            },
            
            # 安全元数据
            'family_member_role': 'not_in_family',
            'managed_user_id': '',
            'were_old_google_logins_removed': True
        },
        
        # 浏览器使用元数据
        'browser': {
            'has_seen_welcome_page': True,
            'window_placement': {
                'work_area_bottom': 1080,
                'work_area_left': 0,
                'work_area_right': 1920,
                'work_area_top': 0
            }
        },
        
        # 安装元数据
        'countryid_at_install': 16978,              # 因国家而异
        'default_apps_install_state': 3,
        
        # 扩展元数据
        'extensions': {
            'last_chrome_version': '130.0.6723.91',  # 必须与您的版本匹配
            'alerts': {'initialized': True},
            'theme': {'system_theme': 2}
        },
        
        # 会话活动（显示定期使用）
        'in_product_help': {
            'session_start_time': str(current_time),
            'session_last_active_time': str(current_time),
            'recent_session_start_times': [
                str(current_time - (24 * 60 * 60)),
                str(current_time - (48 * 60 * 60)),
                str(current_time - (72 * 60 * 60))
            ]
        },
        
        # 会话恢复
        'session': {
            'restore_on_startup': 1,
            'startup_urls': ['https://www.google.com']
        },
        
        # 主页
        'homepage': 'https://www.google.com',
        'homepage_is_newtabpage': False,
        
        # 翻译历史（显示多语言使用）
        'translate': {'enabled': True},
        'translate_accepted_count': {'es': 2, 'fr': 1},
        'translate_denied_count_for_language': {'en': 1},
        
        # 拼写检查
        'spellcheck': {
            'dictionaries': ['en-US', 'pt-BR'],
            'dictionary': ''
        },
        
        # 语言
        'intl': {
            'selected_languages': 'en-US,en,pt-BR'
        },
        
        # 登录元数据
        'signin': {
            'allowed': True,
            'cookie_clear_on_exit_migration_notice_complete': True
        },
        
        # 安全浏览（大多数用户拥有此功能）
        'safebrowsing': {
            'enabled': True,
            'enhanced': False
        },
        
        # 自动填充（真实用户常见）
        'autofill': {
            'enabled': True,
            'profile_enabled': True
        },
        
        # 搜索建议
        'search': {'suggest_enabled': True},
        
        # DNS 预取
        'dns_prefetching': {'enabled': True},
        
        # 请勿跟踪（通常关闭）
        'enable_do_not_track': False,
        
        # WebRTC（默认设置）
        'webrtc': {
            'ip_handling_policy': 'default',
            'multiple_routes_enabled': True
        },
        
        # 隐私沙盒（Google 的 cookie 替代品 - 真实用户拥有此功能）
        'privacy_sandbox': {
            'first_party_sets_data_access_allowed_initialized': True,
            'm1': {
                'ad_measurement_enabled': True,
                'fledge_enabled': True,
                'row_notice_acknowledged': True,
                'topics_enabled': True
            }
        },
        
        # 媒体参与度
        'media': {
            'engagement': {'schema_version': 5}
        },
        
        # Web 应用
        'web_apps': {
            'did_migrate_default_chrome_apps': ['app-id'],
            'last_preinstall_synchronize_version': '130'
        }
    }
    
    return options

# 使用
async def advanced_stealth():
    options = create_realistic_browser()
    
    async with Chrome(options=options) as browser:
        tab = await browser.start()
        await tab.go_to('https://advanced-bot-detection.com')
        # 浏览器显示为 90 天前的真实安装
```

!!! warning "版本一致性至关重要"
    **始终匹配 Chrome 版本**：确保 `profile.created_by_version` 和 `extensions.last_chrome_version` 与您的实际 Chrome 版本匹配。版本不匹配会立刻成为危险信号。
    
    ```python
    # 以编程方式获取您的 Chrome 版本：
    async with Chrome() as browser:
        tab = await browser.start()
        version = await browser.get_version()
        chrome_version = version['product'].split('/')[1]  # 例如 '130.0.6723.91'
        print(f"使用此版本：{chrome_version}")
    ```

!!! info "指纹识别首选项的作用"
    **配置文件年龄**：`creation_time` 和 `last_engagement_time` 证明浏览器不是全新安装。
    
    **使用历史**：`recent_session_start_times` 显示定期浏览模式。
    
    **翻译历史**：`translate_accepted_count` 表明真实的人使用多种语言。
    
    **窗口放置**：与实际显示器分辨率匹配的真实屏幕尺寸。
    
    **隐私沙盒**：Google 的新跟踪系统。禁用它既不寻常又可疑。

## 性能影响

了解浏览器首选项的性能影响可以帮助您针对特定用例进行优化：

| 首选项类别 | 预期影响 | 用例 |
|---------------------|----------------|----------|
| 禁用图像 | 加载速度提高 50-70% | 抓取文本内容 |
| 禁用预取 | 加载速度提高 10-20% | 减少带宽使用 |
| 禁用插件 | 加载速度提高 5-10% | 安全性和性能 |
| 阻止通知 | 消除弹出窗口 | 干净的自动化 |
| 静默下载 | 消除提示 | 自动化文件下载 |

!!! tip "速度与隐身的权衡"
    **追求速度**：禁用图像、预取、插件和拼写检查。
    
    **追求隐身**：启用安全浏览、自动填充、搜索建议和 DNS 预取（即使它们会减慢速度）。
    
    **平衡方法**：启用隐身功能但禁用图像和插件。这可以提供 40-50% 的加速，同时保持真实的指纹。

## 另请参阅

- **[深入探讨：浏览器首选项](../../deep-dive/browser-preferences.md)** - 架构细节和内部原理
- **[页面加载状态](page-load-state.md)** - 控制何时认为页面已加载
- **[代理配置](proxy.md)** - 配置网络代理
- **[Cookie 与会话](../browser-management/cookies-sessions.md)** - 管理浏览器状态
- **[Chromium 源代码：pref_names.cc](https://chromium.googlesource.com/chromium/src/+/main/chrome/common/pref_names.cc)** - 官方首选项常量
- **[Chromium 源代码：pref_names.h](https://github.com/chromium/chromium/blob/main/chrome/common/pref_names.h)** - 带有定义的头文件

自定义浏览器首选项为您提供了对浏览器行为的前所未有的控制，使复杂的自动化、性能优化和隐私配置成为可能，而这些在传统自动化工具中是根本不可能实现的。这种访问级别将 Pydoll 从一个简单的自动化库转变为一个完整的浏览器控制系统。


================================================
FILE: docs/zh/features/configuration/proxy.md
================================================
# 代理配置

代理对于专业的 Web 自动化至关重要，它可以帮助你绕过速率限制、访问地理限制内容并保持匿名性。Pydoll 提供原生代理支持，并具有自动身份验证处理功能。

!!! info "相关文档"
    - **[浏览器选项](browser-options.md)** - 命令行代理参数
    - **[请求拦截](../network/interception.md)** - 代理身份验证的内部工作原理
    - **[隐蔽自动化](../automation/human-interactions.md)** - 将代理与反检测结合使用
    - **[代理架构深入解析](../../deep-dive/proxy-architecture.md)** - 网络基础知识、协议、安全性和构建自己的代理

## 为什么使用代理？

代理为自动化提供了关键功能：

| 优势 | 描述 | 用例 |
|------|------|------|
| **IP 轮换** | 在多个 IP 之间分配请求 | 避免速率限制，大规模抓取 |
| **地理访问** | 访问区域锁定内容 | 测试地理定向功能，绕过限制 |
| **匿名性** | 隐藏真实 IP 地址 | 注重隐私的自动化，竞争对手分析 |
| **负载分配** | 将流量分散到多个端点 | 大容量抓取，压力测试 |
| **避免封禁** | 防止永久 IP 封禁 | 长期运行的自动化，激进抓取 |

!!! tip "何时使用代理"
    **始终使用代理：**
    
    - 生产环境 Web 抓取（>100 请求/小时）
    - 访问地理限制内容
    - 绕过速率限制或基于 IP 的封锁
    - 从不同地区进行测试
    - 保持匿名性
    
    **可以跳过代理：**
    
    - 本地开发和测试
    - 内部/企业自动化
    - 低容量自动化（<50 请求/天）
    - 抓取自己的基础设施时

## 代理类型

不同的代理协议适用于不同的目的：

| 类型 | 端口 | 身份验证 | 速度 | 安全性 | 用例 |
|------|------|---------|------|--------|------|
| **HTTP** | 80, 8080 | 可选 | 快速 | 低 | 基本 Web 抓取，非敏感数据 |
| **HTTPS** | 443, 8443 | 可选 | 快速 | 中等 | 安全 Web 抓取，加密流量 |
| **SOCKS5** | 1080, 1081 | 可选 | 中等 | 高 | 完整 TCP/UDP 支持，高级用例 |

### HTTP/HTTPS 代理

标准 Web 代理，适用于大多数自动化任务：

```python
import asyncio
from pydoll.browser.chromium import Chrome
from pydoll.browser.options import ChromiumOptions

async def http_proxy_example():
    options = ChromiumOptions()
    
    # HTTP proxy (unencrypted)
    options.add_argument('--proxy-server=http://proxy.example.com:8080')
    
    # Or HTTPS proxy (encrypted)
    # options.add_argument('--proxy-server=https://proxy.example.com:8443')
    
    async with Chrome(options=options) as browser:
        tab = await browser.start()
        
        # All traffic goes through proxy
        await tab.go_to('https://httpbin.org/ip')
        
        # Verify proxy IP
        ip = await tab.execute_script('return document.body.textContent')
        print(f"Current IP: {ip}")

asyncio.run(http_proxy_example())
```

**优点：**

- 快速高效
- 在各种服务中广泛支持
- 易于配置

**缺点：**

- HTTP：无加密（流量对代理可见）
- 比 SOCKS5 更容易被检测

### SOCKS5 代理

支持完整 TCP/UDP 的高级代理：

```python
import asyncio
from pydoll.browser.chromium import Chrome
from pydoll.browser.options import ChromiumOptions

async def socks5_proxy_example():
    options = ChromiumOptions()
    
    # SOCKS5 proxy
    options.add_argument('--proxy-server=socks5://proxy.example.com:1080')
    
    async with Chrome(options=options) as browser:
        tab = await browser.start()
        await tab.go_to('https://httpbin.org/ip')

asyncio.run(socks5_proxy_example())
```

**优点：**

- 协议无关（适用于任何 TCP/UDP 流量）
- 更适合高级用例（WebSockets、WebRTC）
- 更隐蔽（更难检测）

**缺点：**

- 比 HTTP/HTTPS 稍慢
- 在免费/廉价代理服务中不太常见

!!! info "SOCKS4 vs SOCKS5"
    推荐使用 **SOCKS5** 而不是 SOCKS4，因为它：
    
    - 支持身份验证（用户名/密码）
    - 处理 UDP 流量（用于 WebRTC、DNS 等）
    - 提供更好的错误处理
    
    除非你特别需要 SOCKS4（`socks4://`），否则使用 `socks5://`。

## 身份验证代理

Pydoll 自动处理代理身份验证，无需手动干预。

### 身份验证工作原理

当你在代理 URL 中提供凭据时，Pydoll 会：

1. 使用 Fetch 域**拦截身份验证挑战**
2. 使用你提供的凭据**自动响应**
3. 无缝地**继续导航**

这一切都是透明的，你无需手动处理身份验证！

```python
import asyncio
from pydoll.browser.chromium import Chrome
from pydoll.browser.options import ChromiumOptions

async def authenticated_proxy_example():
    options = ChromiumOptions()
    
    # Proxy with authentication (username:password)
    options.add_argument('--proxy-server=http://user:pass@proxy.example.com:8080')
    
    async with Chrome(options=options) as browser:
        tab = await browser.start()
        
        # Authentication handled automatically!
        await tab.go_to('https://example.com')
        print("Connected through authenticated proxy")

asyncio.run(authenticated_proxy_example())
```

!!! tip "凭据格式"
    直接在代理 URL 中包含凭据：

    - HTTP: `http://username:password@host:port`
    - HTTPS: `https://username:password@host:port`
    - SOCKS5: `socks5://username:password@host:port`（注意：Chrome 会忽略 SOCKS5 凭据，请参阅下方的"SOCKS5 身份验证限制"警告）

    Pydoll 会自动提取并使用这些凭据。

!!! warning "SOCKS5 身份验证限制"
    **Chrome 不原生支持 SOCKS5 身份验证**（[Chromium Issue #40323993](https://issues.chromium.org/issues/40323993)）。嵌入在 `socks5://user:pass@host:port` 中的凭据会被静默忽略 — Chrome 只会向 SOCKS5 代理发送"无需身份验证"的问候。

    这意味着 Pydoll 的自动代理身份验证（通过 `Fetch.authRequired`）**对 SOCKS5 不起作用**，因为 Chrome 从不会为 SOCKS5 连接发出 HTTP 407 质询。

    **解决方案 — 本地代理转发器：**

    运行一个本地 SOCKS5 代理（无需身份验证），将流量转发到远程的身份验证代理。Pydoll 提供了一个开箱即用的转发器：

    ```python
    import asyncio
    from pydoll.utils import SOCKS5Forwarder
    from pydoll.browser.chromium import Chrome
    from pydoll.browser.options import ChromiumOptions

    async def main():
        forwarder = SOCKS5Forwarder(
            remote_host='proxy.example.com',
            remote_port=1080,
            username='myuser',
            password='mypass',
            local_port=1081,
        )
        async with forwarder:
            options = ChromiumOptions()
            options.add_argument('--proxy-server=socks5://127.0.0.1:1081')

            async with Chrome(options=options) as browser:
                tab = await browser.start()
                await tab.go_to('https://httpbin.org/ip')

    asyncio.run(main())
    ```

    转发器负责与远程代理进行用户名/密码握手，而 Chrome 无需身份验证即可连接到本地主机。

    有关此问题的完整技术解释，请参阅 **[SOCKS5 身份验证深入解析](../../deep-dive/network/socks-proxies.md#socks5-身份验证与-chrome)**。

### 身份验证实现细节

Pydoll 在浏览器级别使用 Chrome 的 **Fetch 域** 来拦截和处理身份验证挑战：

```python
# 这是 Pydoll 内部处理的
# 你不需要编写这段代码！

async def _handle_proxy_auth(event):
    """Pydoll 的内部代理身份验证处理器。"""
    if event['params']['authChallenge']['source'] == 'Proxy':
        await browser.continue_request_with_auth(
            request_id=event['params']['requestId'],
            username='user',
            password='pass'
        )
```

!!! info "底层原理"
    有关 Pydoll 如何拦截和处理代理身份验证的技术细节，请参阅：
    
    - **[请求拦截](../network/interception.md)** - Fetch 域和请求处理
    - **[事件系统](../advanced/event-system.md)** - 事件驱动的身份验证

!!! warning "Fetch 域冲突"
    当使用**身份验证代理** + **标签页级别请求拦截**时，请注意：
    
    - Pydoll 在**浏览器级别**启用 Fetch 以进行代理身份验证
    - 如果在**标签页级别**启用 Fetch，它们共享同一个域
    - **解决方案**：在启用标签页级别拦截之前调用一次 `tab.go_to()`
    
    ```python
    async with Chrome(options=options) as browser:
        tab = await browser.start()
        
        # 1. 首次导航触发代理身份验证（浏览器级别 Fetch）
        await tab.go_to('https://example.com')
        
        # 2. 然后安全地启用标签页级别拦截
        await tab.enable_fetch_events()
        await tab.on('Fetch.requestPaused', my_interceptor)
        
        # 3. 继续自动化
        await tab.go_to('https://example.com/page2')
    ```
    
    详细信息请参阅 [请求拦截 - 代理 + 拦截](../network/interception.md#private-proxy-request-interception-fetch)。

## 代理绕过列表

从使用代理中排除特定域：

```python
import asyncio
from pydoll.browser.chromium import Chrome
from pydoll.browser.options import ChromiumOptions

async def proxy_bypass_example():
    options = ChromiumOptions()
    
    # Use proxy for most traffic
    options.add_argument('--proxy-server=http://proxy.example.com:8080')
    
    # But bypass proxy for these domains
    options.add_argument('--proxy-bypass-list=localhost,127.0.0.1,*.local,internal.company.com')
    
    async with Chrome(options=options) as browser:
        tab = await browser.start()
        
        # Uses proxy
        await tab.go_to('https://external-site.com')
        
        # Bypasses proxy (direct connection)
        await tab.go_to('http://localhost:8000')
        await tab.go_to('http://internal.company.com')

asyncio.run(proxy_bypass_example())
```

**绕过列表模式：**

| 模式 | 匹配 | 示例 |
|------|------|------|
| `localhost` | 仅本地主机 | `http://localhost` |
| `127.0.0.1` | 回环 IP | `http://127.0.0.1` |
| `*.local` | 所有 `.local` 域 | `http://server.local` |
| `internal.company.com` | 特定域 | `http://internal.company.com` |
| `192.168.1.*` | IP 范围 | `http://192.168.1.100` |

!!! tip "何时使用绕过列表"
    为以下情况绕过代理：
    
    - **本地开发服务器**（`localhost`、`127.0.0.1`）
    - **公司内部资源**（VPN、内网）
    - **测试环境**（`.local`、`.test` 域）
    - **高带宽资源**（当代理较慢时）

## PAC（代理自动配置）

使用 PAC 文件实现复杂的代理路由规则：

```python
import asyncio
from pydoll.browser.chromium import Chrome
from pydoll.browser.options import ChromiumOptions

async def pac_proxy_example():
    options = ChromiumOptions()
    
    # Load PAC file from URL
    options.add_argument('--proxy-pac-url=http://proxy.example.com/proxy.pac')
    
    # Or use local PAC file
    # options.add_argument('--proxy-pac-url=file:///path/to/proxy.pac')
    
    async with Chrome(options=options) as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com')

asyncio.run(pac_proxy_example())
```

**PAC 文件示例：**

```javascript
function FindProxyForURL(url, host) {
    // Direct connection for local addresses
    if (isInNet(host, "192.168.0.0", "255.255.0.0") ||
        isInNet(host, "127.0.0.0", "255.0.0.0")) {
        return "DIRECT";
    }
    
    // Use specific proxy for certain domains
    if (dnsDomainIs(host, ".example.com")) {
        return "PROXY proxy1.example.com:8080";
    }
    
    // Default proxy for everything else
    return "PROXY proxy2.example.com:8080";
}
```

!!! info "PAC 文件用例"
    PAC 文件适用于：
    
    - **复杂路由规则**（基于域名、基于 IP）
    - **代理故障转移**（尝试多个代理）
    - **负载均衡**（在代理池中分配）
    - **企业环境**（集中式代理管理）

## 轮换代理

轮换使用多个代理以实现更好的分配：

```python
import asyncio
from itertools import cycle
from pydoll.browser.chromium import Chrome
from pydoll.browser.options import ChromiumOptions

async def rotating_proxy_example():
    # List of proxies
    proxies = [
        'http://user:pass@proxy1.example.com:8080',
        'http://user:pass@proxy2.example.com:8080',
        'http://user:pass@proxy3.example.com:8080',
    ]
    
    # Cycle through proxies
    proxy_pool = cycle(proxies)
    
    # Scrape multiple URLs with different proxies
    urls = [
        'https://example.com/page1',
        'https://example.com/page2',
        'https://example.com/page3',
    ]
    
    for url in urls:
        # Get next proxy
        proxy = next(proxy_pool)
        
        # Configure options with this proxy
        options = ChromiumOptions()
        options.add_argument(f'--proxy-server={proxy}')
        
        # Use proxy for this browser instance
        async with Chrome(options=options) as browser:
            tab = await browser.start()
            await tab.go_to(url)
            
            title = await tab.execute_script('return document.title')
            print(f"[{proxy.split('@')[1]}] {url}: {title}")

asyncio.run(rotating_proxy_example())
```

!!! tip "代理轮换策略"
    **每个浏览器轮换**（如上）：

    - 每个浏览器实例使用不同的代理
    - 最适合隔离和避免会话冲突
    
    **每个请求轮换**：

    - 更复杂，需要请求拦截
    - 实现方式请参阅 [请求拦截](../network/interception.md)

## 住宅代理 vs 数据中心代理

理解代理类型有助于你选择正确的服务：

| 特性 | 住宅代理 | 数据中心代理 |
|------|---------|-------------|
| **IP 来源** | 真实住宅 ISP | 数据中心 |
| **合法性** | 高（真实用户） | 低（已知范围） |
| **检测风险** | 非常低 | 高 |
| **速度** | 中等（150-500ms） | 非常快（<50ms） |
| **成本** | 昂贵（$5-15/GB） | 便宜（$0.10-1/GB） |
| **最适合** | 反机器人网站、电商 | API、内部工具 |

### 住宅代理

```python
import asyncio
from pydoll.browser.chromium import Chrome
from pydoll.browser.options import ChromiumOptions

async def residential_proxy_example():
    """Use residential proxy for anti-bot sites."""
    options = ChromiumOptions()
    
    # Residential proxy with high trust score
    options.add_argument('--proxy-server=http://user:pass@residential.proxy.com:8080')
    
    # Combine with stealth options
    options.add_argument('--disable-blink-features=AutomationControlled')
    options.add_argument('--user-agent=Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/130.0.0.0 Safari/537.36')
    
    async with Chrome(options=options) as browser:
        tab = await browser.start()
        
        # Access protected site
        await tab.go_to('https://protected-site.com')
        print("Successfully accessed through residential proxy")

asyncio.run(residential_proxy_example())
```

**何时使用住宅代理：**

- 具有强大反机器人保护的网站（Cloudflare、DataDome）
- 电商抓取（Amazon、eBay 等）
- 社交媒体自动化
- 金融服务
- 任何主动封锁数据中心 IP 的网站

### 数据中心代理

```python
import asyncio
from pydoll.browser.chromium import Chrome
from pydoll.browser.options import ChromiumOptions

async def datacenter_proxy_example():
    """Use fast datacenter proxy for APIs and unprotected sites."""
    options = ChromiumOptions()
    
    # Fast datacenter proxy
    options.add_argument('--proxy-server=http://user:pass@datacenter.proxy.com:8080')
    
    async with Chrome(options=options) as browser:
        tab = await browser.start()
        
        # Fast API scraping
        await tab.go_to('https://api.example.com/data')

asyncio.run(datacenter_proxy_example())
```

**何时使用数据中心代理：**

- 无速率限制的公共 API
- 内部/企业自动化
- 没有反机器人措施的网站
- 大容量、速度关键的抓取
- 开发和测试

!!! warning "代理质量很重要"
    **劣质代理**带来的问题比解决的问题更多：
    
    - 响应时间慢（超时）
    - 连接失败（错误率高）
    - IP 被列入黑名单（立即封禁）
    - 真实 IP 泄露（隐私泄露）
    
    **投资高质量代理**，选择信誉良好的提供商。免费代理几乎从不值得使用。

## 测试你的代理

在运行生产环境自动化之前验证代理配置：

```python
import asyncio
from pydoll.browser.chromium import Chrome
from pydoll.browser.options import ChromiumOptions

async def test_proxy():
    """Test proxy connection and configuration."""
    proxy_url = 'http://user:pass@proxy.example.com:8080'
    
    options = ChromiumOptions()
    options.add_argument(f'--proxy-server={proxy_url}')
    
    try:
        async with Chrome(options=options) as browser:
            tab = await browser.start()
            
            # Test 1: Connection
            print("Testing proxy connection...")
            await tab.go_to('https://httpbin.org/ip', timeout=10)
            
            # Test 2: IP verification
            print("Verifying proxy IP...")
            ip_response = await tab.execute_script('return document.body.textContent')
            print(f"[OK] Proxy IP: {ip_response}")
            
            # Test 3: Geographic location (if available)
            await tab.go_to('https://ipapi.co/json/')
            geo_data = await tab.execute_script('return document.body.textContent')
            print(f"[OK] Geographic data: {geo_data}")
            
            # Test 4: Speed test
            import time
            start = time.time()
            await tab.go_to('https://example.com')
            load_time = time.time() - start
            print(f"[OK] Load time: {load_time:.2f}s")
            
            if load_time > 5:
                print("[WARNING] Slow proxy response time")
            
            print("\n[SUCCESS] All proxy tests passed!")
            
    except asyncio.TimeoutError:
        print("[ERROR] Proxy connection timeout")
    except Exception as e:
        print(f"[ERROR] Proxy test failed: {e}")

asyncio.run(test_proxy())
```

## 延伸阅读

- **[代理架构深入解析](../../deep-dive/proxy-architecture.md)** - 网络基础知识、TCP/UDP、HTTP/2/3、SOCKS5 内部原理、安全分析以及构建自己的代理服务器
- **[浏览器选项](browser-options.md)** - 命令行参数和配置
- **[请求拦截](../network/interception.md)** - 代理身份验证工作原理
- **[浏览器首选项](browser-preferences.md)** - 隐蔽性和指纹识别
- **[上下文](../browser-management/contexts.md)** - 每个上下文使用不同的代理

!!! tip "从简单开始"
    从简单的代理设置开始，彻底测试，然后根据需要添加复杂性（轮换、重试逻辑、监控）。高质量的代理比复杂的轮换策略更重要。
    
    对于那些有兴趣深入了解代理的人，**[代理架构深入解析](../../deep-dive/proxy-architecture.md)** 提供了网络协议、安全注意事项的全面介绍，甚至指导你构建自己的代理服务器。


================================================
FILE: docs/zh/features/core-concepts.md
================================================
# 核心概念

理解是什么使 Pydoll 与众不同，要从其基础设计决策开始。这些不仅仅是技术选择，它们直接影响您如何编写自动化脚本、可以解决什么问题，以及解决方案的可靠性。

## 零 WebDriver

Pydoll 最显著的优势之一是完全消除了 WebDriver 依赖。如果您曾经遇到过"chromedriver 版本与 Chrome 版本不匹配"错误，或处理过神秘的驱动程序崩溃，您会欣赏这种方法。

### 工作原理

像 Selenium 这样的传统浏览器自动化工具依赖于 WebDriver 可执行文件，它充当代码和浏览器之间的中介。Pydoll 采用不同的路径，通过 Chrome DevTools Protocol (CDP) 直接连接到浏览器。

```mermaid
graph LR
    %% Pydoll 流程
    subgraph P["Pydoll 流程"]
        direction LR
        P1["💻 您的代码"] --> P2["🪄 Pydoll"]
        P2 --> P3["🌐 浏览器 (通过 CDP)"]
    end

    %% 传统 Selenium 流程
    subgraph S["传统 Selenium 流程"]
        direction LR
        S1["💻 您的代码"] --> S2["🔌 WebDriver 客户端"]
        S2 --> S3["⚙️ WebDriver 可执行文件"]
        S3 --> S4["🌐 浏览器"]
    end

```

当您使用 Pydoll 启动浏览器时，底层发生的事情如下：

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def main():
    # 这会创建一个 Browser 实例
    browser = Chrome()
    
    # start() 使用 --remote-debugging-port 启动 Chrome
    # 并建立到 CDP 端点的 WebSocket 连接
    tab = await browser.start()
    
    # 现在您可以通过 CDP 命令控制浏览器
    await tab.go_to('https://example.com')
    
    await browser.stop()

asyncio.run(main())
```

在幕后，`browser.start()` 执行以下操作：

1. **使用** `--remote-debugging-port=<port>` 标志**启动浏览器进程**
2. **等待 CDP 服务器**在该端口上可用
3. **建立 WebSocket 连接**到 `ws://localhost:<port>/devtools/...`
4. **返回准备好自动化的 Tab 实例**

!!! info "想了解更多？"
    有关浏览器进程如何在内部管理的技术细节，请参阅[浏览器域](../../deep-dive/browser-domain.md#browser-process-manager)深入探讨。

### 您会注意到的好处

**没有版本管理的烦恼**
```python
# 使用 Selenium，您可能会看到：
# SessionNotCreatedException: This version of ChromeDriver only supports Chrome version 120

# 使用 Pydoll，您只需要安装 Chrome：
async with Chrome() as browser:
    tab = await browser.start()  # 适用于任何 Chrome 版本
```

**更简单的设置**
```bash
# Selenium 设置：
$ pip install selenium
$ brew install chromedriver  # 或下载、chmod +x、添加到 PATH...
$ chromedriver --version     # 它与您的 Chrome 匹配吗？

# Pydoll 设置：
$ pip install pydoll-python  # 就这样！
```

**更可靠**

没有 WebDriver 作为中间层，失败点更少。您的代码通过 Chromium 开发人员自己使用和维护的定义良好的协议直接与浏览器通信。

### CDP：魔法背后的协议

Chrome DevTools Protocol 并非 Pydoll 专属；当您打开检查器时，驱动 Chrome DevTools 的正是同一个协议。这意味着：

- **经过实战检验的可靠性**：每天被数百万开发人员使用
- **丰富的功能**：DevTools 能做的一切，Pydoll 都能做
- **积极开发**：Google 持续维护和发展 CDP

!!! tip "深入探讨：理解 CDP"
    要全面了解 CDP 的工作原理以及为什么它优于 WebDriver，请参阅我们的 [Chrome DevTools Protocol](../../deep-dive/cdp.md) 深入探讨。

## 异步优先架构

Pydoll 不仅仅是异步兼容；它从头开始设计以利用 Python 的 `asyncio` 框架。这不是一个用来凑数的功能；它是 Pydoll 实现高性能的基础。

!!! info "异步编程新手？"
    如果您不熟悉 Python 的 `async`/`await` 语法或 asyncio 概念，我们强烈建议首先阅读我们的[理解 Async/Await](../../deep-dive/connection-layer.md#understanding-asyncawait) 指南。它用实际示例解释了基础知识，将帮助您理解 Pydoll 的异步架构如何工作以及为什么它对浏览器自动化如此强大。

### 为什么异步对浏览器自动化很重要

浏览器自动化涉及大量等待：页面加载、元素出现、网络请求完成。传统的同步工具在这些等待期间浪费 CPU 时间。异步架构让您在等待时做有用的工作。

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def scrape_page(browser, url):
    """抓取单个页面。"""
    tab = await browser.new_tab()
    await tab.go_to(url)
    title = await tab.execute_script('return document.title')
    await tab.close()
    return title

async def main():
    urls = [
        'https://example.com/page1',
        'https://example.com/page2',
        'https://example.com/page3',
    ]
    
    async with Chrome() as browser:
        await browser.start()
        
        # 并发处理所有 URL！
        titles = await asyncio.gather(
            *(scrape_page(browser, url) for url in urls)
        )
        
        print(titles)

asyncio.run(main())
```

在这个例子中，不是一个接一个地抓取页面（可能需要 3 × 2 秒 = 6 秒），而是并发抓取所有三个页面，总共大约需要 2 秒。

### 真正的并发与线程

与基于线程的方法不同，Pydoll 的异步架构提供真正的并发执行，而无需线程管理的复杂性：

```mermaid
sequenceDiagram
    participant Main as 主任务
    participant Tab1 as 标签页 1
    participant Tab2 as 标签页 2
    participant Tab3 as 标签页 3
    
    Main->>Tab1: go_to(url1)
    Main->>Tab2: go_to(url2)
    Main->>Tab3: go_to(url3)
    
    Note over Tab1,Tab3: 所有标签页并发导航
    
    Tab1-->>Main: 页面 1 已加载
    Tab2-->>Main: 页面 2 已加载
    Tab3-->>Main: 页面 3 已加载
    
    Main->>Main: 处理结果
```

### 现代 Python 模式

Pydoll 在整个过程中采用现代 Python 习语：

**上下文管理器**
```python
# 自动资源清理
async with Chrome() as browser:
    tab = await browser.start()
    # ... 执行工作 ...
# 退出上下文时浏览器自动停止
```

**操作的异步上下文管理器**
```python
# 等待和处理下载
async with tab.expect_download(keep_file_at='/downloads') as dl:
    await (await tab.find(text='Download PDF')).click()
    pdf_data = await dl.read_bytes()
```

!!! tip "深入探讨"
    想了解异步操作在底层如何工作？查看[连接层](../../deep-dive/connection-layer.md)深入探讨以获取实现细节。

### 性能影响

异步优先设计提供了可衡量的性能改进：

```python
import asyncio
import time
from pydoll.browser.chromium import Chrome

async def benchmark_concurrent():
    """并发抓取 10 个页面。"""
    async with Chrome() as browser:
        await browser.start()
        
        start = time.time()
        tasks = [
            browser.new_tab(f'https://example.com/page{i}')
            for i in range(10)
        ]
        await asyncio.gather(*tasks)
        elapsed = time.time() - start
        
        print(f"10 个页面在 {elapsed:.2f}s 内加载完成")
        # 典型结果：约 2-3 秒，而不是顺序执行的 20+ 秒

asyncio.run(benchmark_concurrent())
```

## 多浏览器支持

Pydoll 为所有基于 Chromium 的浏览器提供统一的 API。编写一次自动化，随处运行。

### 支持的浏览器

**Google Chrome**：主要目标，具有完整的功能支持。
```python
from pydoll.browser.chromium import Chrome

async with Chrome() as browser:
    tab = await browser.start()
```

**Microsoft Edge**：完全支持，包括 Edge 特定功能。
```python
from pydoll.browser.chromium import Edge

async with Edge() as browser:
    tab = await browser.start()
```

**其他 Chromium 浏览器**：Brave、Vivaldi、Opera 等。
```python
from pydoll.browser.chromium import Chrome
from pydoll.browser.options import ChromiumOptions

options = ChromiumOptions()
options.binary_location = '/path/to/brave-browser'  # 或任何 Chromium 浏览器

async with Chrome(options=options) as browser:
    tab = await browser.start()
```

关键好处：所有基于 Chromium 的浏览器共享相同的 API。编写一次自动化，它就可以在 Chrome、Edge、Brave 或任何其他 Chromium 浏览器上运行，无需更改代码。

### 跨浏览器测试

在多个浏览器中测试您的自动化而无需更改代码：

```python
import asyncio
from pydoll.browser.chromium import Chrome, Edge

async def test_login(browser_class, browser_name):
    """在特定浏览器中测试登录流程。"""
    async with browser_class() as browser:
        tab = await browser.start()
        await tab.go_to('https://app.example.com/login')
        
        await (await tab.find(id='username')).type_text('user@example.com')
        await (await tab.find(id='password')).type_text('password123')
        await (await tab.find(id='login-btn')).click()
        
        # 验证登录成功
        success = await tab.find(id='dashboard', raise_exc=False)
        print(f"{browser_name} 登录: {'✓' if success else '✗'}")

async def main():
    # 在 Chrome 和 Edge 中测试
    await test_login(Chrome, "Chrome")
    await test_login(Edge, "Edge")

asyncio.run(main())
```

## 类人行为

自动化浏览器通常可被检测到，因为它们的行为很机械。Pydoll 包含内置功能，使交互看起来更像人类。

### 自然打字

真实用户不会以完全一致的速度打字。Pydoll 的 `type_text()` 方法包括按键之间的随机延迟：

```python
# 以类人的时间打字
username_field = await tab.find(id='username')
await username_field.type_text(
    'user@example.com',
    interval=0.1  # 按键之间平均 100ms，带有随机化
)

# 更快的打字（仍然类人）
await username_field.type_text(
    'user@example.com',
    interval=0.05  # 更快但仍然有变化
)

# 即时（机械；仅在速度比隐蔽性更重要时使用）
await username_field.type_text(
    'user@example.com',
    interval=0
)
```

`interval` 参数设置平均延迟，但 Pydoll 添加随机变化以使时间更自然。

### 真实的点击

点击不仅仅是"触发即忘"。Pydoll 自动分发真实用户会触发的所有鼠标事件：

```python
button = await tab.find(id='submit-button')

# 默认行为：点击元素中心
# 自动触发：mouseover, mouseenter, mousemove, mousedown, mouseup, click
await button.click()

# 带偏移点击（用于避免在较大元素上被检测）
await button.click(offset_x=10, offset_y=5)
```

!!! info "鼠标事件"
    Pydoll 按正确顺序分发完整的鼠标事件序列，模拟真实浏览器如何处理用户点击。这使得点击比简单的 JavaScript `.click()` 调用更真实。

!!! warning "检测注意事项"
    虽然类人行为有助于避免基本的机器人检测，但复杂的反自动化系统使用许多信号。将这些功能与以下内容结合使用：
    
    - 真实的浏览器指纹（通过浏览器首选项）
    - 适当的代理配置
    - 操作之间的合理延迟
    - 变化的导航模式

## 事件驱动设计

与传统的基于轮询的自动化不同，Pydoll 允许您在浏览器事件发生时做出反应。这更高效，并且可以实现复杂的交互模式。

### 实时事件监控

订阅浏览器事件并在它们触发时执行回调：

```python
import asyncio
from functools import partial
from pydoll.browser.chromium import Chrome
from pydoll.protocol.page.events import PageEvent
from pydoll.protocol.network.events import NetworkEvent

async def main():
    async with Chrome() as browser:
        tab = await browser.start()
        
        # 响应页面加载事件
        async def on_page_load(event):
            print(f"页面已加载: {await tab.current_url}")
        
        await tab.enable_page_events()
        await tab.on(PageEvent.LOAD_EVENT_FIRED, on_page_load)
        
        # 监控网络请求
        async def on_request(tab, event):
            url = event['params']['request']['url']
            if '/api/' in url:
                print(f"API 调用: {url}")
        
        await tab.enable_network_events()
        await tab.on(NetworkEvent.REQUEST_WILL_BE_SENT, partial(on_request, tab))
        
        # 导航并观察事件触发
        await tab.go_to('https://example.com')
        await asyncio.sleep(3)  # 让事件处理

asyncio.run(main())
```

### 事件类别

Pydoll 公开了几个您可以订阅的 CDP 事件域：

| 域 | 示例事件 |
|--------|----------------|
| **页面事件** | 加载完成、导航、JavaScript 对话框 |
| **网络事件** | 请求发送、响应接收、WebSocket 活动 |
| **DOM 事件** | DOM 更改、属性修改 |
| **Fetch 事件** | 请求暂停、需要身份验证 |
| **运行时事件** | 控制台消息、异常 |

### 实用的事件驱动模式

**捕获 API 响应**
```python
import json
from functools import partial
from pydoll.protocol.network.events import NetworkEvent

api_data = []

async def capture_api(tab, event):
    url = event['params']['response']['url']
    if '/api/data' in url:
        request_id = event['params']['requestId']
        body = await tab.get_network_response_body(request_id)
        api_data.append(json.loads(body))

await tab.enable_network_events()
await tab.on(NetworkEvent.RESPONSE_RECEIVED, partial(capture_api, tab))

# 导航并自动捕获 API 响应
await tab.go_to('https://app.example.com')
await asyncio.sleep(2)

print(f"捕获了 {len(api_data)} 个 API 响应")
```

**等待特定条件**
```python
import asyncio
from functools import partial
from pydoll.protocol.network.events import NetworkEvent

async def wait_for_api_call(tab, endpoint):
    """等待调用特定的 API 端点。"""
    event_occurred = asyncio.Event()
    
    async def check_endpoint(tab, event):
        url = event['params']['request']['url']
        if endpoint in url:
            event_occurred.set()
    
    await tab.enable_network_events()
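    # 注意：这里不要使用 temporary=True。临时回调会在第一次触发后被移除
    # （无论 URL 是否匹配），如果第一个请求不是目标端点，下面的等待将永远不会结束
    callback_id = await tab.on(
        NetworkEvent.REQUEST_WILL_BE_SENT,
        partial(check_endpoint, tab),
    )

    await event_occurred.wait()
    await tab.remove_callback(callback_id)  # 匹配到目标端点后手动移除回调
    print(f"API 端点 {endpoint} 被调用！")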

# 用法
await wait_for_api_call(tab, '/api/users')
```

!!! info "深入探讨：事件系统详情"
    有关事件处理、回调模式和性能注意事项的综合指南，请参阅[事件系统](../../deep-dive/event-system.md)深入探讨。

### 事件性能

事件很强大但会带来开销。最佳实践：

```python
# ✓ 好：仅启用您需要的
await tab.enable_network_events()

# ✗ 避免：不必要地启用所有事件
await tab.enable_page_events()
await tab.enable_network_events()
await tab.enable_dom_events()
await tab.enable_fetch_events()
await tab.enable_runtime_events()

# ✓ 好：在回调中提前过滤
async def handle_request(event):
    url = event['params']['request']['url']
    if '/api/' not in url:
        return  # 提前跳过非 API 请求
    # 处理 API 请求...

# ✓ 好：完成后禁用
await tab.disable_network_events()
```

## 将所有内容整合在一起

这些核心概念共同创建了一个强大的自动化框架：

```python
import asyncio
import json
from functools import partial
from pydoll.browser.chromium import Chrome
from pydoll.protocol.network.events import NetworkEvent
from pydoll.constants import Keys

async def advanced_scraping():
    """演示多个核心概念协同工作。"""
    async with Chrome() as browser:  # 异步上下文管理器
        tab = await browser.start()
        
        # 事件驱动：捕获 API 数据
        api_responses = []
        
        async def capture_data(tab, event):
            url = event['params']['response']['url']
            if '/api/products' in url:
                request_id = event['params']['requestId']
                body = await tab.get_network_response_body(request_id)
                api_responses.append(json.loads(body))
        
        await tab.enable_network_events()
        await tab.on(NetworkEvent.RESPONSE_RECEIVED, partial(capture_data, tab))
        
        # 无需 WebDriver，直接导航
        await tab.go_to('https://example.com/products')
        
        # 类人交互
        search = await tab.find(id='search')
        await search.type_text('laptop', interval=0.1)  # 自然打字
        await search.press_keyboard_key(Keys.ENTER)
        
        # 等待 API 响应（异步效率）
        await asyncio.sleep(2)
        
        print(f"从 API 捕获了 {len(api_responses)} 个产品")
        return api_responses

# 多浏览器支持：适用于 Chrome、Edge 等
asyncio.run(advanced_scraping())
```

这些基础概念贯穿于 Pydoll 的所有其他部分。当您探索特定功能时，您会看到这些原则在起作用，共同创建可靠、高效和可维护的浏览器自动化。

---

## 下一步是什么？

现在您了解了 Pydoll 的核心设计，您已准备好探索特定功能：

- **[元素查找](element-finding.md)** - 学习 Pydoll 直观的元素定位 API
- **[网络功能](../network/monitoring.md)** - 利用事件系统进行网络分析
- **[浏览器管理](../browser-management/tabs.md)** - 使用异步模式进行并发操作

要获得更深入的技术理解，请探索[深入探讨](../../deep-dive/index.md)部分。

================================================
FILE: docs/zh/features/element-finding.md
================================================
# 元素查找

在网页上查找元素是浏览器自动化的基础。Pydoll 引入了一种革命性的、直观的方法，使元素定位比传统的基于选择器的方法更强大且更易于使用。

## 为什么 Pydoll 的方法与众不同

传统的浏览器自动化工具从一开始就强迫您使用 CSS 选择器和 XPath 表达式进行思考。Pydoll 颠覆了这一点：您使用自然的 HTML 属性描述您要查找的内容，Pydoll 会找出最佳的选择器策略。

```python
# 传统方法（其他工具）
element = driver.find_element(By.XPATH, "//input[@type='email' and @name='username']")

# Pydoll 的方法
element = await tab.find(tag_name="input", type="email", name="username")
```

两者找到相同的元素，但 Pydoll 的语法更清晰、更易维护、更不容易出错。

### 元素查找方法概述

Pydoll 提供三种主要的元素查找方法：

| 方法 | 使用场景 | 示例 |
|--------|----------|---------|
| **`find()`** | 您知道 HTML 属性 | `await tab.find(id="username")` |
| **`query()`** | 您有 CSS/XPath 选择器 | `await tab.query("div.content")` |
| **遍历** | 您想从已知元素探索 | `await element.get_children_elements()` |

```mermaid
flowchart LR
    A[需要元素?] --> B{您有什么?}
    B -->|HTML 属性| C[find 方法]
    B -->|CSS/XPath| D[query 方法]
    B -->|父元素| E[遍历]
    
    C --> F[WebElement]
    D --> F
    E --> G[WebElement 列表]
```

!!! info "深入探讨：工作原理"
    好奇 Pydoll 如何在底层实现元素查找？查看 [FindElements Mixin](../deep-dive/find-elements-mixin.md) 文档，了解架构、性能优化和内部选择器策略。

## find() 方法：自然元素选择

`find()` 方法是您定位元素的主要工具。它接受常见的 HTML 属性作为参数，并自动构建最有效的选择器。

### 基本用法

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def basic_finding():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com')
        
        # 按 ID 查找（最常见且最快）
        username = await tab.find(id="username")
        
        # 按类名查找
        submit_button = await tab.find(class_name="btn-primary")
        
        # 按标签名查找
        first_paragraph = await tab.find(tag_name="p")
        
        # 按 name 属性查找
        email_field = await tab.find(name="email")
        
        # 按文本内容查找
        login_link = await tab.find(text="Login")

asyncio.run(basic_finding())
```

### 组合属性以提高精度

`find()` 的真正威力来自组合多个属性来创建精确的选择器：

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def precise_finding():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com/form')
        
        # 组合标签名和类型
        password_input = await tab.find(tag_name="input", type="password")
        
        # 组合标签、类和自定义属性
        submit_button = await tab.find(
            tag_name="button",
            class_name="btn",
            type="submit"
        )
        
        # 使用 data 属性
        product_card = await tab.find(
            tag_name="div",
            data_testid="product-card",
            data_category="electronics"
        )
        
        # 组合多个条件
        specific_link = await tab.find(
            tag_name="a",
            class_name="nav-link",
            href="/dashboard"
        )

asyncio.run(precise_finding())
```

!!! info "组合逻辑：AND"
    在 `find()` 中组合属性作为 AND 操作。元素必须匹配**所有**提供的属性。
    
    对于需要 OR 逻辑的更复杂场景（例如，目标元素可能带有某个 `id`，也可能只带有某个 `name`），正确的做法是依次尝试多个 `find()` 调用：前一个调用配合 `raise_exc=False` 未找到元素时，再尝试下一个，如"完整示例"部分所示。

!!! tip "属性命名约定"
    对于带连字符的属性名使用下划线。例如，`data-testid` 变成 `data_testid`，`aria-label` 变成 `aria_label`。Pydoll 会自动将它们转换为正确的格式。

### find() 如何选择最佳策略

Pydoll 根据您提供的属性自动选择最有效的选择器：

| 提供的属性 | 使用的策略 | 性能 |
|---------------------|---------------|-------------|
| 单个：`id` | `By.ID` | ⚡ 最快 |
| 单个：`class_name` | `By.CLASS_NAME` | ⚡ 快 |
| 单个：`name` | `By.NAME` | ⚡ 快 |
| 单个：`tag_name` | `By.TAG_NAME` | ⚡ 快 |
| 单个：`text` | `By.XPATH` | ⚡ 快 |
| 多个属性 | XPath 表达式 | ✓ 高效 |

```mermaid
flowchart LR
    A[find 属性] --> B{单个还是多个?}
    B -->|单个| C[直接选择器]
    B -->|多个| D[构建 XPath]
    C --> E[快速执行]
    D --> E
```

### 查找多个元素

使用 `find_all=True` 获取所有匹配元素的列表：

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def find_multiple():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com/products')
        
        # 查找所有产品卡片
        products = await tab.find(class_name="product-card", find_all=True)
        print(f"找到 {len(products)} 个产品")
        
        # 查找导航中的所有链接
        nav_links = await tab.find(
            tag_name="a",
            class_name="nav-link",
            find_all=True
        )
        
        # 处理每个元素
        for link in nav_links:
            text = await link.text
            href = await link.get_attribute("href")
            print(f"链接: {text} → {href}")

asyncio.run(find_multiple())
```

### 等待动态元素

现代 Web 应用程序动态加载内容。使用 `timeout` 等待元素出现：

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def wait_for_elements():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com/dashboard')
        
        # 等待最多 10 秒让元素出现
        dynamic_content = await tab.find(
            class_name="dynamic-content",
            timeout=10
        )
        
        # 等待 AJAX 加载的数据
        user_profile = await tab.find(
            id="user-profile",
            timeout=15
        )
        
        # 处理可能不会出现的元素
        optional_banner = await tab.find(
            class_name="promo-banner",
            timeout=3,
            raise_exc=False  # 如果未找到则返回 None
        )
        
        if optional_banner:
            await optional_banner.click()
        else:
            print("没有促销横幅")

asyncio.run(wait_for_elements())
```

!!! warning "超时最佳实践"
    使用合理的超时值。太短会错过加载缓慢的元素；太长会浪费时间等待不存在的元素。对于大多数动态内容，从 5-10 秒开始。

## query() 方法：直接选择器访问

对于喜欢传统选择器或需要更复杂选择逻辑的开发人员，`query()` 方法提供对 CSS 选择器和 XPath 表达式的直接访问。

### CSS 选择器

CSS 选择器速度快、广为人知，非常适合大多数用例：

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def css_selector_examples():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com')
        
        # 简单选择器
        main_nav = await tab.query("nav.main-menu")
        first_article = await tab.query("article:first-child")
        
        # 属性选择器
        submit_button = await tab.query("button[type='submit']")
        required_inputs = await tab.query("input[required]", find_all=True)
        
        # 复杂选择器
        nested = await tab.query("div.container > .content .item:nth-child(2)")
        
        # 伪类
        first_enabled_button = await tab.query("button:not([disabled])")

asyncio.run(css_selector_examples())
```

### XPath 表达式

XPath 擅长复杂的关系和文本匹配：

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def xpath_examples():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com/table')
        
        # 文本匹配
        button = await tab.query("//button[contains(text(), 'Submit')]")
        
        # 导航到父元素
        input_parent = await tab.query("//input[@name='email']/parent::div")
        
        # 查找兄弟元素
        label_input = await tab.query(
            "//label[text()='Email:']/following-sibling::input"
        )
        
        # 复杂的表格查询
        edit_button = await tab.query(
            "//tr[td[text()='John Doe']]//button[@class='btn-edit']"
        )

asyncio.run(xpath_examples())
```

!!! info "CSS vs XPath：使用哪个？"
    有关在 CSS 选择器和 XPath 之间进行选择的综合指南，包括语法参考和实际示例，请参阅[选择器指南](../deep-dive/selectors-guide.md)。

## DOM 遍历：子元素和兄弟元素

有时您需要从已知的起点探索 DOM 树。Pydoll 提供专门的方法来遍历元素关系。

### DOM 树结构

理解 DOM 树结构有助于您选择正确的遍历方法：

```mermaid
graph TB
    Root[文档根]
    Root --> Container[div id='container']
    
    Container --> Child1[div class='card']
    Container --> Child2[div class='card']
    Container --> Child3[div class='card']
    
    Child1 --> GrandChild1[h2 标题]
    Child1 --> GrandChild2[p 描述]
    Child1 --> GrandChild3[button 操作]
    
    Child2 --> GrandChild4[h2 标题]
    Child2 --> GrandChild5[p 描述]
    
    Child3 --> GrandChild6[h2 标题]
```

### 获取子元素

`get_children_elements()` 方法检索元素的后代：

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def traverse_children():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com/cards')
        
        # 获取容器
        container = await tab.find(id="cards-container")
        
        # 仅获取直接子元素（max_depth=1）
        direct_children = await container.get_children_elements(max_depth=1)
        print(f"容器有 {len(direct_children)} 个直接子元素")
        
        # 包括孙元素（max_depth=2）
        descendants = await container.get_children_elements(max_depth=2)
        print(f"找到 {len(descendants)} 个元素，深度最多为 2 级")
        
        # 按标签名过滤
        links = await container.get_children_elements(
            max_depth=3,
            tag_filter=["a"]
        )
        print(f"在容器中找到 {len(links)} 个链接")
        
        # 组合过滤器以获取特定元素
        nav_links = await container.get_children_elements(
            max_depth=2,
            tag_filter=["a", "button"]
        )

asyncio.run(traverse_children())
```

### 获取兄弟元素

`get_siblings_elements()` 方法查找同一级别的元素：

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def traverse_siblings():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com/list')
        
        # 查找活动项
        active_item = await tab.find(class_name="item-active")
        
        # 获取所有兄弟元素（不包括 active_item 本身）
        all_siblings = await active_item.get_siblings_elements()
        print(f"活动项有 {len(all_siblings)} 个兄弟元素")
        
        # 按标签过滤兄弟元素
        link_siblings = await active_item.get_siblings_elements(
            tag_filter=["a"]
        )
        
        # 处理兄弟元素
        for sibling in all_siblings:
            text = await sibling.text
            print(f"兄弟元素: {text}")

asyncio.run(traverse_siblings())
```

!!! tip "性能注意事项"
    对于大型树，DOM 遍历可能很昂贵。优先使用较浅的 `max_depth` 值和特定的 `tag_filter` 参数以最小化处理的节点数。对于深度嵌套的结构，考虑使用多个有针对性的 `find()` 调用，而不是单个深度遍历。

## 在元素内查找元素

一旦您有了一个元素，您可以使用相同的 `find()` 和 `query()` 方法在其范围内搜索。

!!! warning "重要：搜索深度行为"
    当您调用 `element.find()` 或 `element.query()` 时，Pydoll 会搜索**所有后代**（子元素、孙元素、曾孙元素等），而不仅仅是直接子元素。这是 `querySelector()` 的标准行为，符合大多数开发人员的期望。

### 理解搜索范围

```mermaid
graph TB
    Container[div id='container']
    
    Container --> Child1[div class='card' ✓]
    Container --> Child2[div class='card' ✓]
    Container --> Child3[div class='other']
    
    Child1 --> GrandChild1[div class='card' ✓]
    Child1 --> GrandChild2[p class='text']
    
    Child3 --> GrandChild3[div class='card' ✓]
    Child3 --> GrandChild4[div class='card' ✓]
```

```python
# 这会在树中找到所有 5 个 class='card' 的元素
# （2 个直接子元素 + 3 个嵌套后代）
cards = await container.find(class_name="card", find_all=True)
print(len(cards))  # 输出：5
```

### 基本范围搜索

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def scoped_search():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com/products')
        
        # 查找产品容器
        product_card = await tab.find(class_name="product-card")
        
        # 在产品卡片内搜索（搜索所有后代，仅返回第一个匹配项）
        product_title = await product_card.find(class_name="title")
        product_price = await product_card.find(class_name="price")
        add_button = await product_card.find(tag_name="button", text="Add to Cart")
        
        # 在范围内查询
        product_image = await product_card.query("img.product-image")
        
        # 查找容器内的所有项目（所有后代）
        nav_menu = await tab.find(class_name="nav-menu")
        menu_items = await nav_menu.find(tag_name="li", find_all=True)
        
        print(f"菜单有 {len(menu_items)} 项")

asyncio.run(scoped_search())
```

### 仅查找直接子元素

如果您需要查找**仅直接子元素**（深度 1），请使用 CSS 子组合器 `>` 或 XPath：

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def direct_children_only():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com/cards')
        
        container = await tab.find(id="cards-container")
        
        # 方法 1：CSS 子组合器（>）
        # 仅查找具有 class='card' 的直接子元素
        direct_cards = await container.query("> .card", find_all=True)
        print(f"直接子元素: {len(direct_cards)}")
        
        # 方法 2：XPath 直接子元素
        direct_divs = await container.query("./div[@class='card']", find_all=True)
        
        # 方法 3：使用 max_depth=1 的 get_children_elements()
        # （但这只按标签过滤，不按其他属性）
        direct_children = await container.get_children_elements(
            max_depth=1,
            tag_filter=["div"]
        )
        
        # 然后按类手动过滤
        cards_only = [
            child for child in direct_children
            if 'card' in (await child.get_attribute('class') or '')
        ]

asyncio.run(direct_children_only())
```

### 比较：find() vs get_children_elements()

| 特性 | `find()` / `query()` | `get_children_elements()` |
|---------|---------------------|---------------------------|
| **搜索深度** | 所有后代 | 使用 `max_depth` 可配置 |
| **过滤依据** | 任何 HTML 属性 | 仅标签名 |
| **用例** | 在子树中的任何位置查找特定元素 | 探索 DOM 结构，获取直接子元素 |
| **性能** | 针对单个属性优化 | 适合广泛探索 |
| **参数** | `tag_name="a"`（字符串） | `tag_filter=["a"]`（列表） |

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def comparison_example():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com')
        
        container = await tab.find(id="container")
        
        # 场景 1：我想要容器中任何位置的所有链接
        # 使用 find() - 搜索所有后代
        all_links = await container.find(tag_name="a", find_all=True)
        
        # 场景 2：我只想要直接子链接
        # 使用 CSS 子组合器
        direct_links = await container.query("> a", find_all=True)
        
        # 场景 3：我想要具有特定类的直接子元素
        # 使用 CSS 子组合器
        direct_cards = await container.query("> .card", find_all=True)
        
        # 场景 4：我想探索 DOM 结构
        # 使用 get_children_elements()
        direct_children = await container.get_children_elements(max_depth=1)
        
        # 场景 5：我想要深度最多为 2 的所有后代，按标签过滤
        # 使用 get_children_elements()
        shallow_links = await container.get_children_elements(
            max_depth=2,
            tag_filter=["a"]
        )

asyncio.run(comparison_example())
```

!!! tip "何时使用每种方法"
    - **使用 `find()`**：当您知道属性（class、id 等）并想搜索整个子树时
    - **使用 `query("> .class")`**：当您只需要具有特定属性的直接子元素时
    - **使用 `get_children_elements()`**：当探索 DOM 结构或仅按标签过滤时

### 常见用例

这种范围搜索对于处理重复模式非常有用，例如：

- 电子商务网站中的产品卡片
- 具有多个单元格的表格行
- 具有多个字段的表单部分
- 具有嵌套项的导航菜单

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def practical_example():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com/products')
        
        # 查找页面上的所有产品卡片
        product_cards = await tab.find(class_name="product-card", find_all=True)
        
        for card in product_cards:
            # 在每个卡片内，查找具有这些类的所有后代
            title = await card.find(class_name="product-title")
            price = await card.find(class_name="product-price")
            
            # 获取此卡片内任何位置的按钮
            buy_button = await card.find(tag_name="button", text="Buy Now")
            
            title_text = await title.text
            price_text = await price.text
            
            print(f"产品: {title_text}, 价格: {price_text}")
            
            # 点击购买按钮
            await buy_button.click()

asyncio.run(practical_example())
```

## Shadow DOM 支持

许多现代 Web 应用程序使用 [Shadow DOM](https://developer.mozilla.org/zh-CN/docs/Web/API/Web_components/Using_shadow_DOM) 来封装组件内部结构。Pydoll 通过 `ShadowRoot` 类提供对 shadow 树内元素的无缝访问。

### Shadow DOM 的工作原理

```mermaid
graph TB
    Host["div#my-component (shadow host)"]
    SR["ShadowRoot (open)"]
    Internal1["button.internal-btn"]
    Internal2["input.internal-input"]

    Host --> SR
    SR --> Internal1
    SR --> Internal2
```

shadow root 内的元素对常规 DOM 查询是隐藏的。您需要先访问 shadow root，然后在其中进行搜索。

### 访问 Shadow Root

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def shadow_dom_example():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com/web-components')

        # 查找 shadow host 元素
        shadow_host = await tab.find(id='my-component')

        # 访问其 shadow root
        shadow_root = await shadow_host.get_shadow_root()

        # 在 shadow root 内使用 query() 和 CSS 选择器查找元素
        button = await shadow_root.query('.internal-btn')
        await button.click()

        input_field = await shadow_root.query('input[type="email"]')
        await input_field.type_text('user@example.com')

asyncio.run(shadow_dom_example())
```

### 使用 query() 和 CSS 选择器

`ShadowRoot` 继承自 `FindElementsMixin`，但带有 `_css_only` 限制，这意味着仅支持使用 CSS 选择器的 `query()`。`find()` 方法和使用 XPath 的 `query()` 会抛出 `NotImplementedError`：

```python
# query() 配合 CSS 选择器 — 推荐方法
element = await shadow_root.query('#inner-id')
element = await shadow_root.query('button.primary')
element = await shadow_root.query('div.container > .content')

# find_all 查找多个元素
items = await shadow_root.query('.item', find_all=True)

# 带超时的等待
element = await shadow_root.query('#dynamic', timeout=5)
```

!!! warning "ShadowRoot 不支持 find() 和 XPath"
    调用 `shadow_root.find()` 或 `shadow_root.query('//xpath')` 会抛出 `NotImplementedError`。在 shadow root 中请始终使用带 CSS 选择器的 `query()`。

### 嵌套 Shadow Root

Web 组件可以包含拥有自己 shadow root 的其他 Web 组件：

```python
async def nested_shadow():
    outer_host = await tab.find(tag_name='outer-component')
    outer_shadow = await outer_host.get_shadow_root()

    inner_host = await outer_shadow.query('inner-component')
    inner_shadow = await inner_host.get_shadow_root()

    deep_button = await inner_shadow.query('.deep-btn')
    await deep_button.click()
```

### 查找 Shadow Root：find_shadow_roots()

当您需要探索页面上存在哪些 shadow root（对调试或 Cloudflare 挑战等动态页面很有用）时，使用 `find_shadow_roots()`：

```python
# 查找页面上的所有 shadow root
shadow_roots = await tab.find_shadow_roots()

for sr in shadow_roots:
    print(f'模式: {sr.mode}, 宿主: {sr.host_element}')
    # 在每个 shadow root 内搜索
    btn = await sr.query('button', raise_exc=False)
    if btn:
        await btn.click()
```

#### 等待 Shadow Root：`timeout`

Shadow 宿主通常是异步注入的（例如 Cloudflare Turnstile 在 OOPIF 中加载）。使用 `timeout` 进行轮询直到 shadow root 出现：

```python
# 等待最多 10 秒让 shadow root 出现
shadow_roots = await tab.find_shadow_roots(timeout=10)
```

元素上的 `get_shadow_root()` 方法也支持 `timeout`：

```python
# 等待元素的 shadow root 出现
host = await tab.find(id='my-component', timeout=5)
shadow = await host.get_shadow_root(timeout=5)
```

#### 深度遍历：跨域 IFrame（OOPIF）

默认情况下，`find_shadow_roots()` 仅遍历主文档的 DOM 树（包括通过 `contentDocument` 访问的同源 iframe，但**不包括**跨域 iframe）。传入 `deep=True` 以同时发现跨域 iframe（OOPIF）内的 shadow root：

```python
# 包含跨域 iframe 中的 shadow root（例如 Cloudflare Turnstile）
shadow_roots = await tab.find_shadow_roots(deep=True, timeout=10)

for sr in shadow_roots:
    print(f'模式: {sr.mode}, 宿主: {sr.host_element}')
    # 在这些 shadow root 中找到的元素会自动通过
    # 正确的 OOPIF 会话路由 CDP 命令
    btn = await sr.query('input[type="checkbox"]', raise_exc=False)
    if btn:
        await btn.click()
```

!!! tip "何时使用 `deep=True`"
    在自动化包含跨域嵌入式组件的页面时使用 `deep=True`，例如 Cloudflare Turnstile 验证码、第三方支付表单或社交登录按钮。这些组件通常使用跨域 iframe，其中包含关闭的 shadow root。

### Shadow Root 属性

```python
shadow_root = await element.get_shadow_root()

# 检查 shadow root 模式（open、closed 或 user-agent）
print(shadow_root.mode)  # ShadowRootType.OPEN

# 访问 host 元素
host = shadow_root.host_element

# 获取 shadow root 内部 HTML
html = await shadow_root.inner_html
```

!!! note "关闭的 Shadow Root"
    关闭的 shadow root（`mode='closed'`）可以通过 CDP 访问，因为协议绕过了 JavaScript 限制。但是，某些浏览器内部的 shadow root（user-agent）可能具有有限的可访问性。

## 使用 iFrame

!!! info "另有完整的 IFrame 指南"
    本节介绍用于元素查找的基本 iframe 交互。有关包括嵌套 iframe、CAPTCHA 处理、技术深入探讨和故障排除的综合指南，请参阅**[使用 IFrame](automation/iframes.md)**。

iFrame 在浏览器自动化中提出了特殊的挑战，因为它们具有单独的 DOM 上下文。Pydoll 使 iframe 交互无缝：

### iFrame 上下文隔离

```mermaid
flowchart TB
    Main[tab]
    Frame["iframe WebElement"]
    Content["iframe 内部元素"]

    Main -->|"find('iframe')"| Frame
    Frame -->|"find('button#submit')"| Content
```

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def iframe_interaction():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com/page-with-iframe')

        iframe = await tab.query("iframe.embedded-content", timeout=10)

        # WebElement 辅助方法会自动在 iframe 内执行
        iframe_button = await iframe.find(tag_name="button", class_name="submit")
        await iframe_button.click()

        iframe_input = await iframe.find(id="captcha-input")
        await iframe_input.type_text("verification-code")

        # 如果还有内层 iframe，继续链式查找
        inner_iframe = await iframe.find(tag_name="iframe")
        download_link = await inner_iframe.find(text="下载 PDF")
        await download_link.click()

asyncio.run(iframe_interaction())
```

!!! note "iframe 中的截图"
    `tab.take_screenshot()` 只能作用于顶层 target。想要截取 iframe 内容，请锁定 iframe 内部的某个元素，使用 `element.take_screenshot()`。

## 错误处理策略

健壮的自动化需要处理元素不存在或出现时间超过预期的情况。

### 元素查找流程与错误处理

```mermaid
flowchart TB
    Start[开始查找元素] --> Immediate[尝试立即查找]
    
    Immediate --> Found1{找到元素?}
    Found1 -->|是| Return1[返回 WebElement]
    Found1 -->|否 & timeout=0| Check1{raise_exc=True?}
    Found1 -->|否 & timeout>0| Wait[开始等待循环]
    
    Check1 -->|是| Error1[抛出 ElementNotFound]
    Check1 -->|否| ReturnNone[返回 None]
    
    Wait --> Sleep[等待 0.5 秒]
    Sleep --> TryAgain[再次尝试查找]
    TryAgain --> Found2{找到元素?}
    
    Found2 -->|是| Return2[返回 WebElement]
    Found2 -->|否| TimeCheck{超时?}
    
    TimeCheck -->|否| Sleep
    TimeCheck -->|是| Check2{raise_exc=True?}
    
    Check2 -->|是| Error2[抛出 WaitElementTimeout]
    Check2 -->|否| ReturnNone2[返回 None]
```

### 使用 raise_exc 参数

控制在未找到元素时是否抛出异常：

```python
import asyncio
from pydoll.browser.chromium import Chrome
from pydoll.exceptions import ElementNotFound

async def error_handling():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com')
        
        # 如果未找到则抛出异常（默认行为）
        try:
            critical_element = await tab.find(id="must-exist")
        except ElementNotFound:
            print("缺少关键元素！无法继续。")
            return
        
        # 如果未找到则返回 None（可选元素）
        optional_banner = await tab.find(
            class_name="promo-banner",
            raise_exc=False
        )
        
        if optional_banner:
            print("找到横幅，正在关闭它")
            close_button = await optional_banner.find(class_name="close-btn")
            await close_button.click()
        else:
            print("没有横幅，继续")

asyncio.run(error_handling())
```

## 最佳实践

### 1. 优先使用稳定的选择器

使用不太可能改变的属性：

```python
# 好：语义属性
await tab.find(id="user-profile")  # ID 通常是稳定的
await tab.find(data_testid="submit-button")  # 测试 ID 专为自动化设计
await tab.find(name="username")  # 表单名称是稳定的

# 避免：结构依赖
await tab.query("div > div > div:nth-child(3) > input")  # 脆弱，容易损坏
```

### 2. 使用最简单的有效选择器

从简单开始，仅在需要时添加复杂性：

```python
# 好：简单明了
await tab.find(id="login-form")

# 不必要：过于复杂
await tab.query("//div[@id='content']/descendant::form[@id='login-form']")
```

### 3. 选择正确的方法

- 使用 `find()` 进行简单的基于属性的搜索
- 使用 `query()` 进行复杂的 CSS 或 XPath 模式
- 使用遍历方法从已知锚点探索

```python
# 使用 find() 处理简单情况
username = await tab.find(id="username")

# 使用 query() 处理复杂模式
active_nav_link = await tab.query("nav.menu a.active")

# 使用遍历进行基于关系的搜索
container = await tab.find(id="cards")
child_links = await container.get_children_elements(tag_filter=["a"])
```

### 4. 添加有意义的超时

不要对动态内容使用零超时，也不要永远等待可选元素：

```python
# 好：合理的超时
critical_data = await tab.find(id="data", timeout=10)
optional_popup = await tab.find(class_name="popup", timeout=2, raise_exc=False)

# 坏：动态内容没有超时
dynamic_element = await tab.find(class_name="ajax-loaded")  # 会立即失败

# 坏：可选元素的超时时间太长
banner = await tab.find(class_name="ad-banner", timeout=60)  # 浪费时间
```

### 5. 优雅地处理错误

为可能不存在的元素制定计划：

```python
# 关键元素：让异常冒泡
submit_button = await tab.find(id="submit-btn")

# 可选元素：显式处理
cookie_notice = await tab.find(class_name="cookie-notice", raise_exc=False)
if cookie_notice:
    accept_button = await cookie_notice.find(text="Accept")
    await accept_button.click()
```

## 完整示例：表单自动化

这是一个结合多种元素查找技术的完整示例：

```python
import asyncio
from pydoll.browser.chromium import Chrome
from pydoll.exceptions import ElementNotFound

async def automate_registration_form():
    async with Chrome() as browser:
        tab = await browser.start()
        
        try:
            # 导航到注册页面
            await tab.go_to('https://example.com/register', timeout=10)
            
            # 处理可选的 cookie 横幅
            cookie_banner = await tab.find(
                class_name="cookie-banner",
                timeout=2,
                raise_exc=False
            )
            if cookie_banner:
                accept = await cookie_banner.find(text="Accept")
                await accept.click()
                await asyncio.sleep(1)
            
            # 填写注册表单
            # 查找表单字段
            username_field = await tab.find(name="username", timeout=5)
            email_field = await tab.find(name="email")
            password_field = await tab.find(type="password", name="password")
            confirm_password = await tab.find(type="password", name="confirm_password")
            
            # 输入信息
            await username_field.type_text("john_doe_2024", interval=0.1)
            await email_field.type_text("john@example.com", interval=0.1)
            await password_field.type_text("SecurePass123!", interval=0.1)
            await confirm_password.type_text("SecurePass123!", interval=0.1)
            
            # 查找并勾选条款复选框
            # 尝试多种策略
            terms_checkbox = await tab.find(id="terms", raise_exc=False)
            if not terms_checkbox:
                terms_checkbox = await tab.find(name="accept_terms", raise_exc=False)
            if not terms_checkbox:
                terms_checkbox = await tab.query("input[type='checkbox']")
            
            await terms_checkbox.click()
            
            # 查找并点击提交按钮
            submit_button = await tab.find(
                tag_name="button",
                type="submit",
                timeout=2
            )
            await submit_button.click()
            
            # 等待成功消息，超时时间更长（表单处理）
            success_message = await tab.find(
                class_name="success-message",
                timeout=15
            )
            
            message_text = await success_message.text
            print(f"注册成功: {message_text}")
            
            # 验证重定向到仪表板
            await asyncio.sleep(2)
            current_url = await tab.current_url
            
            if "dashboard" in current_url:
                print("成功重定向到仪表板")
                
                # 查找欢迎消息
                welcome = await tab.find(class_name="welcome-message", timeout=5)
                welcome_text = await welcome.text
                print(f"欢迎消息: {welcome_text}")
            else:
                print(f"注册后的意外 URL: {current_url}")
                
        except ElementNotFound as e:
            print(f"元素未找到: {e}")
            # 为调试截图
            await tab.take_screenshot("error_screenshot.png")
        except Exception as e:
            print(f"意外错误: {e}")
            await tab.take_screenshot("unexpected_error.png")

asyncio.run(automate_registration_form())
```

## 了解更多

想深入了解元素查找？

- **[FindElements Mixin 深入探讨](../deep-dive/find-elements-mixin.md)**：了解架构、内部选择器策略和性能优化
- **[选择器指南](../deep-dive/selectors-guide.md)**：CSS 选择器和 XPath 的综合指南，包含语法参考和实际示例
- **[WebElement 域](../deep-dive/webelement-domain.md)**：了解找到元素后可以对元素执行的操作

元素查找是成功的浏览器自动化的基础。掌握这些技术，您将能够可靠地定位任何网页上的任何元素，无论结构多么复杂。

================================================
FILE: docs/zh/features/index.md
================================================
# 功能指南

欢迎来到 Pydoll 的综合功能文档！在这里，您将发现使 Pydoll 成为强大而灵活的浏览器自动化工具的一切。无论您是刚刚入门还是希望利用高级功能，您都将找到每个功能的详细指南、实用示例和最佳实践。

## 您将在这里找到什么

本指南按照逻辑部分组织，反映了您的自动化之旅：从基本概念到高级技术。每个页面都设计为独立的，因此您可以直接跳转到您感兴趣的内容，或者按顺序学习。

## 核心概念

在深入了解特定功能之前，值得了解是什么使 Pydoll 与众不同。这些基础概念决定了整个库的工作方式。

**[核心概念](core-concepts.md)**：探索使 Pydoll 与众不同的架构决策：零 WebDriver 方法消除了兼容性问题，异步优先设计实现了真正的并发操作，以及对多个基于 Chromium 的浏览器的原生支持。

## 元素查找和交互

查找页面元素并与之交互是自动化的基础。Pydoll 通过现代化的 API 使这一过程变得出奇地直观。

**[元素查找](element-finding.md)**：掌握 Pydoll 的元素定位策略，从使用自然 HTML 属性的直观 `find()` 方法，到用于 CSS 选择器和 XPath 的强大 `query()` 方法。您还将学习 DOM 遍历辅助工具，让您高效地导航页面结构。

## 自动化能力

这些功能使您的自动化栩栩如生：模拟用户交互、键盘控制、处理文件操作、使用 iframe 以及捕获视觉内容。

**[类人交互](automation/human-interactions.md)**：学习如何创建真正感觉像人类的交互：具有自然时间变化的打字、具有真实鼠标移动的点击，以及像真实用户一样使用键盘快捷键。这对于避免在自动化敏感站点中被检测至关重要。

**[键盘控制](automation/keyboard-control.md)**：掌握键盘交互，全面支持组合键、修饰键和特殊键。对于表单、快捷键和可访问性测试至关重要。

**[文件操作](automation/file-operations.md)**：文件处理在浏览器自动化中可能很棘手。Pydoll 为上传和下载提供了强大的解决方案，`expect_download` 上下文管理器提供了优雅的异步下载完成处理。

**[IFrame 交互](automation/iframes.md)**：把 iframe 当成普通元素——定位 iframe 后在其内部继续查找，无需额外 target 或 Tab。

**[截图和 PDF](automation/screenshots-and-pdfs.md)**：从您的自动化会话中捕获视觉内容。无论您需要用于视觉回归测试的整页截图、用于调试的元素特定捕获，还是用于归档的 PDF 导出，Pydoll 都能满足您的需求。

## 网络功能

Pydoll 的网络功能是它真正出色的地方，为您提供前所未有的 HTTP 流量可见性和控制。

**[网络监控](network/monitoring.md)**：观察和分析浏览器会话中的所有网络活动。提取 API 响应、跟踪请求时间、识别失败的请求，并准确了解正在交换的数据。对于调试、测试和数据提取至关重要。

**[请求拦截](network/interception.md)**：超越观察，主动修改网络行为。阻止不需要的资源、注入自定义标头、修改请求负载，甚至使用模拟数据满足请求。这对于测试、优化和隐私控制非常强大。

**[浏览器上下文 HTTP 请求](network/http-requests.md)**：发出在浏览器的 JavaScript 上下文中执行的 HTTP 请求，自动继承会话状态、cookie 和身份验证。这种混合方法结合了 Python 的 `requests` 库的熟悉性与浏览器上下文执行的优势。

## 浏览器管理

有效的浏览器和标签页管理对于复杂的自动化场景、并行处理和多用户测试至关重要。

**[多标签页管理](browser-management/tabs.md)**：同时使用多个浏览器标签页，确保高效的资源使用，同时让您完全控制标签页生命周期、检测用户打开的标签页以及并发抓取操作。

**[浏览器上下文](browser-management/contexts.md)**：在单个浏览器进程内创建完全隔离的浏览环境。每个上下文维护单独的 cookie、存储、缓存和权限：非常适合多账户测试、A/B 测试或使用不同配置的并行抓取。

**[Cookie 和会话](browser-management/cookies-sessions.md)**：在浏览器和标签页级别管理会话状态。以编程方式设置 cookie、提取会话数据，并在浏览器上下文中维护不同的会话以进行复杂的测试场景。

## 配置

自定义浏览器行为的各个方面以匹配您的自动化需求，从低级 Chromium 首选项到命令行参数和页面加载策略。

**[浏览器选项](configuration/browser-options.md)**：配置 Chromium 的启动参数、命令行参数和页面加载状态控制。微调浏览器行为、启用实验性功能，并针对您的自动化需求优化性能。

**[浏览器首选项](configuration/browser-preferences.md)**：直接访问 Chromium 的内部首选项系统，让您控制数百个设置。配置下载、禁用功能、优化性能，或为隐蔽自动化创建真实的浏览器指纹。

**[代理配置](configuration/proxy.md)**：具有完整身份验证功能的原生代理支持。对于需要 IP 轮换、地理定向测试或注重隐私的自动化的网络抓取项目至关重要。

## 高级功能

这些复杂的功能解决了复杂的自动化挑战和专门的用例。

**[行为验证码绕过](advanced/behavioral-captcha-bypass.md)**：Pydoll 的原生行为验证码处理是其最受欢迎的功能之一。学习如何使用两种方法与 Cloudflare Turnstile、reCAPTCHA v3 和 hCaptcha 隐形挑战进行交互 - 用于保证完成的同步上下文管理器，以及用于非阻塞操作的后台处理。

**[事件系统](advanced/event-system.md)**：构建响应实时浏览器事件的响应式自动化。监控页面加载、网络活动、DOM 更改和 JavaScript 执行，以创建智能、自适应的自动化脚本。

**[远程连接](advanced/remote-connections.md)**：通过 WebSocket 连接到已运行的浏览器以实现混合自动化场景。非常适合 CI/CD 管道、容器化环境或将 Pydoll 集成到现有的 CDP 工具中。

## 如何使用本指南

每个功能页面遵循一致的结构：

1. **概述** - 功能的作用及其重要性
2. **基本用法** - 通过简单示例快速入门
3. **高级模式** - 充分利用功能的潜力
4. **最佳实践** - 有效和高效使用的技巧
5. **常见陷阱** - 从常见错误中学习

您可以根据需要以任何顺序探索功能。代码示例是完整的并且可以直接运行 - 只需复制、粘贴并适应您的用例。

准备深入了解 Pydoll 的功能了吗？选择一个您感兴趣的功能，开始探索吧！🚀

================================================
FILE: docs/zh/features/network/http-requests.md
================================================
# 浏览器上下文 HTTP 请求

发起自动继承浏览器会话状态、Cookie 和身份验证的 HTTP 请求。非常适合结合 UI 导航和 API 效率的混合自动化。

!!! tip "混合自动化的颠覆性功能"
    是否曾希望发起的 HTTP 请求能够自动携带浏览器的全部 Cookie 和身份验证信息？现在可以做到了！`tab.request` 属性提供了一个类似 `requests` 的简洁接口，可以**直接在浏览器的 JavaScript 上下文中**执行 HTTP 调用。

## 为什么使用浏览器上下文请求？

传统自动化通常需要您手动提取 Cookie 和标头以进行 API 调用。浏览器上下文请求消除了这种麻烦：

| 传统方法 | 浏览器上下文请求 |
|---------------------|-------------------------|
| 手动提取 Cookie | Cookie 自动继承 |
| 管理会话令牌 | 会话状态保留 |
| 单独处理 CORS | 遵守 CORS 策略 |
| 同时使用两个 HTTP 客户端 | 一个统一的接口 |
| 同步身份验证状态 | 始终已认证 |

**非常适合：**

- 通过 UI 登录后抓取已认证的 API
- 混合工作流，混合浏览器交互和 API 调用
- 测试已认证的端点而无需管理令牌
- 绕过复杂的身份验证流程
- 使用单页应用程序（SPA）

## 快速入门

最简单的示例：通过 UI 登录，然后进行已认证的 API 调用：

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def hybrid_automation():
    async with Chrome() as browser:
        tab = await browser.start()
        
        # 1. 通过 UI 正常登录
        await tab.go_to('https://example.com/login')
        await (await tab.find(id='username')).type_text('user@example.com')
        await (await tab.find(id='password')).type_text('password123')
        await (await tab.find(id='login-btn')).click()
        
        # 登录后等待重定向
        await asyncio.sleep(2)
        
        # 2. 现在使用已认证的会话进行 API 调用！
        response = await tab.request.get('https://example.com/api/user/profile')
        user_data = response.json()
        
        print(f"登录为: {user_data['name']}")
        print(f"邮箱: {user_data['email']}")

asyncio.run(hybrid_automation())
```

!!! success "无需 Cookie 管理"
    注意我们没有提取或传递任何 Cookie？请求自动继承了浏览器的已认证会话！

## 常见用例

### 1. 抓取已认证的 API

使用 UI 登录，然后使用 API 提取数据：

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def scrape_user_data():
    async with Chrome() as browser:
        tab = await browser.start()
        
        # 通过 UI 登录（处理复杂的认证流程）
        await tab.go_to('https://app.example.com/login')
        await (await tab.find(id='email')).type_text('user@example.com')
        await (await tab.find(id='password')).type_text('password')
        await (await tab.find(type='submit')).click()
        await asyncio.sleep(2)
        
        # 现在通过 API 提取数据（比抓取 UI 快得多）
        all_users = []
        for page in range(1, 6):
            response = await tab.request.get(
                f'https://app.example.com/api/users',
                params={'page': str(page), 'limit': '100'}
            )
            users = response.json()['users']
            all_users.extend(users)
            print(f"第 {page} 页: 获取了 {len(users)} 个用户")
        
        print(f"抓取的总用户数: {len(all_users)}")

asyncio.run(scrape_user_data())
```

### 2. 测试受保护的端点

测试 API 端点而无需管理身份验证令牌：

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def test_api_endpoints():
    async with Chrome() as browser:
        tab = await browser.start()
        
        # 一次性认证
        await tab.go_to('https://api.example.com/login')
        # ... 执行登录 ...
        await asyncio.sleep(2)
        
        # 测试多个端点
        endpoints = [
            '/api/users/me',
            '/api/settings',
            '/api/notifications',
            '/api/dashboard/stats'
        ]
        
        for endpoint in endpoints:
            response = await tab.request.get(f'https://api.example.com{endpoint}')
            
            if response.ok:
                print(f"成功 {endpoint}: {response.status_code}")
            else:
                print(f"失败 {endpoint}: {response.status_code}")
                print(f"   错误: {response.text[:100]}")

asyncio.run(test_api_endpoints())
```

### 3. 通过 API 提交表单

通过直接向 API 发送数据来更快地提交表单：

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def bulk_form_submission():
    async with Chrome() as browser:
        tab = await browser.start()
        
        # 首先登录
        await tab.go_to('https://crm.example.com/login')
        # ... 登录逻辑 ...
        await asyncio.sleep(2)
        
        # 通过 API 提交多个条目（比填写表单快得多）
        contacts = [
            {'name': 'John Doe', 'email': 'john@example.com', 'company': 'Acme Inc'},
            {'name': 'Jane Smith', 'email': 'jane@example.com', 'company': 'Tech Corp'},
            {'name': 'Bob Wilson', 'email': 'bob@example.com', 'company': 'StartupXYZ'},
        ]
        
        for contact in contacts:
            response = await tab.request.post(
                'https://crm.example.com/api/contacts',
                json=contact
            )
            
            if response.ok:
                print(f"已添加: {contact['name']}")
            else:
                print(f"失败: {contact['name']} - {response.status_code}")

asyncio.run(bulk_form_submission())
```

### 4. 使用会话下载文件

下载需要身份验证的文件：

```python
import asyncio
from pathlib import Path
from pydoll.browser.chromium import Chrome

async def download_authenticated_file():
    async with Chrome() as browser:
        tab = await browser.start()
        
        # 认证
        await tab.go_to('https://portal.example.com/login')
        # ... 登录逻辑 ...
        await asyncio.sleep(2)
        
        # 下载需要身份验证的文件
        response = await tab.request.get(
            'https://portal.example.com/api/reports/monthly.pdf'
        )
        
        if response.ok:
            # 保存文件
            output_path = Path('/tmp/monthly_report.pdf')
            output_path.write_bytes(response.content)
            print(f"已下载: {output_path} ({len(response.content)} 字节)")
        else:
            print(f"下载失败: {response.status_code}")

asyncio.run(download_authenticated_file())
```

### 5. 使用自定义标头

向您的请求添加自定义标头：

```python
import asyncio
from pydoll.browser.chromium import Chrome
from pydoll.protocol.fetch.types import HeaderEntry

async def custom_headers_example():
    async with Chrome() as browser:
        tab = await browser.start()
        
        # 首先登录
        await tab.go_to('https://api.example.com/login')
        # ... 登录逻辑 ...
        
        # 使用自定义标头发起请求
        headers: list[HeaderEntry] = [
            {'name': 'X-API-Version', 'value': '2.0'},
            {'name': 'X-Request-ID', 'value': 'unique-id-123'},
            {'name': 'Accept-Language', 'value': 'pt-BR,pt;q=0.9'},
        ]
        
        response = await tab.request.get(
            'https://api.example.com/data',
            headers=headers
        )
        
        print(f"状态: {response.status_code}")
        print(f"数据: {response.json()}")

asyncio.run(custom_headers_example())
```

### 6. 处理不同的响应类型

以多种格式访问响应数据：

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def response_formats():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://api.example.com')
        
        # JSON 响应
        json_response = await tab.request.get('/api/users/1')
        user = json_response.json()
        print(f"JSON: {user}")
        
        # 文本响应
        text_response = await tab.request.get('/api/status')
        status_text = text_response.text
        print(f"文本: {status_text}")
        
        # 二进制响应（例如，图像）
        image_response = await tab.request.get('/api/avatar/1')
        image_bytes = image_response.content
        print(f"二进制: {len(image_bytes)} 字节")
        
        # 检查响应状态
        if json_response.ok:
            print("请求成功！")
        
        # 访问响应 URL（在重定向后很有用）
        print(f"最终 URL: {json_response.url}")

asyncio.run(response_formats())
```

## HTTP 方法

支持所有标准的 HTTP 方法：

### GET - 检索数据

```python
# 简单的 GET
response = await tab.request.get('https://api.example.com/users')

# 带查询参数的 GET
response = await tab.request.get(
    'https://api.example.com/search',
    params={'q': 'python', 'limit': '10'}
)
```

### POST - 创建资源

```python
# 使用 JSON 数据的 POST
response = await tab.request.post(
    'https://api.example.com/users',
    json={'name': 'John Doe', 'email': 'john@example.com'}
)

# 使用表单数据的 POST
response = await tab.request.post(
    'https://api.example.com/login',
    data={'username': 'john', 'password': 'secret'}
)
```

### PUT - 更新资源

```python
# 更新整个资源
response = await tab.request.put(
    'https://api.example.com/users/123',
    json={'name': 'Jane Doe', 'email': 'jane@example.com', 'role': 'admin'}
)
```

### PATCH - 部分更新

```python
# 更新特定字段
response = await tab.request.patch(
    'https://api.example.com/users/123',
    json={'email': 'newemail@example.com'}
)
```

### DELETE - 删除资源

```python
# 删除资源
response = await tab.request.delete('https://api.example.com/users/123')
```

### HEAD - 仅获取标头

```python
# 检查资源是否存在而不下载它
response = await tab.request.head('https://example.com/large-file.zip')
print(f"Content-Length: {response.headers}")
```

### OPTIONS - 检查功能

```python
# 检查允许的方法
response = await tab.request.options('https://api.example.com/users')
print(f"允许的方法: {response.headers}")
```

!!! info "这是如何工作的？"
    浏览器上下文请求使用 Fetch API 直接在浏览器的 JavaScript 上下文中执行 HTTP 调用，同时监控 CDP 网络事件以捕获全面的元数据（标头、Cookie、时序）。
    
    有关内部架构、事件监控和实现详细信息的详细说明，请参阅[浏览器请求架构](../../deep-dive/browser-requests-architecture.md)。

## 响应对象

`Response` 对象提供了类似于 `requests.Response` 的熟悉接口：

```python
response = await tab.request.get('https://api.example.com/users')

# 状态码
print(response.status_code)  # 200, 404, 500 等

# 检查是否成功（2xx 或 3xx）
if response.ok:
    print("成功！")

# 响应体
text_data = response.text      # 作为字符串
byte_data = response.content   # 作为字节
json_data = response.json()    # 解析的 JSON

# 标头
for header in response.headers:
    print(f"{header['name']}: {header['value']}")

# 请求标头（实际发送的内容）
for header in response.request_headers:
    print(f"{header['name']}: {header['value']}")

# 响应设置的 Cookie
for cookie in response.cookies:
    print(f"{cookie['name']} = {cookie['value']}")

# 最终 URL（在重定向后）
print(response.url)

# 为错误状态码引发异常
response.raise_for_status()  # 如果是 4xx 或 5xx 则引发 HTTPError
```

!!! note "重定向和 URL 跟踪"
    `response.url` 属性仅包含所有重定向后的**最终 URL**。如果您需要跟踪完整的重定向链（中间 URL、状态码、时序），请使用[网络监控](monitoring.md)详细观察所有请求。

## 标头和 Cookie

### 使用标头

标头表示为 `HeaderEntry` 对象：

```python
import asyncio
from pydoll.browser.chromium import Chrome
from pydoll.protocol.fetch.types import HeaderEntry

async def header_example():
    async with Chrome() as browser:
        tab = await browser.start()
        
        # 使用 HeaderEntry 类型以获得 IDE 自动完成和类型检查
        headers: list[HeaderEntry] = [
            {'name': 'Authorization', 'value': 'Bearer token-123'},
            {'name': 'X-Custom-Header', 'value': 'custom-value'},
        ]
        
        response = await tab.request.get(
            'https://api.example.com/protected',
            headers=headers
        )
        
        # 检查响应标头（也是 HeaderEntry 类型的字典）
        for header in response.headers:
            if header['name'] == 'Content-Type':
                print(f"Content-Type: {header['value']}")

asyncio.run(header_example())
```

!!! tip "标头的类型提示"
    `HeaderEntry` 是来自 `pydoll.protocol.fetch.types` 的 `TypedDict`。将其用作类型提示可为您提供：
    
    - **自动完成**：IDE 建议 `name` 和 `value` 键
    - **类型安全**：在运行前捕获拼写错误和缺失的键
    - **文档**：清晰的标头结构
    
    虽然您可以传递普通字典，但使用类型提示可以提高代码质量和 IDE 支持。

!!! tip "自定义标头行为"
    自定义标头与浏览器的自动标头（如 `User-Agent`、`Accept`、`Referer` 等）**一起**发送。
    
    如果您尝试设置标准浏览器标头（例如 `User-Agent`），行为取决于特定标头；有些可能会被覆盖，其他可能被忽略，有些可能会导致冲突。对于大多数用例，坚持使用自定义标头（例如 `X-API-Key`、`Authorization`）以避免意外行为。

### 理解 Cookie

Cookie 由浏览器自动管理：

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def cookie_example():
    async with Chrome() as browser:
        tab = await browser.start()
        
        # 第一个请求设置 Cookie
        login_response = await tab.request.post(
            'https://api.example.com/login',
            json={'username': 'user', 'password': 'pass'}
        )
        
        # 检查服务器设置的 Cookie
        print("服务器设置的 Cookie：")
        for cookie in login_response.cookies:
            print(f"  {cookie['name']} = {cookie['value']}")
        
        # 后续请求自动包含 Cookie
        profile_response = await tab.request.get(
            'https://api.example.com/profile'
        )
        # 无需传递 Cookie - 浏览器会处理！
        
        print(f"配置文件数据: {profile_response.json()}")

asyncio.run(cookie_example())
```

## 与传统 Requests 的比较

| 功能 | `requests` 库 | 浏览器上下文请求 |
|---------|-------------------|-------------------------|
| **会话管理** | 手动 Cookie 处理 | 通过浏览器自动 |
| **身份验证** | 提取并传递令牌 | 从浏览器继承 |
| **CORS** | 不适用 | 浏览器执行策略 |
| **JavaScript** | 无法执行 | 完全访问浏览器上下文 |
| **Cookie Jar** | 单独的实例 | 浏览器的原生 Cookie 存储 |
| **标头** | 手动设置 | 浏览器自动添加标准标头 |
| **用例** | 服务器端脚本 | 浏览器自动化 |
| **设置** | 外部库 | 内置于 Pydoll |

## 另请参阅

- **[浏览器请求架构](../../deep-dive/browser-requests-architecture.md)** - 内部实现和架构
- **[网络监控](monitoring.md)** - 观察所有网络流量
- **[请求拦截](interception.md)** - 在发送前修改请求
- **[事件系统](../advanced/event-system.md)** - 对浏览器事件做出反应
- **[深入了解：网络功能](../../deep-dive/network-capabilities.md)** - 技术细节

浏览器上下文请求是混合自动化的游戏规则改变者。结合 UI 自动化的强大功能和直接 API 调用的速度，同时保持完美的会话连续性！


================================================
FILE: docs/zh/features/network/interception.md
================================================
# 请求拦截

请求拦截允许您实时拦截、修改、阻止或模拟 HTTP 请求和响应。这对于测试、性能优化、内容过滤和模拟各种网络条件至关重要。

!!! info "Network 域与 Fetch 域"
    **Network 域**用于被动监控（观察流量）。**Fetch 域**用于主动拦截（修改/阻止请求）。本指南专注于拦截。有关被动监控，请参阅[网络监控](monitoring.md)。

## 理解请求拦截

当您启用请求拦截时，Pydoll 会在匹配的请求发送到服务器之前（或接收响应之后）暂停它们。然后您有三个选项：

1. **继续**：让请求继续（可选择性地进行修改）
2. **阻止**：使请求失败并返回错误
3. **模拟**：使用自定义响应满足请求

```mermaid
sequenceDiagram
    participant Browser
    participant Pydoll
    participant Server
    
    Browser->>Pydoll: 发起请求
    Note over Pydoll: 请求已暂停
    Pydoll->>Pydoll: 执行回调
    
    alt 继续
        Pydoll->>Server: 转发请求
        Server-->>Browser: 响应
    else 阻止
        Pydoll-->>Browser: 错误响应
    else 模拟
        Pydoll-->>Browser: 自定义响应
    end
```

!!! warning "性能影响"
    请求拦截会为每个匹配的请求增加延迟。只拦截您需要的内容，完成后禁用以避免减慢页面加载速度。

## 启用请求拦截

在拦截请求之前，您必须启用 Fetch 域：

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def main():
    async with Chrome() as browser:
        tab = await browser.start()
        
        # 启用 fetch 事件（默认拦截所有请求）
        await tab.enable_fetch_events()
        
        await tab.go_to('https://example.com')
        
        # 完成后禁用
        await tab.disable_fetch_events()

asyncio.run(main())
```

### 选择性拦截

您可以按资源类型过滤要拦截的请求：

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def selective_interception():
    async with Chrome() as browser:
        tab = await browser.start()
        
        # 仅拦截图片
        await tab.enable_fetch_events(
            resource_type='Image'  # 或 'Stylesheet'、'Script' 等
        )
        
        await tab.go_to('https://example.com')
        await tab.disable_fetch_events()

asyncio.run(selective_interception())
```

!!! tip "资源类型"
    参见[资源类型参考](#resource-types-reference)部分以获取可拦截资源类型的完整列表。

## 拦截请求

使用 `RequestPaused` 事件来拦截请求：

```python
import asyncio
from pydoll.browser.chromium import Chrome
from pydoll.protocol.fetch.events import FetchEvent, RequestPausedEvent

async def basic_interception():
    async with Chrome() as browser:
        tab = await browser.start()
        
        # 带有类型提示的回调以获得 IDE 支持
        async def handle_request(event: RequestPausedEvent):
            request_id = event['params']['requestId']
            url = event['params']['request']['url']
            
            print(f"已拦截: {url}")
            
            # 继续请求而不进行修改
            await tab.continue_request(request_id)
        
        await tab.enable_fetch_events()
        await tab.on(FetchEvent.REQUEST_PAUSED, handle_request)
        
        await tab.go_to('https://example.com')
        await asyncio.sleep(3)
        
        await tab.disable_fetch_events()

asyncio.run(basic_interception())
```

!!! info "类型提示以获得更好的 IDE 支持"
    使用 `RequestPausedEvent` 等类型提示来获得事件键的自动完成。所有事件类型都在 `pydoll.protocol.fetch.events` 中。

!!! note "生产就绪的等待"
    本指南中的示例使用 `asyncio.sleep()` 以简化。在生产代码中，考虑使用更明确的等待策略，如等待特定元素或实现网络空闲检测。有关高级技术，请参阅[网络监控](monitoring.md)指南。

## 常见用例

### 1. 阻止资源以节省带宽

阻止图片、样式表或其他资源以加快页面加载速度：

```python
import asyncio
from pydoll.browser.chromium import Chrome
from pydoll.protocol.fetch.events import FetchEvent, RequestPausedEvent
from pydoll.protocol.network.types import ErrorReason

async def block_images():
    async with Chrome() as browser:
        tab = await browser.start()
        
        blocked_count = 0
        
        async def block_resource(event: RequestPausedEvent):
            nonlocal blocked_count
            request_id = event['params']['requestId']
            resource_type = event['params']['resourceType']
            url = event['params']['request']['url']
            
            # 阻止图片和样式表
            if resource_type in ['Image', 'Stylesheet']:
                blocked_count += 1
                print(f"🚫 已阻止 {resource_type}: {url[:60]}")
                await tab.fail_request(request_id, ErrorReason.BLOCKED_BY_CLIENT)
            else:
                # 继续其他请求
                await tab.continue_request(request_id)
        
        await tab.enable_fetch_events()
        await tab.on(FetchEvent.REQUEST_PAUSED, block_resource)
        
        await tab.go_to('https://example.com')
        await asyncio.sleep(3)
        
        print(f"\n📊 总共阻止: {blocked_count} 个资源")
        
        await tab.disable_fetch_events()

asyncio.run(block_images())
```

### 2. 修改请求头

在发送请求之前添加、修改或删除请求头：

```python
import asyncio
from pydoll.browser.chromium import Chrome
from pydoll.protocol.fetch.events import FetchEvent, RequestPausedEvent
from pydoll.protocol.fetch.types import HeaderEntry

async def modify_headers():
    async with Chrome() as browser:
        tab = await browser.start()
        
        async def add_custom_headers(event: RequestPausedEvent):
            request_id = event['params']['requestId']
            url = event['params']['request']['url']
            
            # 仅修改 API 请求
            if '/api/' in url:
                # 构建自定义请求头（使用 HeaderEntry 类型提示以获得 IDE 支持）
                headers: list[HeaderEntry] = [
                    {'name': 'X-Custom-Header', 'value': 'MyValue'},
                    {'name': 'Authorization', 'value': 'Bearer my-token-123'},
                ]
                
                print(f"✨ 已修改请求头: {url}")
                await tab.continue_request(request_id, headers=headers)
            else:
                await tab.continue_request(request_id)
        
        await tab.enable_fetch_events()
        await tab.on(FetchEvent.REQUEST_PAUSED, add_custom_headers)
        
        await tab.go_to('https://your-app.com')
        await asyncio.sleep(3)
        
        await tab.disable_fetch_events()

asyncio.run(modify_headers())
```

!!! tip "请求头类型提示"
    `HeaderEntry` 是来自 `pydoll.protocol.fetch.types` 的 `TypedDict`。将其用作类型提示可为您提供 `name` 和 `value` 键的 IDE 自动完成。您也可以使用普通字典而不使用类型提示。

!!! tip "请求头管理"
    当您提供自定义请求头时，它们会**替换**所有现有请求头。如果需要，请确保包含必要的请求头，如 `User-Agent`、`Accept` 等。

### 3. 模拟 API 响应

用自定义模拟数据替换真实的 API 响应：

```python
import asyncio
import json
import base64
from pydoll.browser.chromium import Chrome
from pydoll.protocol.fetch.events import FetchEvent, RequestPausedEvent
from pydoll.protocol.fetch.types import HeaderEntry

async def mock_api_responses():
    async with Chrome() as browser:
        tab = await browser.start()
        
        async def mock_response(event: RequestPausedEvent):
            request_id = event['params']['requestId']
            url = event['params']['request']['url']
            
            # 模拟特定的 API 端点
            if '/api/users' in url:
                # 创建模拟响应数据
                mock_data = {
                    'users': [
                        {'id': 1, 'name': 'Mock User 1'},
                        {'id': 2, 'name': 'Mock User 2'},
                    ],
                    'total': 2
                }
                
                # 转换为 JSON 并进行 base64 编码
                body_json = json.dumps(mock_data)
                body_base64 = base64.b64encode(body_json.encode()).decode()
                
                # 响应头
                headers: list[HeaderEntry] = [
                    {'name': 'Content-Type', 'value': 'application/json'},
                    {'name': 'Access-Control-Allow-Origin', 'value': '*'},
                ]
                
                print(f"🎭 已模拟响应: {url}")
                await tab.fulfill_request(
                    request_id=request_id,
                    response_code=200,
                    response_headers=headers,
                    body=body_base64,
                    response_phrase='OK'
                )
            else:
                # 正常继续其他请求
                await tab.continue_request(request_id)
        
        await tab.enable_fetch_events()
        await tab.on(FetchEvent.REQUEST_PAUSED, mock_response)
        
        await tab.go_to('https://your-app.com')
        await asyncio.sleep(3)
        
        await tab.disable_fetch_events()

asyncio.run(mock_api_responses())
```

!!! warning "需要 Base64 编码"
    `fulfill_request()` 中的 `body` 参数必须经过 base64 编码。使用 Python 的 `base64` 模块对响应数据进行编码。

### 4. 修改请求 URL

将请求重定向到不同的 URL：

```python
import asyncio
from pydoll.browser.chromium import Chrome
from pydoll.protocol.fetch.events import FetchEvent, RequestPausedEvent

async def redirect_requests():
    async with Chrome() as browser:
        tab = await browser.start()
        
        async def redirect_url(event: RequestPausedEvent):
            request_id = event['params']['requestId']
            original_url = event['params']['request']['url']
            
            # 将 CDN 请求重定向到本地服务器
            if 'cdn.example.com' in original_url:
                new_url = original_url.replace(
                    'cdn.example.com',
                    'localhost:8080'
                )
                print(f"🔀 已重定向: {original_url} → {new_url}")
                await tab.continue_request(request_id, url=new_url)
            else:
                await tab.continue_request(request_id)
        
        await tab.enable_fetch_events()
        await tab.on(FetchEvent.REQUEST_PAUSED, redirect_url)
        
        await tab.go_to('https://example.com')
        await asyncio.sleep(3)
        
        await tab.disable_fetch_events()

asyncio.run(redirect_requests())
```

### 5. 修改请求体

在发送之前修改 POST 数据：

```python
import asyncio
import base64
from pydoll.browser.chromium import Chrome
from pydoll.protocol.fetch.events import FetchEvent, RequestPausedEvent

async def modify_post_data():
    async with Chrome() as browser:
        tab = await browser.start()
        
        async def modify_body(event: RequestPausedEvent):
            request_id = event['params']['requestId']
            method = event['params']['request']['method']
            url = event['params']['request']['url']
            
            # 修改 POST 请求
            if method == 'POST' and '/api/submit' in url:
                # 创建新的 POST 数据
                new_data = '{"modified": true, "timestamp": 123456789}'
                post_data_base64 = base64.b64encode(new_data.encode()).decode()
                
                print(f"✏️  已修改 POST 数据: {url}")
                await tab.continue_request(
                    request_id,
                    post_data=post_data_base64
                )
            else:
                await tab.continue_request(request_id)
        
        await tab.enable_fetch_events()
        await tab.on(FetchEvent.REQUEST_PAUSED, modify_body)
        
        await tab.go_to('https://your-app.com/form')
        await asyncio.sleep(3)
        
        await tab.disable_fetch_events()

asyncio.run(modify_post_data())
```

### 6. 处理身份验证挑战

手动响应 HTTP 身份验证挑战（基本身份验证、摘要身份验证等）：

```python
import asyncio
from pydoll.browser.chromium import Chrome
from pydoll.protocol.fetch.events import FetchEvent, AuthRequiredEvent
from pydoll.protocol.fetch.types import AuthChallengeResponseType

async def handle_auth():
    async with Chrome() as browser:
        tab = await browser.start()
        
        async def respond_to_auth(event: AuthRequiredEvent):
            request_id = event['params']['requestId']
            auth_challenge = event['params']['authChallenge']
            
            print(f"🔐 来自以下来源的身份验证挑战: {auth_challenge['origin']}")
            print(f"   方案: {auth_challenge['scheme']}")
            print(f"   领域: {auth_challenge.get('realm', 'N/A')}")
            
            # 为身份验证挑战提供凭据
            await tab.continue_with_auth(
                request_id=request_id,
                auth_challenge_response=AuthChallengeResponseType.PROVIDE_CREDENTIALS,
                proxy_username='myuser',
                proxy_password='mypassword'
            )
        
        # 启用并处理身份验证
        await tab.enable_fetch_events(handle_auth=True)
        await tab.on(FetchEvent.AUTH_REQUIRED, respond_to_auth)
        
        await tab.go_to('https://httpbin.org/basic-auth/myuser/mypassword')
        await asyncio.sleep(3)
        
        await tab.disable_fetch_events()

asyncio.run(handle_auth())
```

!!! note "自动代理身份验证"
    **Pydoll 在您通过浏览器选项配置代理凭据时会自动处理代理身份验证**（407 需要代理身份验证）。此示例演示了身份验证挑战的**手动处理**，这对于以下情况很有用：
    
    - 来自服务器的 HTTP 基本/摘要身份验证（401 未经授权）
    - 自定义身份验证流程
    - 基于挑战的动态凭据选择
    - 测试身份验证失败场景
    
    对于标准代理使用，只需在浏览器选项中配置您的代理凭据 - 无需手动处理！

### 7. 模拟网络错误

测试您的应用程序如何处理网络故障：

```python
import asyncio
from pydoll.browser.chromium import Chrome
from pydoll.protocol.fetch.events import FetchEvent, RequestPausedEvent
from pydoll.protocol.network.types import ErrorReason

async def simulate_errors():
    async with Chrome() as browser:
        tab = await browser.start()
        
        request_count = 0
        
        async def fail_some_requests(event: RequestPausedEvent):
            nonlocal request_count
            request_id = event['params']['requestId']
            url = event['params']['request']['url']
            
            request_count += 1
            
            # 每三个请求失败一次
            if request_count % 3 == 0:
                print(f"❌ 模拟超时: {url[:60]}")
                await tab.fail_request(request_id, ErrorReason.TIMED_OUT)
            else:
                await tab.continue_request(request_id)
        
        await tab.enable_fetch_events()
        await tab.on(FetchEvent.REQUEST_PAUSED, fail_some_requests)
        
        await tab.go_to('https://example.com')
        await asyncio.sleep(3)
        
        await tab.disable_fetch_events()

asyncio.run(simulate_errors())
```

## 请求阶段

您可以在不同阶段拦截请求：

```python
import asyncio
from pydoll.browser.chromium import Chrome
from pydoll.protocol.fetch.types import RequestStage

async def intercept_responses():
    async with Chrome() as browser:
        tab = await browser.start()
        
        # 拦截响应而不是请求
        await tab.enable_fetch_events(request_stage=RequestStage.RESPONSE)
        
        # 现在您可以在响应到达页面之前修改它们
        await tab.go_to('https://example.com')
        await asyncio.sleep(3)
        
        await tab.disable_fetch_events()

asyncio.run(intercept_responses())
```

| 阶段 | 拦截时机 | 用例 |
|-------|------------------|-----------|
| `Request`（默认） | 请求发送之前 | 修改请求头、阻止请求、更改 URL |
| `Response` | 接收响应之后 | 修改响应体、更改状态码 |

!!! tip "响应拦截"
    在请求阶段拦截时，您可以在 `continue_request()` 中传入 `intercept_response=True`，以同时拦截该特定请求的响应。

## 资源类型参考

| 资源类型 | 描述 | 常见文件扩展名 |
|---------------|-------------|------------------------|
| `Document` | HTML 文档 | `.html` |
| `Stylesheet` | CSS 文件 | `.css` |
| `Image` | 图片资源 | `.jpg`、`.png`、`.gif`、`.webp`、`.svg` |
| `Media` | 音频/视频 | `.mp4`、`.webm`、`.mp3`、`.ogg` |
| `Font` | 网络字体 | `.woff`、`.woff2`、`.ttf`、`.otf` |
| `Script` | JavaScript | `.js` |
| `TextTrack` | 字幕 | `.vtt`、`.srt` |
| `XHR` | XMLHttpRequest | AJAX 请求 |
| `Fetch` | Fetch API | 现代 API 调用 |
| `EventSource` | 服务器发送事件 | 实时流 |
| `WebSocket` | WebSocket | 双向通信 |
| `Manifest` | Web 应用清单 | PWA 配置 |
| `Other` | 其他类型 | 杂项 |

## 错误原因参考

在 `fail_request()` 中使用这些来模拟不同的网络故障：

| 错误原因 | 描述 | 用例 |
|--------------|-------------|----------|
| `FAILED` | 通用失败 | 常规错误 |
| `ABORTED` | 请求中止 | 用户取消 |
| `TIMED_OUT` | 请求超时 | 网络超时 |
| `ACCESS_DENIED` | 访问被拒绝 | 权限错误 |
| `CONNECTION_CLOSED` | 连接关闭 | 服务器断开连接 |
| `CONNECTION_RESET` | 连接重置 | 网络重置 |
| `CONNECTION_REFUSED` | 连接被拒绝 | 服务器无法访问 |
| `NAME_NOT_RESOLVED` | DNS 失败 | 无效的主机名 |
| `INTERNET_DISCONNECTED` | 无互联网 | 离线模式 |
| `BLOCKED_BY_CLIENT` | 客户端阻止 | 广告拦截器模拟 |
| `BLOCKED_BY_RESPONSE` | 响应被阻止 | CORS/CSP 违规 |

## 最佳实践

### 1. 始终继续或使请求失败

```python
# 好：每个暂停的请求都得到处理
async def handle_request(event: RequestPausedEvent):
    request_id = event['params']['requestId']
    try:
        # 您的逻辑在这里
        await tab.continue_request(request_id)
    except Exception as e:
        # 出错时失败以防止挂起
        await tab.fail_request(request_id, ErrorReason.FAILED)

# 坏：如果回调引发异常，请求可能会挂起
async def handle_request(event: RequestPausedEvent):
    request_id = event['params']['requestId']
    # 如果引发异常，请求将永远挂起
    await tab.continue_request(request_id)
```

### 2. 使用选择性拦截

```python
# 好：仅拦截您需要的内容
await tab.enable_fetch_events(resource_type='Image')

# 坏：拦截所有内容，减慢所有请求
await tab.enable_fetch_events()
```

### 3. 完成后禁用

```python
# 好：完成后清理
await tab.enable_fetch_events()
# ... 执行工作 ...
await tab.disable_fetch_events()

# 坏：使拦截保持启用状态
await tab.enable_fetch_events()
# ... 执行工作 ...
# （从未禁用）
```

### 4. 优雅地处理错误

```python
# 好：包装在 try/except 中
async def safe_handler(event: RequestPausedEvent):
    request_id = event['params']['requestId']
    try:
        # 可能失败的复杂逻辑
        modified_url = transform_url(event['params']['request']['url'])
        await tab.continue_request(request_id, url=modified_url)
    except Exception as e:
        print(f"处理请求时出错: {e}")
        # 出错时继续而不进行修改
        await tab.continue_request(request_id)
```

## 完整示例：高级请求控制

这是一个结合多种拦截技术的完整示例：

```python
import asyncio
import base64
import json
from pydoll.browser.chromium import Chrome
from pydoll.protocol.fetch.events import FetchEvent, RequestPausedEvent
from pydoll.protocol.fetch.types import HeaderEntry
from pydoll.protocol.network.types import ErrorReason

async def advanced_interception():
    async with Chrome() as browser:
        tab = await browser.start()
        
        stats = {
            'blocked': 0,
            'mocked': 0,
            'modified': 0,
            'continued': 0
        }
        
        async def intelligent_handler(event: RequestPausedEvent):
            request_id = event['params']['requestId']
            url = event['params']['request']['url']
            resource_type = event['params']['resourceType']
            method = event['params']['request']['method']
            
            try:
                # 阻止广告和跟踪器
                if any(tracker in url for tracker in ['analytics', 'ads', 'tracking']):
                    stats['blocked'] += 1
                    print(f"🚫 已阻止跟踪器: {url[:50]}")
                    await tab.fail_request(request_id, ErrorReason.BLOCKED_BY_CLIENT)
                
                # 模拟 API 响应
                elif '/api/config' in url:
                    stats['mocked'] += 1
                    mock_config = {'feature_x': True, 'debug_mode': False}
                    body = base64.b64encode(json.dumps(mock_config).encode()).decode()
                    headers: list[HeaderEntry] = [
                        {'name': 'Content-Type', 'value': 'application/json'},
                    ]
                    print(f"🎭 已模拟配置 API")
                    await tab.fulfill_request(
                        request_id, 200, headers, body, 'OK'
                    )
                
                # 为 API 请求添加身份验证头
                elif '/api/' in url and method == 'GET':
                    stats['modified'] += 1
                    headers: list[HeaderEntry] = [
                        {'name': 'Authorization', 'value': 'Bearer token-123'},
                    ]
                    print(f"✨ 已添加身份验证: {url[:50]}")
                    await tab.continue_request(request_id, headers=headers)
                
                # 正常继续其他所有内容
                else:
                    stats['continued'] += 1
                    await tab.continue_request(request_id)
                    
            except Exception as e:
                print(f"⚠️  处理请求时出错: {e}")
                # 出错时始终继续以防止挂起
                await tab.continue_request(request_id)
        
        # 启用拦截
        await tab.enable_fetch_events()
        await tab.on(FetchEvent.REQUEST_PAUSED, intelligent_handler)
        
        # 导航
        await tab.go_to('https://example.com')
        await asyncio.sleep(5)
        
        # 打印统计信息
        print(f"\n📊 拦截统计:")
        print(f"   已阻止: {stats['blocked']}")
        print(f"   已模拟: {stats['mocked']}")
        print(f"   已修改: {stats['modified']}")
        print(f"   已继续: {stats['continued']}")
        print(f"   总计: {sum(stats.values())}")
        
        # 清理
        await tab.disable_fetch_events()

asyncio.run(advanced_interception())
```

## 另请参阅

- **[网络监控](monitoring.md)** - 被动网络流量观察
- **[CDP Fetch 域](../../deep-dive/network-capabilities.md#fetch-domain)** - 深入了解 Fetch 域
- **[事件系统](../advanced/event-system.md)** - 了解 Pydoll 的事件架构

请求拦截是用于测试、优化和模拟的强大工具。掌握这些技术以构建强大、高效的浏览器自动化脚本。


================================================
FILE: docs/zh/features/network/monitoring.md
================================================
# 网络监控

Pydoll 中的网络监控允许您在浏览器自动化期间观察和分析 HTTP 请求、响应和其他网络活动。这对于调试、性能分析、API 测试和了解 Web 应用程序如何与服务器通信至关重要。

!!! info "Network 与 Fetch 域"
    **Network 域**用于被动监控（观察流量）。**Fetch 域**用于主动拦截（修改请求/响应）。本指南重点介绍监控。有关请求拦截，请参阅[请求拦截](interception.md)。

## 启用网络事件

在监控网络活动之前，您必须启用 Network 域：

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def main():
    async with Chrome() as browser:
        tab = await browser.start()
        
        # 启用网络监控
        await tab.enable_network_events()
        
        # 现在导航
        await tab.go_to('https://api.github.com')
        
        # 完成后不要忘记禁用（可选但推荐）
        await tab.disable_network_events()

asyncio.run(main())
```

!!! warning "导航前启用"
    始终在导航**之前**启用网络事件以捕获所有请求。在启用之前发起的请求不会被捕获。

## 获取网络日志

启用网络事件后，Pydoll 会自动存储网络日志。您可以使用 `get_network_logs()` 检索它们：

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def analyze_requests():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.enable_network_events()
        
        # 导航到页面
        await tab.go_to('https://httpbin.org/json')
        
        # 等待页面完全加载
        await asyncio.sleep(2)
        
        # 获取所有网络日志
        logs = await tab.get_network_logs()
        
        print(f"捕获的总请求数: {len(logs)}")
        
        for log in logs:
            request = log['params']['request']
            print(f"→ {request['method']} {request['url']}")

asyncio.run(analyze_requests())
```

!!! note "生产就绪的等待"
    上面的示例为简单起见使用 `asyncio.sleep(2)`。在生产代码中，请考虑使用更明确的等待策略：
    
    - 等待特定元素出现
    - 使用[事件系统](../advanced/event-system.md)来检测何时加载所有资源
    - 实现网络空闲检测（参见实时网络监控部分）
    
    这确保您的自动化等待的时间正好合适，不多不少。

### 过滤网络日志

您可以按 URL 模式过滤日志：

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def filter_logs_example():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.enable_network_events()
        await tab.go_to('https://example.com')
        await asyncio.sleep(2)
        
        # 获取所有日志
        all_logs = await tab.get_network_logs()
        
        # 获取特定域的日志
        api_logs = await tab.get_network_logs(filter='api.example.com')
        
        # 获取特定端点的日志
        user_logs = await tab.get_network_logs(filter='/api/users')

asyncio.run(filter_logs_example())
```

## 理解网络事件结构

网络日志包含有关每个请求的详细信息。以下是结构：

### RequestWillBeSentEvent

此事件在即将发送请求时触发：

```python
{
    'method': 'Network.requestWillBeSent',
    'params': {
        'requestId': 'unique-request-id',
        'loaderId': 'loader-id',
        'documentURL': 'https://example.com',
        'request': {
            'url': 'https://api.example.com/data',
            'method': 'GET',  # 或 'POST'、'PUT'、'DELETE' 等
            'headers': {
                'User-Agent': 'Chrome/...',
                'Accept': 'application/json',
                ...
            },
            'postData': '...',  # 仅存在于 POST/PUT 请求
            'initialPriority': 'High',
            'referrerPolicy': 'strict-origin-when-cross-origin'
        },
        'timestamp': 1234567890.123,
        'wallTime': 1234567890.123,
        'initiator': {
            'type': 'script',  # 或 'parser'、'other'
            'stack': {...}  # 如果从脚本发起则有调用堆栈
        },
        'type': 'XHR',  # 资源类型：Document、Script、Image、XHR 等
        'frameId': 'frame-id',
        'hasUserGesture': False
    }
}
```

### 关键字段参考

| 字段 | 位置 | 类型 | 描述 |
|-------|----------|------|-------------|
| `requestId` | `params.requestId` | `str` | 此请求的唯一标识符 |
| `url` | `params.request.url` | `str` | 完整的请求 URL |
| `method` | `params.request.method` | `str` | HTTP 方法（GET、POST 等）|
| `headers` | `params.request.headers` | `dict` | 请求标头 |
| `postData` | `params.request.postData` | `str` | 请求体（POST/PUT）|
| `timestamp` | `params.timestamp` | `float` | 请求开始的单调时间 |
| `type` | `params.type` | `str` | 资源类型（Document、XHR、Image 等）|
| `initiator` | `params.initiator` | `dict` | 触发此请求的内容 |

## 获取响应体

要获取实际的响应内容，请使用 `get_network_response_body()`：

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def fetch_api_response():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.enable_network_events()
        
        # 导航到 API 端点
        await tab.go_to('https://httpbin.org/json')
        await asyncio.sleep(2)
        
        # 获取所有请求
        logs = await tab.get_network_logs()
        
        for log in logs:
            request_id = log['params']['requestId']
            url = log['params']['request']['url']
            
            # 仅获取 JSON 端点的响应
            if 'httpbin.org/json' in url:
                try:
                    # 获取响应体
                    response_body = await tab.get_network_response_body(request_id)
                    print(f"来自 {url} 的响应:")
                    print(response_body)
                except Exception as e:
                    print(f"无法获取响应体: {e}")

asyncio.run(fetch_api_response())
```

!!! warning "响应体可用性"
    响应体仅适用于已完成的请求。此外，某些响应类型（如图像或重定向）可能没有可访问的响应体。

## 实际用例

### 1. API 测试和验证

监控 API 调用以验证是否正在进行正确的请求：

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def validate_api_calls():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.enable_network_events()
        
        # 导航到您的应用
        await tab.go_to('https://your-app.com')
        
        # 触发某些进行 API 调用的操作
        button = await tab.find(id='load-data-button')
        await button.click()
        await asyncio.sleep(2)
        
        # 获取 API 日志
        api_logs = await tab.get_network_logs(filter='/api/')
        
        print(f"\n📊 API 调用摘要:")
        print(f"总 API 调用数: {len(api_logs)}")
        
        for log in api_logs:
            request = log['params']['request']
            method = request['method']
            url = request['url']
            
            # 检查是否存在正确的认证标头
            headers = request.get('headers', {})
            has_auth = 'Authorization' in headers or 'authorization' in headers
            
            print(f"\n{method} {url}")
            print(f"  ✓ 有授权: {has_auth}")
            
            # 如果适用，验证 POST 数据
            if method == 'POST' and 'postData' in request:
                print(f"  📤 正文: {request['postData'][:100]}...")

asyncio.run(validate_api_calls())
```

### 2. 性能分析

分析请求时序并识别慢速资源：

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def analyze_performance():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.enable_network_events()
        
        await tab.go_to('https://example.com')
        await asyncio.sleep(5)
        
        logs = await tab.get_network_logs()
        
        # 存储时序数据
        timings = []
        
        for log in logs:
            params = log['params']
            request_id = params['requestId']
            url = params['request']['url']
            resource_type = params.get('type', 'Other')
            
            timings.append({
                'url': url,
                'type': resource_type,
                'timestamp': params['timestamp']
            })
        
        # 按时间戳排序
        timings.sort(key=lambda x: x['timestamp'])
        
        print("\n⏱️  请求时间线:")
        start_time = timings[0]['timestamp'] if timings else 0
        
        for timing in timings[:20]:  # 显示前 20 个
            elapsed = (timing['timestamp'] - start_time) * 1000  # 转换为毫秒
            print(f"{elapsed:7.0f}ms | {timing['type']:12} | {timing['url'][:80]}")

asyncio.run(analyze_performance())
```

### 3. 检测外部资源

查找您的页面连接到的所有外部域：

```python
import asyncio
from urllib.parse import urlparse
from collections import Counter
from pydoll.browser.chromium import Chrome

async def analyze_domains():
    """Count the requests made to each domain while loading a page.

    Enables network events, loads the page, then tallies the ``netloc`` of
    every logged request URL and prints the ten most frequent domains.
    """
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.enable_network_events()
        
        await tab.go_to('https://news.ycombinator.com')
        await asyncio.sleep(5)
        
        logs = await tab.get_network_logs()
        
        # Number of requests seen per domain
        domains = Counter()
        
        for log in logs:
            url = log['params']['request']['url']
            try:
                domain = urlparse(url).netloc
            except ValueError:
                # urlparse raises ValueError for malformed URLs (e.g. a bad
                # IPv6 literal). Skip only those; a bare `except:` would also
                # swallow KeyboardInterrupt and task cancellation.
                continue
            if domain:
                domains[domain] += 1
        
        print("\n🌐 外部域:")
        for domain, count in domains.most_common(10):
            print(f"  {count:3} 个请求 | {domain}")

asyncio.run(analyze_domains())
```

### 4. 监控特定资源类型

跟踪特定类型的资源，如图像或脚本：

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def track_resource_types():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.enable_network_events()
        
        await tab.go_to('https://example.com')
        await asyncio.sleep(3)
        
        logs = await tab.get_network_logs()
        
        # 按资源类型分组
        by_type = {}
        
        for log in logs:
            params = log['params']
            resource_type = params.get('type', 'Other')
            url = params['request']['url']
            
            if resource_type not in by_type:
                by_type[resource_type] = []
            
            by_type[resource_type].append(url)
        
        print("\n📦 按类型分类的资源:")
        for rtype in sorted(by_type.keys()):
            urls = by_type[rtype]
            print(f"\n{rtype}: {len(urls)} 个资源")
            for url in urls[:3]:  # 显示前 3 个
                print(f"  • {url}")
            if len(urls) > 3:
                print(f"  ... 还有 {len(urls) - 3} 个")

asyncio.run(track_resource_types())
```

## 实时网络监控

对于实时监控，使用事件回调而不是轮询 `get_network_logs()`：

!!! info "理解事件"
    实时监控使用 Pydoll 的事件系统来响应发生的网络活动。要深入了解事件的工作原理，请参阅 **[事件系统](../advanced/event-system.md)**。

```python
import asyncio
from pydoll.browser.chromium import Chrome
from pydoll.protocol.network.events import (
    NetworkEvent,
    RequestWillBeSentEvent,
    ResponseReceivedEvent,
    LoadingFailedEvent
)

async def real_time_monitoring():
    async with Chrome() as browser:
        tab = await browser.start()
        
        # 统计
        stats = {
            'requests': 0,
            'responses': 0,
            'failed': 0
        }
        
        # 请求回调
        async def on_request(event: RequestWillBeSentEvent):
            stats['requests'] += 1
            url = event['params']['request']['url']
            method = event['params']['request']['method']
            print(f"→ {method:6} | {url}")
        
        # 响应回调
        async def on_response(event: ResponseReceivedEvent):
            stats['responses'] += 1
            response = event['params']['response']
            status = response['status']
            url = response['url']
            
            # 按状态着色
            if 200 <= status < 300:
                color = '\033[92m'  # 绿色
            elif 300 <= status < 400:
                color = '\033[93m'  # 黄色
            else:
                color = '\033[91m'  # 红色
            reset = '\033[0m'
            
            print(f"← {color}{status}{reset} | {url}")
        
        # 失败回调
        async def on_failed(event: LoadingFailedEvent):
            stats['failed'] += 1
            error = event['params']['errorText']
            print(f"✗ 失败: {error}")
        
        # 启用并注册回调
        await tab.enable_network_events()
        await tab.on(NetworkEvent.REQUEST_WILL_BE_SENT, on_request)
        await tab.on(NetworkEvent.RESPONSE_RECEIVED, on_response)
        await tab.on(NetworkEvent.LOADING_FAILED, on_failed)
        
        # 导航
        await tab.go_to('https://example.com')
        await asyncio.sleep(5)
        
        print(f"\n📊 摘要:")
        print(f"  请求: {stats['requests']}")
        print(f"  响应: {stats['responses']}")
        print(f"  失败: {stats['failed']}")

asyncio.run(real_time_monitoring())
```

## 资源类型参考

Pydoll 捕获以下资源类型：

| 类型 | 描述 | 示例 |
|------|-------------|----------|
| `Document` | 主 HTML 文档 | 页面加载、iframe 源 |
| `Stylesheet` | CSS 文件 | 外部 .css、内联样式 |
| `Image` | 图像资源 | .jpg、.png、.gif、.webp、.svg |
| `Media` | 音频/视频文件 | .mp4、.webm、.mp3、.ogg |
| `Font` | Web 字体 | .woff、.woff2、.ttf、.otf |
| `Script` | JavaScript 文件 | .js 文件、内联脚本 |
| `TextTrack` | 字幕文件 | .vtt、.srt |
| `XHR` | XMLHttpRequest | AJAX 请求、旧版 API 调用 |
| `Fetch` | Fetch API 请求 | 现代 API 调用 |
| `EventSource` | 服务器发送事件 | 实时流 |
| `WebSocket` | WebSocket 连接 | 双向通信 |
| `Manifest` | Web 应用清单 | PWA 配置 |
| `Other` | 其他资源类型 | 杂项 |

## 高级：提取响应时序

网络事件包括详细的时序信息：

```python
import asyncio
from pydoll.browser.chromium import Chrome
from pydoll.protocol.network.events import NetworkEvent, ResponseReceivedEvent

async def analyze_timing():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.enable_network_events()
        
        # 自定义回调以捕获时序
        timing_data = []
        
        async def on_response(event: ResponseReceivedEvent):
            response = event['params']['response']
            timing = response.get('timing')
            
            if timing:
                # 计算不同阶段
                dns_time = timing.get('dnsEnd', 0) - timing.get('dnsStart', 0)
                connect_time = timing.get('connectEnd', 0) - timing.get('connectStart', 0)
                ssl_time = timing.get('sslEnd', 0) - timing.get('sslStart', 0)
                send_time = timing.get('sendEnd', 0) - timing.get('sendStart', 0)
                wait_time = timing.get('receiveHeadersStart', 0) - timing.get('sendEnd', 0)
                receive_time = timing.get('receiveHeadersEnd', 0) - timing.get('receiveHeadersStart', 0)
                
                timing_data.append({
                    'url': response['url'][:50],
                    'dns': dns_time if dns_time > 0 else 0,
                    'connect': connect_time if connect_time > 0 else 0,
                    'ssl': ssl_time if ssl_time > 0 else 0,
                    'send': send_time,
                    'wait': wait_time,
                    'receive': receive_time,
                    'total': receive_time + wait_time + send_time
                })
        
        await tab.on(NetworkEvent.RESPONSE_RECEIVED, on_response)
        await tab.go_to('https://github.com')
        await asyncio.sleep(5)
        
        # 打印时序分解
        print("\n⏱️  请求时序分解（毫秒）:")
        print(f"{'URL':<50} | {'DNS':>6} | {'连接':>8} | {'SSL':>6} | {'发送':>6} | {'等待':>6} | {'接收':>8} | {'总计':>7}")
        print("-" * 120)
        
        for data in sorted(timing_data, key=lambda x: x['total'], reverse=True)[:10]:
            print(f"{data['url']:<50} | {data['dns']:6.1f} | {data['connect']:8.1f} | {data['ssl']:6.1f} | "
                  f"{data['send']:6.1f} | {data['wait']:6.1f} | {data['receive']:8.1f} | {data['total']:7.1f}")

asyncio.run(analyze_timing())
```

## 时序字段说明

| 阶段 | 字段 | 描述 |
|-------|--------|-------------|
| **DNS** | `dnsStart` → `dnsEnd` | DNS 查找时间 |
| **连接** | `connectStart` → `connectEnd` | TCP 连接建立 |
| **SSL** | `sslStart` → `sslEnd` | SSL/TLS 握手 |
| **发送** | `sendStart` → `sendEnd` | 发送请求的时间 |
| **等待** | `sendEnd` → `receiveHeadersStart` | 等待服务器响应（TTFB）|
| **接收** | `receiveHeadersStart` → `receiveHeadersEnd` | 接收响应标头的时间 |

!!! tip "首字节时间（TTFB）"
    TTFB 是"等待"阶段 - 发送请求和接收响应的第一个字节之间的时间。这对于性能分析至关重要。

## 最佳实践

### 1. 仅在需要时启用网络事件

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def best_practice_enable():
    async with Chrome() as browser:
        tab = await browser.start()
        
        # ✅ 好：导航前启用，之后禁用
        await tab.enable_network_events()
        await tab.go_to('https://example.com')
        await asyncio.sleep(2)
        logs = await tab.get_network_logs()
        await tab.disable_network_events()
        
        # ❌ 不好：在整个会话期间保持启用
        # await tab.enable_network_events()
        # ... 长时间的自动化会话 ...
```

### 2. 过滤日志以减少内存使用

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def best_practice_filter():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.enable_network_events()
        await tab.go_to('https://example.com')
        await asyncio.sleep(2)
        
        # ✅ 好：过滤特定请求
        api_logs = await tab.get_network_logs(filter='/api/')
        
        # ❌ 不好：当您只需要特定日志时获取所有日志
        all_logs = await tab.get_network_logs()
        filtered = [log for log in all_logs if '/api/' in log['params']['request']['url']]
```

### 3. 安全地处理缺失字段

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def best_practice_safe_access():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.enable_network_events()
        await tab.go_to('https://example.com')
        await asyncio.sleep(2)
        
        logs = await tab.get_network_logs()
        
        # ✅ 好：使用 .get() 安全访问
        for log in logs:
            params = log.get('params', {})
            request = params.get('request', {})
            url = request.get('url', 'Unknown')
            post_data = request.get('postData')  # 可能为 None
            
            if post_data:
                print(f"POST 数据: {post_data}")
        
        # ❌ 不好：直接访问可能引发 KeyError
        # url = log['params']['request']['url']
        # post_data = log['params']['request']['postData']  # 可能不存在！
```

### 4. 对实时需求使用事件回调

```python
import asyncio
from pydoll.protocol.network.events import NetworkEvent, RequestWillBeSentEvent

# ✅ 好：使用回调进行实时监控
async def on_request(event: RequestWillBeSentEvent):
    print(f"新请求: {event['params']['request']['url']}")

await tab.on(NetworkEvent.REQUEST_WILL_BE_SENT, on_request)

# ❌ 不好：重复轮询日志（效率低）
while True:
    logs = await tab.get_network_logs()
    # 处理日志...
    await asyncio.sleep(0.5)  # 浪费！
```

## 另请参阅

- **[CDP Network 域](../../deep-dive/network-capabilities.md)** - 深入了解网络功能
- **[事件系统](../advanced/event-system.md)** - 了解 Pydoll 的事件架构
- **[请求拦截](interception.md)** - 修改请求和响应


================================================
FILE: docs/zh/features/network/network-recording.md
================================================
# HAR 网络录制

捕获浏览器会话期间的所有网络活动，并导出为标准 HAR (HTTP Archive) 1.2 文件。非常适合调试、性能分析和测试固件。

!!! tip "像专家一样调试"
    HAR 文件是录制网络流量的行业标准。您可以将它们直接导入 Chrome DevTools、Charles Proxy 或任何 HAR 查看器进行详细分析。

## 为什么使用 HAR 录制？

| 使用场景 | 优势 |
|---------|------|
| 调试失败的请求 | 查看确切的 headers、时序和响应体 |
| 性能分析 | 识别慢速请求和瓶颈 |
| API 文档 | 捕获真实的请求/响应对 |
| 测试固件 | 录制真实流量用于测试模拟 |

## 快速开始

录制页面导航期间的所有网络流量：

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def record_traffic():
    async with Chrome() as browser:
        tab = await browser.start()

        async with tab.request.record() as capture:
            await tab.go_to('https://example.com')

        # 保存捕获为 HAR 文件
        capture.save('flow.har')
        print(f'捕获了 {len(capture.entries)} 个请求')

asyncio.run(record_traffic())
```

## 录制 API

### `tab.request.record(resource_types=None)`

上下文管理器，捕获标签页上的网络流量。

| 参数 | 类型 | 描述 |
|------|------|------|
| `resource_types` | `list[ResourceType] \| None` | 可选的资源类型列表。当为 `None`（默认）时，捕获所有类型。 |

```python
async with tab.request.record() as capture:
    # 此块内的所有网络活动都会被捕获
    await tab.go_to('https://example.com')
    await (await tab.find(id='search')).type_text('pydoll')
    await (await tab.find(type='submit')).click()
```

`capture` 对象（`HarCapture`）提供：

| 属性/方法 | 描述 |
|----------|------|
| `capture.entries` | 捕获的 HAR 条目列表 |
| `capture.to_dict()` | 完整的 HAR 1.2 字典（用于自定义处理） |
| `capture.save(path)` | 保存为 HAR JSON 文件 |

### 按资源类型过滤

仅录制特定资源类型而非所有流量：

```python
from pydoll.protocol.network.types import ResourceType

# 仅录制 fetch/XHR 请求（跳过文档、图像等）
async with tab.request.record(
    resource_types=[ResourceType.FETCH, ResourceType.XHR]
) as capture:
    await tab.go_to('https://example.com')

# 仅录制文档和样式表请求
async with tab.request.record(
    resource_types=[ResourceType.DOCUMENT, ResourceType.STYLESHEET]
) as capture:
    await tab.go_to('https://example.com')
```

可用的 `ResourceType` 值：

| 值 | 描述 |
|----|------|
| `ResourceType.DOCUMENT` | HTML 文档 |
| `ResourceType.STYLESHEET` | CSS 样式表 |
| `ResourceType.SCRIPT` | JavaScript 文件 |
| `ResourceType.IMAGE` | 图像 |
| `ResourceType.FONT` | Web 字体 |
| `ResourceType.MEDIA` | 音频/视频 |
| `ResourceType.FETCH` | Fetch API 请求 |
| `ResourceType.XHR` | XMLHttpRequest 调用 |
| `ResourceType.WEB_SOCKET` | WebSocket 连接 |
| `ResourceType.OTHER` | 其他资源类型 |

### 保存捕获

```python
# 保存为 HAR 文件（可以在 Chrome DevTools 中打开）
capture.save('flow.har')

# 保存到嵌套目录（自动创建）
capture.save('recordings/session1/flow.har')

# 访问原始 HAR 字典进行自定义处理
har_dict = capture.to_dict()
print(har_dict['log']['version'])  # "1.2"
```

### 检查条目

```python
async with tab.request.record() as capture:
    await tab.go_to('https://example.com')

for entry in capture.entries:
    req = entry['request']
    resp = entry['response']
    print(f"{req['method']} {req['url']} -> {resp['status']}")
```

## 高级用法

### 过滤捕获的条目

```python
async with tab.request.record() as capture:
    await tab.go_to('https://example.com')

# 仅过滤 API 调用
api_entries = [
    e for e in capture.entries
    if '/api/' in e['request']['url']
]

# 仅过滤失败的请求
failed = [
    e for e in capture.entries
    if e['response']['status'] >= 400
]
```

### 自定义 HAR 处理

```python
har = capture.to_dict()

# 按类型统计请求
from collections import Counter
types = Counter(
    e.get('_resourceType', 'Other')
    for e in har['log']['entries']
)
print(types)  # Counter({'Document': 1, 'Script': 5, 'Stylesheet': 3, ...})
```

## HAR 文件格式

导出的 HAR 遵循 [HAR 1.2 规范](http://www.softwareishard.com/blog/har-12-spec/)。每个条目包含：

- **Request**：方法、URL、headers、查询参数、POST 数据
- **Response**：状态、headers、响应体内容（文本或 base64 编码）
- **Timings**：DNS、连接、SSL、发送、等待（TTFB）、接收
- **Metadata**：服务器 IP、连接 ID、资源类型

!!! note "响应体"
    响应体在每个请求完成后自动捕获。二进制内容（图像、字体等）存储为 base64 编码的字符串。


================================================
FILE: docs/zh/index.md
================================================
<p align="center">
    <img src="../resources/images/logo.png" alt="Pydoll Logo" /> <br><br>
</p>

<p align="center">
    <a href="https://codecov.io/gh/autoscrape-labs/pydoll">
        <img src="https://codecov.io/gh/autoscrape-labs/pydoll/graph/badge.svg?token=40I938OGM9"/> 
    </a>
    <img src="https://github.com/thalissonvs/pydoll/actions/workflows/tests.yml/badge.svg" alt="Tests">
    <img src="https://github.com/thalissonvs/pydoll/actions/workflows/ruff-ci.yml/badge.svg" alt="Ruff CI">
    <img src="https://github.com/thalissonvs/pydoll/actions/workflows/release.yml/badge.svg" alt="Release">
    <img src="https://github.com/thalissonvs/pydoll/actions/workflows/mypy.yml/badge.svg" alt="MyPy CI">
</p>


# 欢迎使用Pydoll

欢迎来到 Pydoll 的世界～这是为 Python 量身打造的新一代浏览器自动化神器！

## 什么是Pydoll?

Pydoll采用全新的浏览器自动化技术——完全无需 WebDriver！与其他依赖外部驱动的解决方案不同，Pydoll 通过浏览器原生 DevTools 协议直接通信，提供零依赖的自动化体验，并自带原生异步高性能支持。

无论是数据采集、[Web应用测试](https://www.lambdatest.com/web-testing)，还是自动化重复任务，Pydoll 都能通过其直观的 API 和强大功能，让这些工作变得异常简单。  

## 安装

创建并激活一个 [虚拟环境](https://docs.python.org/3/tutorial/venv.html)，然后安装Pydoll:

<div class="termy">
```bash
$ pip install pydoll-python

---> 100%
```
</div>

你可以直接在GitHub上找到最新的开发版本:

```bash
$ pip install git+https://github.com/autoscrape-labs/pydoll.git
```

## 为何选择Pydoll?

- **智能验证码绕过**: 内置Cloudflare Turnstile与reCAPTCHA v3验证码的自动破解能力，无需依赖外部服务、API密钥或复杂配置。即使遭遇防护系统，您的自动化流程仍可畅行无阻。
- **模拟真人交互**: 通过先进算法模拟真实人类行为特征——从随机操作间隔，到鼠标移动轨迹、页面滚动模式乃至输入速度，皆可骗过最严苛的反爬虫系统。
- **极简哲学**: 无需浪费太多时间在配置驱动或解决兼容问题上。Pydoll开箱即用。
- **原生异步性能**: 基于`asyncio`库深度设计, Pydoll不仅支持异步操作——更为高并发而生，可同时进行多个受防护站点的数据采集。
- **强大的网络监控**: 轻松实现请求拦截、流量篡改与响应分析，完整掌控网络通信链路，轻松突破层层防护体系。
- **事件驱动架构**: 实时响应页面事件、网络请求与用户交互，构建能动态适应防护系统的智能自动化流。
- **直观的元素定位**: 使用符合人类直觉的定位方法 `find()` 和 `query()` ，面对动态加载的防护内容，定位依然精准。
- **强类型安全**: 完备的类型系统为复杂自动化场景提供更优IDE支持和更好地预防运行时报错。


准备好开始了吗？以下内容将带您从安装配置、基础使用到高级功能，全面掌握 Pydoll 的最佳实践。

让我们以最优雅的方式，开启您的网页自动化之旅！🚀

## 简单的例子上手

让我们从一个实际案例开始。以下脚本将打开 Pydoll 的 GitHub 仓库并star：  

```python
import asyncio
from pydoll.browser.chromium import Chrome

async def main():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://github.com/autoscrape-labs/pydoll')
        
        star_button = await tab.find(
            tag_name='button',
            timeout=5,
            raise_exc=False
        )
        if not star_button:
            print("Ops! The button was not found.")
            return

        await star_button.click()
        await asyncio.sleep(3)

asyncio.run(main())
```

此示例演示了如何导航到网站、等待元素出现并与之交互。您可以使用这样的模式来自动执行许多不同的 Web 任务。

??? note "或者使用不带上下文管理器的..."
    如果你不想要使用上下文管理器模式，你可以手动管理浏览器实例：
    
    ```python
    import asyncio
    from pydoll.browser.chromium import Chrome
    
    async def main():
        browser = Chrome()
        tab = await browser.start()
        await tab.go_to('https://github.com/autoscrape-labs/pydoll')
        
        star_button = await tab.find(
            tag_name='button',
            timeout=5,
            raise_exc=False
        )
        if not star_button:
            print("Ops! The button was not found.")
            return

        await star_button.click()
        await asyncio.sleep(3)
        await browser.stop()
    
    asyncio.run(main())
    ```
    
    请注意，不使用上下文管理器时，您需要显式调用 `browser.stop()` 来释放资源。

## 补充例子: 自定义浏览器配置

对于更高级的使用场景，Pydoll 允许您使用 `ChromiumOptions` 类自定义浏览器配置。此功能在您需要执行以下操作时非常有用：

- 在无头模式下运行（无可见浏览器窗口）
- 指定自定义浏览器可执行文件路径
- 配置代理、用户代理或其他浏览器设置
- 设置窗口尺寸或启动参数

以下示例展示了如何使用 Chrome 的自定义选项：

```python hl_lines="8-12 30-32 34-38"
import asyncio
import os
from pydoll.browser.chromium import Chrome
from pydoll.browser.options import ChromiumOptions

async def main():
    options = ChromiumOptions()
    options.binary_location = '/usr/bin/google-chrome-stable'
    options.add_argument('--headless=new')
    options.add_argument('--start-maximized')
    options.add_argument('--disable-notifications')
    
    async with Chrome(options=options) as browser:
        tab = await browser.start()
        await tab.go_to('https://github.com/autoscrape-labs/pydoll')
        
        star_button = await tab.find(
            tag_name='button',
            timeout=5,
            raise_exc=False
        )
        if not star_button:
            print("Ops! The button was not found.")
            return

        await star_button.click()
        await asyncio.sleep(3)

        screenshot_path = os.path.join(os.getcwd(), 'pydoll_repo.png')
        await tab.take_screenshot(path=screenshot_path)
        print(f"Screenshot saved to: {screenshot_path}")

        base64_screenshot = await tab.take_screenshot(as_base64=True)

        repo_description_element = await tab.find(
            class_name='f4.my-3'
        )
        repo_description = await repo_description_element.text
        print(f"Repository description: {repo_description}")

if __name__ == "__main__":
    asyncio.run(main())
```


此扩展示例演示了：

1. 创建和配置浏览器选项
2. 设置自定义Chrome可执行程序路径
3. 启用无头模式以实现无界面运行
4. 设置其他浏览器命令行flags
5. 屏幕截图（在无头模式下尤其有用）

??? info "关于Chrome配置选项"
    `options.add_argument()` 方法允许您传递任何 Chromium 命令行参数来自定义浏览器行为。有数百个可用选项可用于控制从网络到渲染行为的所有内容。

    常用Chrome配置选项
    
    ```python
    # 性能与行为选项
    options.add_argument('--headless=new')         # 以无头模式运行Chrome
    options.add_argument('--disable-gpu')          # 禁用GPU加速
    options.add_argument('--no-sandbox')           # 禁用沙盒模式（需谨慎使用）
    options.add_argument('--disable-dev-shm-usage') # 解决资源限制问题
    
    # 界面显示选项
    options.add_argument('--start-maximized')      # 以最大化窗口启动
    options.add_argument('--window-size=1920,1080') # 设置特定窗口尺寸
    options.add_argument('--hide-scrollbars')      # 隐藏滚动条
    
    # 网络选项
    options.add_argument('--proxy-server=socks5://127.0.0.1:9050') # 使用代理服务器
    options.add_argument('--disable-extensions')   # 禁用扩展程序
    options.add_argument('--disable-notifications') # 禁用通知
    
    # 隐私与安全
    options.add_argument('--incognito')            # 以隐身模式运行
    options.add_argument('--disable-infobars')     # 禁用信息栏
    ```
    
    完整参考指南
    
    如需获取所有可用的Chrome命令行参数完整列表，请参考以下资源：
    
    - [Chromium Command Line Switches](https://peter.sh/experiments/chromium-command-line-switches/) - 完整的参考列表
    - [Chrome Flags](chrome://flags) - 在 Chrome 浏览器地址栏中输入此地址即可查看实验性功能
    - [Chromium Source Code Flags](https://source.chromium.org/chromium/chromium/src/+/main:chrome/common/chrome_switches.cc) - 直接查阅源代码中的参数定义
    
    请注意某些选项在不同Chrome版本中可能有差异表现，建议在升级Chrome时测试您的配置。

通过这些配置，您可以在各种环境中运行 Pydoll，包括 CI/CD 流水线、无显示器的服务器或 Docker 容器。

继续阅读文档，探索 Pydoll 在处理验证码、处理多个标签页、与元素交互等方面的强大功能。

## 极简依赖

Pydoll 的优势之一是其轻量级的占用空间。与其他需要大量依赖项的浏览器自动化工具不同，Pydoll 在保留了强大的功能的同时力求精简。  

### 核心依赖

Pydoll仅依赖少量的核心库：  

```
python = "^3.10"
websockets = "^13.1"
aiohttp = "^3.9.5"
aiofiles = "^23.2.1"
bs4 = "^0.0.2"
```

这种极简依赖策略带来五大核心优势：  

- **⚡闪电安装** - 无需解析复杂的依赖树
- **🧩 零冲突** - 与其他包发生版本冲突的概率极低
- **📦 轻量化** - 更低的磁盘空间占用
- **🔒 更好的安全** - 更小的攻击面和供应链漏洞
- **🔄 方便升级** - 维护更简单，破坏性变更更少

更少的依赖项带来了更高的运行可靠性以及更强的性能表现。

## 顶级赞助商

<a href="https://substack.thewebscraping.club/p/pydoll-webdriver-scraping?utm_source=github&utm_medium=repo&utm_campaign=pydoll" target="_blank" rel="noopener nofollow sponsored">
  <img src="../resources/images/banner-the-webscraping-club.png" alt="The Web Scraping Club" />
</a>

<sub>在 <b><a href="https://substack.thewebscraping.club/p/pydoll-webdriver-scraping?utm_source=github&utm_medium=repo&utm_campaign=pydoll" target="_blank" rel="noopener nofollow sponsored">The Web Scraping Club</a></b> 上阅读 Pydoll 的完整评测，这是排名第一的网页抓取专属通讯。</sub>

## 赞助商

赞助商的支持对于项目的持续发展至关重要。每一份合作都能帮助我们覆盖基础成本、推动新功能迭代，并保证项目长期维护与更新。非常感谢所有相信并支持 Pydoll 的伙伴！

<div class="sponsors-grid">
  <a href="https://www.thordata.com/?ls=github&lk=pydoll" target="_blank" rel="noopener nofollow sponsored">
    <img src="../resources/images/Thordata-logo.png" alt="Thordata" />
  </a>
  <a href="https://www.testmuai.com/?utm_medium=sponsor&utm_source=pydoll" target="_blank" rel="noopener nofollow sponsored">
    <img src="../resources/images/logo-lamda-test.svg" alt="LambdaTest" />
  </a>
  <a href="https://dashboard.capsolver.com/passport/register?inviteCode=WPhTbOsbXEpc" target="_blank" rel="noopener nofollow sponsored">
    <img src="../resources/images/capsolver-logo.png" alt="CapSolver" />
  </a>
</div>

<p>
  <a href="https://github.com/sponsors/thalissonvs" target="_blank" rel="noopener">成为赞助商</a>
</p>

## 许可证

Pydoll 遵循 MIT 许可证（完整文本见 LICENSE 文件），主要授权条款包括：  

1. 权利授予  
   - 永久、全球范围、免版税的使用权  
   - 允许修改创作衍生作品  
   - 可再授权给第三方  

2. 唯一责任限制  
   - 所有副本或实质性部分必须保留原版权声明和许可声明  
   - 不提供任何明示或默示担保  

??? info "查看完整的 MIT 许可证文本"
    ```
    MIT License
    
    Copyright (c) 2023 Pydoll Contributors
    
    Permission is hereby granted, free of charge, to any person obtaining a copy
    of this software and associated documentation files (the "Software"), to deal
    in the Software without restriction, including without limitation the rights
    to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
    copies of the Software, and to permit persons to whom the Software is
    furnished to do so, subject to the following conditions:
    
    The above copyright notice and this permission notice shall be included in all
    copies or substantial portions of the Software.
    
    THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
    IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
    FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
    AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
    LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
    OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
    SOFTWARE.
    ```


================================================
FILE: examples/cloudflare_bypass.py
================================================
import asyncio

from pydoll.browser import Chrome


async def example_with_context_manager():
    """
    Example using the context manager approach to handle Cloudflare captcha.

    Navigation happens inside the ``async with`` block; the block waits for
    the captcha to be processed before execution continues past it.

    The browser is stopped in a ``finally`` clause so that an error raised
    during navigation or captcha handling does not leave it running.
    """
    browser = Chrome()
    await browser.start()
    try:
        page = await browser.get_page()

        print('Using context manager approach...')
        async with page.expect_and_bypass_cloudflare_captcha():
            await page.go_to('https://www.planetminecraft.com/account/sign_in/')
            print('Page loaded, waiting for captcha to be handled...')

        print('Captcha handling completed, now we can continue...')
        # Short pause before shutting the browser down.
        await asyncio.sleep(3)
    finally:
        # Always release the browser, even when one of the steps above failed.
        await browser.stop()


async def example_with_enable_disable():
    """
    Example using the enable/disable approach to handle Cloudflare captcha.

    This enables the auto-solving and continues execution immediately.
    The captcha will be solved in the background when it appears.

    The browser is stopped in a ``finally`` clause so that an error raised
    while navigating or toggling auto-solve does not leave it running.
    """
    browser = Chrome()
    await browser.start()
    try:
        page = await browser.get_page()

        print('Using enable/disable approach...')

        # Enable automatic captcha solving before navigating
        await page.enable_auto_solve_cloudflare_captcha()

        # Navigate to the page - captcha will be handled automatically
        await page.go_to('https://www.planetminecraft.com/account/sign_in/')
        print('Page loaded, captcha will be handled in the background...')

        # Continue with other operations immediately
        # The captcha will be solved in the background when it appears
        await asyncio.sleep(5)

        # Disable auto-solving when no longer needed
        await page.disable_auto_solve_cloudflare_captcha()
        print('Auto-solving disabled')
    finally:
        # Always release the browser, even when one of the steps above failed.
        await browser.stop()


async def main():
    """Entry point: run the context-manager example by default."""
    # To try the background auto-solve variant instead, await
    # example_with_enable_disable() here in place of the call below.
    await example_with_context_manager()


if __name__ == '__main__':
    asyncio.run(main())


================================================
FILE: mkdocs.yml
================================================
site_name: Pydoll - Async Web Automation Library
site_url: https://pydoll.tech/docs/
repo_url: https://github.com/autoscrape-labs/pydoll
repo_name: autoscrape-labs/pydoll
use_directory_urls: true
docs_dir: docs

# Navigation configuration
nav:
  - Pydoll: index.md
  - Features:
      - Overview: features/index.md
      - Core Concepts: features/core-concepts.md
      - Element Finding: features/element-finding.md
      - Automation:
          - Human-Like Interactions: features/automation/human-interactions.md
          - Keyboard Control: features/automation/keyboard-control.md
          - Mouse Control: features/automation/mouse-control.md
          - File Operations: features/automation/file-operations.md
          - IFrames: features/automation/iframes.md
          - Screenshots & PDF: features/automation/screenshots-and-pdfs.md
      - Network:
          - Network Monitoring: features/network/monitoring.md
          - Request Interception: features/network/interception.md
          - Browser-Context HTTP Requests: features/network/http-requests.md
          - HAR Network Recording: features/network/network-recording.md
      - Browser Management:
          - Multi-Tab Management: features/browser-management/tabs.md
          - Browser Contexts: features/browser-management/contexts.md
          - Cookies & Sessions: features/browser-management/cookies-sessions.md
      - Configuration:
          - Browser Options: features/configuration/browser-options.md
          - Browser Preferences: features/configuration/browser-preferences.md
          - Proxy Configuration: features/configuration/proxy.md
      - Advanced:
          - Behavioral Captcha Bypass: features/advanced/behavioral-captcha-bypass.md
          - Event System: features/advanced/event-system.md
          - Remote Connections: features/advanced/remote-connections.md
          - Retry Decorator: features/advanced/decorators.md
  - Deep Dive:
      - Overview: deep-dive/index.md
      - Core Fundamentals:
          - Overview: deep-dive/fundamentals/index.md
          - Chrome DevTools Protocol: deep-dive/fundamentals/cdp.md
          - Connection Layer: deep-dive/fundamentals/connection-layer.md
          - Python Type System: deep-dive/fundamentals/typing-system.md
          - Iframes & Contexts: deep-dive/fundamentals/iframes-and-contexts.md
      - Internal Architecture:
          - Overview: deep-dive/architecture/index.md
          - Browser Domain: deep-dive/architecture/browser-domain.md
          - Tab Domain: deep-dive/architecture/tab-domain.md
          - WebElement Domain: deep-dive/architecture/webelement-domain.md
          - FindElements Mixin: deep-dive/architecture/find-elements-mixin.md
          - Event Architecture: deep-dive/architecture/event-architecture.md
          - Browser Requests Architecture: deep-dive/architecture/browser-requests-architecture.md
          - Shadow DOM: deep-dive/architecture/shadow-dom.md
      - Network & Security:
          - Overview: deep-dive/network/index.md
          - Network Fundamentals: deep-dive/network/network-fundamentals.md
          - HTTP/HTTPS Proxies: deep-dive/network/http-proxies.md
          - SOCKS Proxies: deep-dive/network/socks-proxies.md
          - Proxy Detection: deep-dive/network/proxy-detection.md
          - Building Proxy Servers: deep-dive/network/build-proxy.md
          - Legal & Ethical: deep-dive/network/proxy-legal.md
      - Fingerprinting:
          - Overview: deep-dive/fingerprinting/index.md
          - Network Fingerprinting: deep-dive/fingerprinting/network-fingerprinting.md
          - Browser Fingerprinting: deep-dive/fingerprinting/browser-fingerprinting.md
          - Behavioral Fingerprinting: deep-dive/fingerprinting/behavioral-fingerprinting.md
          - Evasion Techniques: deep-dive/fingerprinting/evasion-techniques.md
      - Practical Guides:
          - Overview: deep-dive/guides/index.md
          - CSS Selectors vs XPath: deep-dive/guides/selectors-guide.md
  - API Reference:
      - Overview: api/index.md
      - Browser:
          - Chrome: api/browser/chrome.md
          - Edge: api/browser/edge.md
          - Options: api/browser/options.md
          - Tab: api/browser/tab.md
          - Requests: api/browser/requests.md
          - Managers: api/browser/managers.md
      - Elements:
          - WebElement: api/elements/web_element.md
          - ShadowRoot: api/elements/shadow_root.md
          - Mixins: api/elements/mixins.md
      - Connection:
          - Connection Handler: api/connection/connection.md
          - Managers: api/connection/managers.md
      - Commands:
          - Overview: api/commands/index.md
          - Browser: api/commands/browser.md
          - DOM: api/commands/dom.md
          - Input: api/commands/input.md
          - Network: api/commands/network.md
          - Page: api/commands/page.md
          - Runtime: api/commands/runtime.md
          - Storage: api/commands/storage.md
          - Target: api/commands/target.md
          - Fetch: api/commands/fetch.md
      - Protocol:
          - Base Types: api/protocol/base.md
          - Browser: api/protocol/browser.md
          - DOM: api/protocol/dom.md
          - Fetch: api/protocol/fetch.md
          - Input: api/protocol/input.md
          - Network: api/protocol/network.md
          - Page: api/protocol/page.md
          - Runtime: api/protocol/runtime.md
          - Storage: api/protocol/storage.md
          - Target: api/protocol/target.md
      - Core:
          - Constants: api/core/constants.md
          - Exceptions: api/core/exceptions.md
          - Utils: api/core/utils.md

theme:
  name: material
  font:
    text: Roboto
    code: Roboto Mono
  palette:
    - media: "(prefers-color-scheme: dark)"
      scheme: slate
      primary: custom
      accent: indigo
      toggle:
        icon: material/toggle-switch-off-outline
        name: Dark Mode
  
    - media: "(prefers-color-scheme: light)"
      scheme: default
      primary: custom
      accent: indigo
      toggle:
        icon: material/toggle-switch
        name: Light Mode
  icon:
    repo: fontawesome/brands/github
    logo: material/lightning-bolt
  favicon: resources/images/favicon.png
  features:
    - navigation.tabs
    - navigation.tabs.sticky
    - navigation.sections
    - navigation.indexes
    - navigation.expand
    - navigation.path
    - navigation.top
    - toc.follow
    - content.code.copy
    - content.code.select
    - content.tooltips
    - search.highlight
    - search.suggest
  
plugins:
  - search
  - i18n:
      docs_structure: folder
      fallback_to_default: true
      reconfigure_material: false
      reconfigure_search: true
      languages:
        - locale: en
          default: true
          name: English
          build: true
          site_name: "Pydoll - Async Web Automation Library"
        - locale: zh
          name: 中文
          build: true
          site_name: "Pydoll - 异步网页自动化库"
          nav_translations:
            Pydoll: Pydoll
            Features: 特性
            Overview: 概述
            Core Concepts: 核心概念
            Element Finding: 元素查找
            Automation: 自动化
            Human-Like Interactions: 类人交互
            Keyboard Control: 键盘控制
            Mouse Control: 鼠标控制
            File Operations: 文件操作
            IFrames: IFrame交互
            Screenshots & PDF: 截图与PDF
            Network: 网络
            Network Monitoring: 网络监控
            Request Interception: 请求拦截
            Browser-Context HTTP Requests: 浏览器上下文HTTP请求
            HAR Network Recording: HAR网络录制
            Browser Management: 浏览器管理
            Multi-Tab Management: 多标签页管理
            Browser Contexts: 浏览器上下文
            Cookies & Sessions: Cookie与会话
            Configuration: 配置
            Browser Options: 浏览器选项
            Browser Preferences: 浏览器偏好设置
            Proxy Configuration: 代理配置
            Advanced: 高级功能
            Behavioral Captcha Bypass: 行为验证码绕过
            Event System: 事件系统
            Remote Connections: 远程连接
            Retry Decorator: Retry 装饰器
            Deep Dive: 深入了解
            Core Fundamentals: 核心基础
            Chrome DevTools Protocol: Chrome DevTools 协议
            Connection Layer: 连接层
            Python Type System: Python类型系统
            Internal Architecture: 内部架构
            Browser Domain: 浏览器域
            Tab Domain: 标签页域
            WebElement Domain: Web元素域
            FindElements Mixin: 查找元素混合器
            Event Architecture: 事件架构
            Browser Requests Architecture: 浏览器请求架构
            Shadow DOM: Shadow DOM 架构
            Network & Security: 网络与安全
            Network Fundamentals: 网络基础
            HTTP/HTTPS Proxies: HTTP/HTTPS 代理
            SOCKS Proxies: SOCKS 代理
            Proxy Detection: 代理检测
            Building Proxy Servers: 构建代理服务器
            Legal & Ethical: 法律与道德
            Fingerprinting: 指纹识别
            Network Fingerprinting: 网络指纹识别
            Browser Fingerprinting: 浏览器指纹识别
            Behavioral Fingerprinting: 行为指纹识别
            Evasion Techniques: 规避技术
            Practical Guides: 实用指南
            CSS Selectors vs XPath: CSS选择器 vs XPath
            API Reference: API 参考
            Browser: 浏览器
            Chrome: Chrome
            Edge: Edge
            Options: 选项
            Tab: 标签页
            Requests: 请求
            Managers: 管理器
            Elements: 元素
            WebElement: Web元素
            ShadowRoot: Shadow根
            Mixins: 混合器
            Connection: 连接
            Connection Handler: 连接处理器
            Commands: 命令
            DOM: DOM
            Input: 输入
            Network: 网络
            Page: 页面
            Runtime: 运行时
            Storage: 存储
            Target: 目标
            Fetch: 获取
            Protocol: 协议
            Base Types: 基础类型
            Overview: 概述
            Events: 事件
            Browser: 浏览器
            DOM: DOM
            Fetch: 获取
            Input: 输入
            Network: 网络
            Page: 页面
            Runtime: 运行时
            Storage: 存储
            Target: 目标
            Core: 核心
            Constants: 常量
            Exceptions: 异常
            Utils: 工具
        - locale: pt
          name: Português (BR)
          build: true
          site_name: "Pydoll - Biblioteca de Automação Web Assíncrona"
          nav_translations:
            Pydoll: Pydoll
            Features: Recursos
            Overview: Visão Geral
            Core Concepts: Conceitos Fundamentais
            Element Finding: Pesquisa de Elementos
            Automation: Automação
            Human-Like Interactions: Interações Humanas
            Keyboard Control: Controle de Teclado
            Mouse Control: Controle do Mouse
            File Operations: Operações com Arquivos
            IFrames: IFrames
            Screenshots & PDF: Capturas e PDF
            Network: Rede
            Network Monitoring: Monitoramento de Rede
            Request Interception: Interceptação de Requisições
            Browser-Context HTTP Requests: Requisições HTTP no Contexto do Navegador
            HAR Network Recording: Gravação de Rede HAR
            Browser Management: Gerenciamento do Navegador
            Multi-Tab Management: Gerenciamento de Abas
            Browser Contexts: Contextos do Navegador
            Cookies & Sessions: Cookies e Sessões
            Configuration: Configuração
            Browser Options: Opções do Navegador
            Browser Preferences: Preferências do Navegador
            Proxy Configuration: Configuração de Proxy
            Advanced: Avançado
            Behavioral Captcha Bypass: Bypass de Captcha Comportamental
            Event System: Sistema de Eventos
            Remote Connections: Conexões Remotas
            Retry Decorator: Decorator Retry
            Deep Dive: Análise Profunda
            Core Fundamentals: Fundamentos Centrais
            Chrome DevTools Protocol: Protocolo Chrome DevTools
            Connection Layer: Camada de Conexão
            Python Type System: Sistema de Tipos Python
            Internal Architecture: Arquitetura Interna
            Browser Domain: Domínio do Navegador
            Tab Domain: Domínio da Aba
            WebElement Domain: Domínio do WebElement
            FindElements Mixin: Mixin FindElements
            Event Architecture: Arquitetura de Eventos
            Browser Requests Architecture: Arquitetura de Requisições do Navegador
            Shadow DOM: Arquitetura Shadow DOM
            Network & Security: Rede e Segurança
            Network Fundamentals: Fundamentos de Rede
            HTTP/HTTPS Proxies: Proxies HTTP/HTTPS
            SOCKS Proxies: Proxies SOCKS
            Proxy Detection: Detecção de Proxy
            Building Proxy Servers: Construindo Servidores Proxy
            Legal & Ethical: Legal & Ética
            Fingerprinting: Fingerprinting
            Network Fingerprinting: Fingerprinting de Rede
            Browser Fingerprinting: Fingerprinting do Navegador
            Behavioral Fingerprinting: Fingerprinting Comportamental
            Evasion Techniques: Técnicas de Evasão
            Practical Guides: Guias Práticos
            CSS Selectors vs XPath: Seletores CSS vs XPath
            API Reference: Referência da API
            Browser: Navegador
            Chrome: Chrome
            Edge: Edge
            Options: Opções
            Tab: Aba
            Requests: Requisições
            Managers: Gerenciadores
            Elements: Elementos
            WebElement: Elemento Web
            ShadowRoot: Shadow Root
            Mixins: Mixins
            Connection: Conexão
            Connection Handler: Manipulador de Conexão
            Commands: Comandos
            DOM: DOM
            Input: Entrada
            Network: Rede
            Page: Página
            Runtime: Tempo de Execução
            Storage: Armazenamento
            Target: Alvo
            Fetch: Fetch
            Protocol: Protocolo
            Base Types: Tipos Base
            Overview: Visão Geral
            Events: Eventos
            Browser: Navegador
            DOM: DOM
            Fetch: Fetch
            Input: Entrada
            Network: Rede
            Page: Página
            Runtime: Tempo de Execução
            Storage: Armazenamento
            Target: Alvo
            Core: Núcleo
            Constants: Constantes
            Exceptions: Exceções
            Utils: Utilitários
  - mkdocstrings:
      handlers:
        python:
          options:
            show_root_heading: true
            show_if_no_docstring: true
            inherited_members: true
            members_order: source
            separate_signature: true
            filters:
            - '!^_'
            - '!^__'
            merge_init_into_class: true
            docstring_section_style: spacy
            signature_crossrefs: true
            show_symbol_type_heading: true
            show_symbol_type_toc: true
            show_source: false
            show_bases: true
            heading_level: 1

extra:   
  alternate:
    - name: English
      link: /docs/
      lang: en
    - name: Português (BR)
      link: /docs/pt/
      lang: pt
    - name: 中文
      link: /docs/zh/
      lang: zh

extra_css:
  - resources/stylesheets/termynal.css
  - resources/stylesheets/extra.css

extra_javascript:
  - resources/scripts/termynal.js
  - resources/scripts/extra.js
  - https://unpkg.com/mermaid@10.0.0/dist/mermaid.min.js

markdown_extensions:
  - pymdownx.critic
  - pymdownx.highlight:
      anchor_linenums: true
      line_spans: __span
      pygments_lang_class: true
  - pymdownx.inlinehilite
  - pymdownx.snippets
  - pymdownx.superfences:
      custom_fences:
        - name: mermaid
          class: mermaid
          format: !!python/name:pymdownx.superfences.fence_code_format
  - pymdownx.details
  - pymdownx.keys
  - footnotes
  - admonition
  - markdown.extensions.attr_list
  - pymdownx.tabbed:
      alternate_style: true
  - attr_list
  - pymdownx.emoji:
      emoji_index: !!python/name:material.extensions.emoji.twemoji
      emoji_generator: !!python/name:material.extensions.emoji.to_svg
  - md_in_html

================================================
FILE: public/index.html
================================================
<!DOCTYPE html>
<html lang="en">
  <head>
    <meta charset="UTF-8" />
    <meta name="viewport" content="width=device-width, initial-scale=1.0" />
    <meta name="theme-color" content="#0b1220" />
    <title>Pydoll - scraping, the easier way</title>
    <meta name="description" content="Pydoll is a Python browser automation library built on CDP with zero configuration, async performance, intuitive API, and full type safety. Simple, powerful web automation." />
    <meta name="keywords" content="pydoll, browser automation, web automation, web scraping, scraping, data scraping, data extraction, crawler, crawling, headless browser, headless chrome, chrome devtools protocol, devtools protocol, cdp, python cdp, chrome cdp, async python, asyncio, network interception, request interception, browser context requests, http requests browser context, humanized interactions, human-like interactions, automation library, scraping framework, type safety, zero configuration, concurrent automation, browser preferences, downloads, python automation, modern web scraping" />
    <meta name="robots" content="index,follow" />
    <link rel="canonical" href="https://pydoll.tech/" />

    <!-- Open Graph -->
    <meta property="og:title" content="Pydoll - scraping, the easier way" />
    <meta property="og:description" content="Python browser automation with zero configuration, async performance, intuitive API, and full type safety. Simple, powerful web automation." />
    <meta property="og:type" content="website" />
    <meta property="og:image" content="https://pydoll.tech/images/logo.png" />
    <meta property="og:url" content="https://pydoll.tech/" />
    <meta property="og:site_name" content="Pydoll" />
    <meta property="og:locale" content="en_US" />
    <meta property="og:locale:alternate" content="pt_BR" />

    <!-- Twitter Card -->
    <meta name="twitter:card" content="summary_large_image" />
    <meta name="twitter:title" content="Pydoll - scraping, the easier way" />
    <meta name="twitter:description" content="Python browser automation with zero configuration, async performance, intuitive API, and full type safety." />
    <meta name="twitter:image" content="https://pydoll.tech/images/logo.png" />

    <!-- Performance hints -->
    <link rel="preconnect" href="https://cdn.tailwindcss.com" />
    <link rel="preconnect" href="https://cdn.jsdelivr.net" />
    <link rel="preconnect" href="https://pydoll.tech/" />

    <!-- Favicon -->
    <link rel="icon" type="image/png" href="/images/favicon.png" sizes="48x48 32x32 16x16" />
    <link rel="shortcut icon" type="image/png" href="/images/favicon.png" />
    <link rel="apple-touch-icon" href="/images/favicon.png" />

    <!-- Tailwind CSS via CDN -->
    <script src="https://cdn.tailwindcss.com"></script>
    <!-- Schema.org: SoftwareApplication / SoftwareSourceCode -->
    <script type="application/ld+json">
      {
        "@context": "https://schema.org",
        "@graph": [
          {
            "@type": "Organization",
            "@id": "https://pydoll.tech/#org",
            "name": "Pydoll",
            "url": "https://pydoll.tech/",
            "logo": {
              "@type": "ImageObject",
              "url": "https://pydoll.tech/images/logo.png"
            },
            "sameAs": [
              "https://pypi.org/project/pydoll-python/"
            ]
          },
          {
            "@type": "WebSite",
            "@id": "https://pydoll.tech/#website",
            "name": "Pydoll",
            "url": "https://pydoll.tech/",
            "publisher": { "@id": "https://pydoll.tech/#org" },
            "inLanguage": "en",
            "potentialAction": {
              "@type": "SearchAction",
              "target": "https://pydoll.tech/docs/search/?q={search_term_string}",
              "query-input": "required name=search_term_string"
            }
          },
          {
            "@type": "WebPage",
            "@id": "https://pydoll.tech/#webpage",
            "url": "https://pydoll.tech/",
            "name": "Pydoll - scraping, the easier way",
            "isPartOf": { "@id": "https://pydoll.tech/#website" },
            "about": { "@id": "https://pydoll.tech/#software" },
            "description": "Pydoll is a Python CDP browser automation library for web scraping, with zero configuration, async performance, and intuitive API."
          },
          {
            "@type": "SoftwareApplication",
            "@id": "https://pydoll.tech/#software",
            "name": "Pydoll",
            "applicationCategory": "DeveloperApplication",
            "operatingSystem": "Windows, macOS, Linux",
            "programmingLanguage": "Python",
            "url": "https://pydoll.tech/",
            "image": "https://pydoll.tech/images/logo.png",
            "description": "Python library for browser automation via Chrome DevTools Protocol (CDP), with zero configuration, async performance, intuitive API, and full type safety.",
            "publisher": { "@id": "https://pydoll.tech/#org" },
            "offers": {
              "@type": "Offer",
              "price": 0,
              "priceCurrency": "USD"
            },
            "codeRepository": "https://github.com/autoscrape-labs/pydoll",
            "sameAs": [
              "https://pypi.org/project/pydoll-python/"
            ],
            "keywords": [
              "Pydoll",
              "browser automation",
              "web scraping",
              "Chrome DevTools Protocol",
              "async Python",
              "type safety",
              "zero configuration",
              "concurrent automation"
            ],
            "mainEntityOfPage": {"@id":"https://pydoll.tech/#webpage"}
          },
          {
            "@type": "FAQPage",
            "@id": "https://pydoll.tech/#faq",
            "mainEntity": [
              {
                "@type": "Question",
                "name": "What is Pydoll and why doesn't it use WebDriver?",
                "acceptedAnswer": {
                  "@type": "Answer",
                  "text": "Pydoll is a Python library that controls the browser via the Chrome DevTools Protocol (CDP), eliminating WebDrivers. This reduces layers, improves reliability and gives direct access to page events, network interception and JavaScript execution in the real tab context."
                }
              },
              {
                "@type": "Question",
                "name": "What makes Pydoll's setup so simple compared to other automation tools?",
                "acceptedAnswer": {
                  "@type": "Answer",
                  "text": "Just 'pip install pydoll-python' and you're ready. No WebDriver downloads, no PATH configuration, no version matching issues. Pydoll connects directly to Chrome via CDP, eliminating the entire driver layer that causes most automation headaches."
                }
              }
            ]
          }
        ]
      }
      </script>
      
    <script>
      // Runtime configuration for the Tailwind CDN build loaded above.
      // Adds a custom `brand` color scale (shades 50-900) under theme.extend,
      // which backs utility classes used in this page such as
      // `focus:ring-brand-500` and `from-brand-500/25`.
      tailwind.config = {
        theme: {
          extend: {
            colors: {
              // Shade number -> hex value, lightest (50) to darkest (900).
              brand: {
                50: '#eef2ff',
                100: '#e0e7ff',
                200: '#c7d2fe',
                300: '#a5b4fc',
                400: '#818cf8',
                500: '#6366f1',
                600: '#4f46e5',
                700: '#4338ca',
                800: '#3730a3',
                900: '#312e81'
              }
            }
          }
        }
      }
    </script>
    <!-- Prism.js (syntax highlight) -->
    <link rel="stylesheet" href="https://cdn.jsdelivr.net/npm/prismjs@1.29.0/themes/prism-twilight.min.css" />
    <style>
      /* Harmonize code block background with Tailwind bg-slate-950 */
      :root { --code-bg: #020617; }
      html { scroll-behavior: smooth; }
      /* Reveal on scroll */
      .reveal { opacity: 0; transform: translateY(12px); transition: opacity .6s ease, transform .6s ease; will-change: transform, opacity; }
      .revealed { opacity: 1; transform: none; }
      /* Tilt base */
      .tilt-card { transform-style: preserve-3d; transform: perspective(1000px); transition: transform .18s ease, box-shadow .18s ease; }
      .tilt-card:hover { transition: transform .06s ease; }
      pre[class*="language-"], code[class*="language-"] {
        background: var(--code-bg) !important;
        font-size: 13px !important;
        line-height: 1.5 !important;
      }
      pre[class*="language-"] { 
        border: 1px solid rgba(255,255,255,0.1); 
        border-radius: 8px;
        margin: 0;
        overflow-x: auto;
        overflow-y: hidden; /* avoid vertical scrollbar differences (Chrome vs Firefox) */
      }
      /* Remove inner padding from code so pre controls spacing */
      pre[class*="language-"] > code { 
        background: transparent !important; 
        padding: 0;
      }
      /* Ensure syntax highlighting works */
      .token.keyword { color: #c792ea !important; }
      .token.string { color: #c3e88d !important; }
      .token.function { color: #82aaff !important; }
      .token.comment { color: #546e7a !important; }
      .token.operator { color: #89ddff !important; }
      .token.punctuation { color: #89ddff !important; }
      .token.builtin { color: #ffcb6b !important; }
      .token.class-name { color: #ffcb6b !important; }
    </style>
  </head>
  <body class="bg-slate-950 text-slate-100 antialiased">
    <!-- Navbar -->
    <header class="sticky top-0 z-50 backdrop-blur supports-[backdrop-filter]:bg-slate-950/60">
      <div class="mx-auto max-w-7xl px-4 sm:px-6 lg:px-8">
        <div class="flex h-16 items-center justify-between">
          <a href="/" class="flex items-center gap-3">
            <img src="https://pydoll.tech/images/logo.png" alt="Pydoll" class="h-8 w-auto" />
          </a>
          <!-- Desktop nav -->
          <nav class="hidden items-center gap-2 sm:flex sm:gap-3">
            <a href="https://pydoll.tech/docs/" class="px-3 py-2 text-sm font-medium text-slate-200 hover:text-white">Docs</a>
            <a href="#install" class="px-3 py-2 text-sm font-medium text-slate-200 hover:text-white">Install</a>
            <a href="#sponsors" class="px-3 py-2 text-sm font-medium text-slate-200 hover:text-white">Sponsors</a>
            <a href="#faq" class="px-3 py-2 text-sm font-medium text-slate-200 hover:text-white">FAQ</a>
            <a href="https://github.com/sponsors/thalissonvs" target="_blank" rel="noopener" class="px-3 py-2 text-sm font-medium text-slate-200 hover:text-white">Sponsor</a>
            <a href="https://github.com/autoscrape-labs/pydoll" target="_blank" rel="noopener" aria-label="Star on GitHub" class="inline-flex items-center gap-2 rounded-md bg-yellow-500 px-3 py-2 text-sm font-semibold text-slate-900 shadow hover:bg-yellow-400">
              <svg xmlns="http://www.w3.org/2000/svg" class="h-4 w-4" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round"><polygon points="12 2 15 9 22 9 17 14 19 22 12 18 5 22 7 14 2 9 9 9 12 2"/></svg>
              Star
              <span id="starCount" class="hidden rounded px-2 py-0.5 text-slate-900 sm:inline-block">...</span>
            </a>
          </nav>
          <!-- Mobile toggle -->
          <button id="mobileMenuButton" aria-controls="mobileMenu" aria-expanded="false" class="inline-flex items-center justify-center rounded-md p-2 text-slate-200 hover:text-white hover:bg-white/5 focus:outline-none focus:ring-2 focus:ring-brand-500 sm:hidden" type="button">
            <span class="sr-only">Open main menu</span>
            <svg id="iconMenu" xmlns="http://www.w3.org/2000/svg" class="h-6 w-6" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round"><line x1="3" y1="6" x2="21" y2="6"/><line x1="3" y1="12" x2="21" y2="12"/><line x1="3" y1="18" x2="21" y2="18"/></svg>
            <svg id="iconClose" xmlns="http://www.w3.org/2000/svg" class="hidden h-6 w-6" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round"><line x1="18" y1="6" x2="6" y2="18"/><line x1="6" y1="6" x2="18" y2="18"/></svg>
          </button>
        </div>
        <!-- Mobile menu panel -->
        <div id="mobileMenu" class="hidden sm:hidden">
          <div class="space-y-1 border-t border-white/10 py-3">
            <a href="https://pydoll.tech/docs/" class="block rounded-md px-3 py-2 text-sm font-medium text-slate-200 hover:bg-white/5">Docs</a>
            <a href="#install" class="block rounded-md px-3 py-2 text-sm font-medium text-slate-200 hover:bg-white/5">Install</a>
            <a href="#sponsors" class="block rounded-md px-3 py-2 text-sm font-medium text-slate-200 hover:bg-white/5">Sponsors</a>
            <a href="#faq" class="block rounded-md px-3 py-2 text-sm font-medium text-slate-200 hover:bg-white/5">FAQ</a>
            <a href="https://github.com/sponsors/thalissonvs" target="_blank" rel="noopener" class="block rounded-md px-3 py-2 text-sm font-medium text-slate-200 hover:bg-white/5">Sponsor</a>
            <a href="https://github.com/autoscrape-labs/pydoll" target="_blank" rel="noopener" class="mt-2 inline-flex w-full items-center justify-center gap-2 rounded-md bg-yellow-500 px-3 py-2 text-sm font-semibold text-slate-900 shadow hover:bg-yellow-400"><svg xmlns="http://www.w3.org/2000/svg" class="h-4 w-4" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round"><polygon points="12 2 15 9 22 9 17 14 19 22 12 18 5 22 7 14 2 9 9 9 12 2"/></svg> Star</a>
          </div>
        </div>
      </div>
    </header>

    <!-- Hero -->
    <section id="hero" class="relative overflow-hidden">
      <div id="heroGradient" class="pointer-events-none absolute inset-0 -z-10 h-full bg-gradient-to-b from-indigo-600/30 via-fuchsia-600/10 to-transparent blur-3xl"></div>
      <div id="cursorGlow" aria-hidden="true" class="pointer-events-none absolute -z-10 hidden h-72 w-72 rounded-full bg-gradient-to-tr from-brand-500/25 via-fuchsia-500/15 to-transparent blur-3xl sm:block" style="left:0;top:0;"></div>
      <div class="mx-auto max-w-7xl px-4 pb-12 pt-16 sm:pb-16 sm:pt-24 lg:flex lg:items-start lg:gap-12 lg:px-8">
        <div class="mx-auto max-w-2xl lg:mx-0 lg:flex-auto">
          <h1 class="text-4xl font-bold tracking-tight sm:text-6xl">
            Pydoll: scraping, the easier way
          </h1>
          <p class="mt-6 text-lg leading-8 text-slate-300">
            Built from scratch with zero configuration complexity, Pydoll connects directly to the Chrome DevTools Protocol. 
            No WebDrivers, no setup headaches - just async performance, intuitive API, and full type safety.
          </p>
          <div class="mt-8 flex flex-col gap-3 sm:flex-row sm:items-center">
            <a href="https://github.com/autoscrape-labs/pydoll" target="_blank" rel="noopener" class="inline-flex items-center justify-center gap-2 rounded-md bg-yellow-500 px-5 py-3 text-base font-semibold text-slate-900 shadow hover:bg-yellow-400">
              <svg xmlns="http://www.w3.org/2000/svg" class="h-5 w-5" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round"><polygon points="12 2 15 9 22 9 17 14 19 22 12 18 5 22 7 14 2 9 9 9 12 2"/></svg>
              Star on GitHub
            </a>
            <a href="https://pydoll.tech/docs/" class="inline-flex items-center justify-center gap-2 rounded-md border border-white/10 px-5 py-3 text-base font-semibold text-white/90 hover:bg-white/5">
              📖 View Documentation
            </a>
            <a href="#install" class="inline-flex items-center justify-center gap-2 rounded-md bg-slate-800 px-5 py-3 text-base font-semibold text-white/90 hover:bg-slate-700">
              ⬇️ Install via pip
            </a>
          </div>
          
        </div>
        <div class="mt-12 w-full lg:mt-0 lg:max-w-xl lg:flex-none reveal">
          <div class="tilt-card relative overflow-hidden rounded-xl border border-white/10 bg-slate-900/40 p-6 shadow-xl">
            <div class="space-y-4">
              <div class="flex items-center gap-3">
              </div>
              <div class="rounded-lg bg-slate-950 p-0">
                <iframe 
                  class="w-full aspect-video rounded-lg" 
                  src="https://www.youtube.com/embed/sSw5dS3dQ8k" 
                  title="YouTube video player" 
                  frameborder="0" 
                  allow="accelerometer; autoplay; clipboard-write; encrypted-media; gyroscope; picture-in-picture" 
                  allowfullscreen>
                </iframe>
              </div>
              <div class="flex items-center justify-between text-xs text-slate-400">
                <span>✨ Simple, powerful, async</span>
                <span>🚀 Ready in seconds</span>
              </div>
            </div>
          </div>
        </div>
      </div>
    </section>

    <!-- Quick Intro / Features -->
    <section class="mx-auto max-w-7xl px-4 pt-10 pb-6 sm:px-6 lg:px-8">
      <!--
        Feature cards. Each card is a div with role="button" whose aria-controls names the
        modal element it is associated with. A div is not focusable by default, so every card
        carries tabindex="0" to be reachable with the keyboard.
        NOTE(review): confirm script.js also activates the cards on Enter/Space, not only on click.
      -->
      <div class="grid gap-6 sm:grid-cols-2 lg:grid-cols-3">
        <div id="cardZeroConfig" role="button" tabindex="0" aria-controls="modalZeroConfig" class="reveal tilt-card cursor-pointer rounded-xl border border-white/10 bg-slate-900/40 p-6 transition-transform duration-200 hover:bg-white/5">
          <h3 class="flex items-center gap-2 text-lg font-semibold">
            <svg class="h-5 w-5 text-slate-300" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="1.5" stroke-linecap="round" stroke-linejoin="round" aria-hidden="true">
              <circle cx="12" cy="12" r="9"></circle>
              <line x1="5" y1="5" x2="19" y2="19"></line>
            </svg>
            <span>Zero Configuration</span>
          </h3>
          <p class="mt-2 text-sm text-slate-300">Install and automate immediately. No drivers, no PATH variables, no setup hell.</p>
        </div>
        <div id="cardAsync" role="button" tabindex="0" aria-controls="modalAsync" class="reveal tilt-card cursor-pointer rounded-xl border border-white/10 bg-slate-900/40 p-6 transition-transform duration-200 hover:bg-white/5">
          <h3 class="flex items-center gap-2 text-lg font-semibold">
            <svg class="h-5 w-5 text-slate-300" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="1.5" stroke-linecap="round" stroke-linejoin="round" aria-hidden="true">
              <polyline points="8,7 4,12 8,17"></polyline>
              <polyline points="16,7 20,12 16,17"></polyline>
            </svg>
            <span>Async by Design</span>
          </h3>
          <p class="mt-2 text-sm text-slate-300">Built for concurrent automation with true async/await support from day one.</p>
        </div>
        <div id="cardTypeSafety" role="button" tabindex="0" aria-controls="modalTypeSafety" class="reveal tilt-card cursor-pointer rounded-xl border border-white/10 bg-slate-900/40 p-6 transition-transform duration-200 hover:bg-white/5">
          <h3 class="flex items-center gap-2 text-lg font-semibold">
            <svg class="h-5 w-5 text-slate-300" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="1.5" stroke-linecap="round" stroke-linejoin="round" aria-hidden="true">
              <path d="M9 12l2 2 4-4"></path>
              <path d="M21 12c0 4.97-4.03 9-9 9s-9-4.03-9-9 4.03-9 9-9c1.7 0 3.28.47 4.64 1.28"></path>
            </svg>
            <span>Full Type Safety</span>
          </h3>
          <p class="mt-2 text-sm text-slate-300">Complete type annotations. Your IDE knows exactly what each method returns.</p>
        </div>
        <div id="cardRequests" role="button" tabindex="0" aria-controls="modalRequests" class="reveal tilt-card cursor-pointer rounded-xl border border-white/10 bg-slate-900/40 p-6 transition-transform duration-200 hover:bg-white/5">
          <h3 class="flex items-center gap-2 text-lg font-semibold">
            <svg class="h-5 w-5 text-slate-300" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="1.5" stroke-linecap="round" stroke-linejoin="round" aria-hidden="true">
              <circle cx="12" cy="12" r="9"></circle>
              <ellipse cx="12" cy="12" rx="4" ry="9"></ellipse>
              <line x1="3" y1="12" x2="21" y2="12"></line>
            </svg>
            <span>Browser-context requests</span>
          </h3>
          <p class="mt-2 text-sm text-slate-300">Use <code>tab.request</code> to automatically inherit cookies, CORS and session state.</p>
        </div>
        <div id="cardIntuitive" role="button" tabindex="0" aria-controls="modalIntuitive" class="reveal tilt-card cursor-pointer rounded-xl border border-white/10 bg-slate-900/40 p-6 transition-transform duration-200 hover:bg-white/5">
          <h3 class="flex items-center gap-2 text-lg font-semibold">
            <svg class="h-5 w-5 text-slate-300" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="1.5" stroke-linecap="round" stroke-linejoin="round" aria-hidden="true">
              <line x1="12" y1="6" x2="12" y2="18"></line>
              <line x1="6" y1="12" x2="18" y2="12"></line>
              <circle cx="12" cy="12" r="1.5"></circle>
            </svg>
            <span>Intuitive API</span>
          </h3>
          <p class="mt-2 text-sm text-slate-300">Element finding feels like natural language. Simple, readable automation code.</p>
        </div>
        <div id="cardEvents" role="button" tabindex="0" aria-controls="modalEvents" class="reveal tilt-card cursor-pointer rounded-xl border border-white/10 bg-slate-900/40 p-6 transition-transform duration-200 hover:bg-white/5">
          <h3 class="flex items-center gap-2 text-lg font-semibold">
            <svg class="h-5 w-5 text-slate-300" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="1.5" stroke-linecap="round" stroke-linejoin="round" aria-hidden="true">
              <polyline points="3,12 8,12 10,8 12,16 14,12 21,12"></polyline>
            </svg>
            <span>Event-driven automation</span>
          </h3>
          <p class="mt-2 text-sm text-slate-300">React to page, network and runtime events in real-time.</p>
        </div>
      </div>
    </section>

    <!-- Feature Modals -->
    <!-- "Zero Configuration" modal: hidden by default (class "hidden"); the outer div is the full-screen backdrop,
         the inner panel is exposed to assistive technology as a modal dialog titled by its heading.
         NOTE(review): confirm script.js moves focus into the panel when it opens. -->
    <div id="modalZeroConfig" class="fixed inset-0 z-[999] hidden items-center justify-center bg-black/70 p-4">
      <div role="dialog" aria-modal="true" aria-labelledby="modalZeroConfigTitle" class="relative w-full max-w-3xl rounded-xl border border-white/10 bg-slate-900 p-4 sm:p-6 shadow-2xl">
        <button id="closeZeroConfigModal" aria-label="Close" class="absolute right-3 top-3 rounded-full border border-white/10 bg-slate-800/80 p-1.5 text-slate-300 hover:bg-slate-700 hover:text-white">
          <svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="h-4 w-4"><line x1="18" y1="6" x2="6" y2="18"/><line x1="6" y1="6" x2="18" y2="18"/></svg>
        </button>
        <div class="mb-3 flex items-center justify-between pr-10">
          <h4 id="modalZeroConfigTitle" class="text-lg font-semibold">Zero Configuration</h4>
        </div>
        <p class="mb-3 text-sm text-slate-300">Install and automate with a single command. No drivers, no PATH, no setup hell.</p>
        <pre id="zeroConfigCode" class="language-python overflow-x-auto rounded-lg border border-white/10 bg-slate-950 p-4"><code class="language-python">from pydoll.browser import Chrome

async def run():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://example.com')
</code></pre>
      </div>
    </div>

    <!-- "Async by Design" modal: hidden by default (class "hidden"); the outer div is the full-screen backdrop,
         the inner panel is exposed to assistive technology as a modal dialog titled by its heading.
         The sample manages the browser with "async with" (as the other samples on this page do) so it is
         closed when the block exits, and it actually invokes main().
         NOTE(review): confirm script.js moves focus into the panel when it opens. -->
    <div id="modalAsync" class="fixed inset-0 z-[999] hidden items-center justify-center bg-black/70 p-4">
      <div role="dialog" aria-modal="true" aria-labelledby="modalAsyncTitle" class="relative w-full max-w-3xl rounded-xl border border-white/10 bg-slate-900 p-4 sm:p-6 shadow-2xl">
        <button id="closeAsyncModal" aria-label="Close" class="absolute right-3 top-3 rounded-full border border-white/10 bg-slate-800/80 p-1.5 text-slate-300 hover:bg-slate-700 hover:text-white">
          <svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="h-4 w-4"><line x1="18" y1="6" x2="6" y2="18"/><line x1="6" y1="6" x2="18" y2="18"/></svg>
        </button>
        <div class="mb-3 flex items-center justify-between pr-10">
          <h4 id="modalAsyncTitle" class="text-lg font-semibold">Async by Design</h4>
        </div>
        <p class="mb-3 text-sm text-slate-300">Run multiple tabs concurrently with true async/await.</p>
        <pre id="asyncCode" class="language-python overflow-x-auto rounded-lg border border-white/10 bg-slate-950 p-4"><code class="language-python">import asyncio
from pydoll.browser import Chrome

async def scrape(url, tab):
    await tab.go_to(url)
    return await tab.execute_script('return document.title')

async def main():
    async with Chrome() as browser:
        tab1 = await browser.start()
        tab2 = await browser.new_tab()
        titles = await asyncio.gather(
            scrape('https://google.com', tab1),
            scrape('https://github.com', tab2),
        )
        print(titles)

asyncio.run(main())
</code></pre>
      </div>
    </div>

    <!-- "Full Type Safety" modal: hidden by default (class "hidden"); the outer div is the full-screen backdrop,
         the inner panel is exposed to assistive technology as a modal dialog titled by its heading.
         NOTE(review): confirm script.js moves focus into the panel when it opens. -->
    <div id="modalTypeSafety" class="fixed inset-0 z-[999] hidden items-center justify-center bg-black/70 p-4">
      <div role="dialog" aria-modal="true" aria-labelledby="modalTypeSafetyTitle" class="relative w-full max-w-3xl rounded-xl border border-white/10 bg-slate-900 p-4 sm:p-6 shadow-2xl">
        <button id="closeTypeSafetyModal" aria-label="Close" class="absolute right-3 top-3 rounded-full border border-white/10 bg-slate-800/80 p-1.5 text-slate-300 hover:bg-slate-700 hover:text-white">
          <svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="h-4 w-4"><line x1="18" y1="6" x2="6" y2="18"/><line x1="6" y1="6" x2="18" y2="18"/></svg>
        </button>
        <div class="mb-3 flex items-center justify-between pr-10">
          <h4 id="modalTypeSafetyTitle" class="text-lg font-semibold">Full Type Safety</h4>
        </div>
        <p class="mb-3 text-sm text-slate-300">Your IDE knows exactly what each call returns.</p>
        <pre id="typeSafetyCode" class="language-python overflow-x-auto rounded-lg border border-white/10 bg-slate-950 p-4"><code class="language-python"># The IDE knows exactly what each call returns:
await tab.find(id='username')                 # → WebElement
await tab.find(id='username', find_all=True)  # → list[WebElement]
await tab.find(id='username', raise_exc=False)  # → WebElement | None
</code></pre>
      </div>
    </div>

    <!-- "Browser-context requests" modal: hidden by default (class "hidden"); the outer div is the full-screen
         backdrop, the inner panel is exposed to assistive technology as a modal dialog titled by its heading.
         NOTE(review): confirm script.js moves focus into the panel when it opens. -->
    <div id="modalRequests" class="fixed inset-0 z-[999] hidden items-center justify-center bg-black/70 p-4">
      <div role="dialog" aria-modal="true" aria-labelledby="modalRequestsTitle" class="relative w-full max-w-3xl rounded-xl border border-white/10 bg-slate-900 p-4 sm:p-6 shadow-2xl">
        <button id="closeRequestsModal" aria-label="Close" class="absolute right-3 top-3 rounded-full border border-white/10 bg-slate-800/80 p-1.5 text-slate-300 hover:bg-slate-700 hover:text-white">
          <svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="h-4 w-4"><line x1="18" y1="6" x2="6" y2="18"/><line x1="6" y1="6" x2="18" y2="18"/></svg>
        </button>
        <div class="mb-3 flex items-center justify-between pr-10">
          <h4 id="modalRequestsTitle" class="text-lg font-semibold">Browser-context requests</h4>
        </div>
        <p class="mb-3 text-sm text-slate-300">Perform HTTP in the same context as the tab: cookies, session and CORS are inherited automatically.</p>
        <pre id="requestsModalCode" class="language-python overflow-x-auto rounded-lg border border-white/10 bg-slate-950 p-4"><code class="language-python">await tab.go_to('https://app.example.com/login')
await (await tab.find(id='email')).type_text('user@example.com')
await (await tab.find(id='password')).type_text('secret')
await (await tab.find(type='submit')).click()

response = await tab.request.get('https://app.example.com/api/user/profile')
print(response.json())
</code></pre>
      </div>
    </div>

    <!-- "Intuitive API" modal: hidden by default (class "hidden"); the outer div is the full-screen backdrop,
         the inner panel is exposed to assistive technology as a modal dialog titled by its heading.
         NOTE(review): confirm script.js moves focus into the panel when it opens. -->
    <div id="modalIntuitive" class="fixed inset-0 z-[999] hidden items-center justify-center bg-black/70 p-4">
      <div role="dialog" aria-modal="true" aria-labelledby="modalIntuitiveTitle" class="relative w-full max-w-3xl rounded-xl border border-white/10 bg-slate-900 p-4 sm:p-6 shadow-2xl">
        <button id="closeIntuitiveModal" aria-label="Close" class="absolute right-3 top-3 rounded-full border border-white/10 bg-slate-800/80 p-1.5 text-slate-300 hover:bg-slate-700 hover:text-white">
          <svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="h-4 w-4"><line x1="18" y1="6" x2="6" y2="18"/><line x1="6" y1="6" x2="18" y2="18"/></svg>
        </button>
        <div class="mb-3 flex items-center justify-between pr-10">
          <h4 id="modalIntuitiveTitle" class="text-lg font-semibold">Intuitive API</h4>
        </div>
        <p class="mb-3 text-sm text-slate-300">Readable element finding using attributes, CSS or XPath.</p>
        <pre id="intuitiveCode" class="language-python overflow-x-auto rounded-lg border border-white/10 bg-slate-950 p-4"><code class="language-python">button = await tab.find(tag_name='button', text='Submit', class_name='btn-primary')
await button.click()

el = await tab.query('div[data-testid="awesome-element"]')
</code></pre>
      </div>
    </div>

    <!-- "Event-driven automation" modal: hidden by default (class "hidden"); the outer div is the full-screen
         backdrop, the inner panel is exposed to assistive technology as a modal dialog titled by its heading.
         NOTE(review): confirm script.js moves focus into the panel when it opens. -->
    <div id="modalEvents" class="fixed inset-0 z-[999] hidden items-center justify-center bg-black/70 p-4">
      <div role="dialog" aria-modal="true" aria-labelledby="modalEventsTitle" class="relative w-full max-w-3xl rounded-xl border border-white/10 bg-slate-900 p-4 sm:p-6 shadow-2xl">
        <button id="closeEventsModal" aria-label="Close" class="absolute right-3 top-3 rounded-full border border-white/10 bg-slate-800/80 p-1.5 text-slate-300 hover:bg-slate-700 hover:text-white">
          <svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="h-4 w-4"><line x1="18" y1="6" x2="6" y2="18"/><line x1="6" y1="6" x2="18" y2="18"/></svg>
        </button>
        <div class="mb-3 flex items-center justify-between pr-10">
          <h4 id="modalEventsTitle" class="text-lg font-semibold">Event-driven automation</h4>
        </div>
        <p class="mb-3 text-sm text-slate-300">React to page and network changes in real-time using the built-in event system.</p>
        <pre id="eventsCode" class="language-python overflow-x-auto rounded-lg border border-white/10 bg-slate-950 p-4"><code class="language-python"># Enable and listen to network events
await tab.enable_network_events()

async def on_response(params):
    info = params.get('response', {})
    print('status:', info.get('status'))

await tab.on('Network.responseReceived', on_response)
</code></pre>
      </div>
    </div>

    <!-- Stars Goal Section -->
    <section id="stars-goal" class="mx-auto max-w-7xl px-4 py-12 sm:px-6 lg:px-8">
      <div class="reveal rounded-xl border border-white/10 bg-slate-900/60 p-5 sm:p-6 transition-transform duration-200 hover:shadow-[0_10px_30px_rgba(99,102,241,0.15)]">
        <div class="flex flex-col gap-4 sm:flex-row sm:items-center sm:justify-between">
          <div class="min-w-0">
            <h3 class="text-xl font-semibold">Help us reach 10k stars</h3>
            <p class="mt-1 text-sm text-slate-300">🚀 Your star means more features, more contributors, and a stronger community.</p>
            <div class="mt-4">
              <div class="flex items-center justify-between text-xs text-slate-400">
                <span id="starsProgressLabel">0 / 10,000</span>
                <span id="starsProgressPct">0%</span>
              </div>
              <div class="mt-2 h-2 w-full rounded-full bg-white/10 overflow-hidden">
                <div id="starsProgressBar" class="h-2 rounded-full bg-brand-500" style="width:0%"></div>
              </div>
            </div>
          </div>
          <div class="flex flex-col items-start sm:items-end gap-3">
            <div class="min-w-[220px]">
              <p class="text-xs font-medium text-slate-300">Latest stargazers</p>
              <ul id="stargazersList" class="mt-2 flex flex-wrap items-center gap-2">
                <!-- Filled via JS -->
              </ul>
            </div>
          </div>
        </div>
      </div>
    </section>
    <!-- Install CTA -->
    <section id="install" class="overflow-x-hidden">
      <div class="mx-auto max-w-7xl px-4 py-10 sm:px-6 lg:px-8">
        <div class="grid grid-cols-1 items-center gap-8 lg:grid-cols-2">
          <div class="min-w-0">
            <h2 class="text-2xl font-bold tracking-tight">Install and get started in seconds</h2>
            <p class="mt-3 text-slate-300">No complex setup. Install, import and automate.</p>
            <div class="mt-6 rounded-lg border border-white/10 bg-slate-950 p-3 sm:p-4">
              <div class="flex items-center gap-3 flex-wrap sm:flex-nowrap">
                <code id="installCmd" class="text-sm block max-w-full whitespace-nowrap overflow-x-auto">pip install pydoll-python</code>
                <button id="copyBtn" class="shrink-0 rounded-md bg-slate-800 px-3 py-1.5 text-xs font-semibold text-slate-100 hover:bg-slate-700">Copy</button>
              </div>
            </div>
            <!-- Quick code example -->
            <div class="mt-6">
              <p class="mb-2 text-sm text-slate-300">Quick example:</p>
              <pre class="language-python overflow-x-auto max-w-full rounded-lg border border-white/10 bg-slate-950 p-4"><code class="language-python">import asyncio
from pydoll.browser import Chrome

async def main():
    async with Chrome() as browser:
        tab = await browser.start()
        await tab.go_to('https://google.com')
        
        search_box = await tab.find(name='q')
        await search_box.type_text('Pydoll')
        await search_box.press_keyboard_key('Enter')

asyncio.run(main())
</code></pre>
            </div>
            <div class="mt-6 flex flex-wrap gap-3">
              <a href="https://pydoll.tech/docs/" target="_blank" rel="noopener" class="inline-flex items-center justify-center gap-2 rounded-md bg-white px-4 py-2 text-sm font-semibold text-slate-900 hover:bg-slate-200">Read the docs</a>
              <a href="https://github.com/sponsors/thalissonvs" target="_blank" rel="noopener" class="inline-flex items-center justify-center gap-2 rounded-md border border-white/10 px-4 py-2 text-sm font-semibold text-white/90 hover:bg-white/5">Support the project</a>
            </div>
          </div>
          <div class="reveal rounded-xl p-6 shadow-xl h-full flex flex-col justify-between">
            <div class="space-y-6">
              <div class="text-center space-y-4">
                <div class="mx-auto h-16 w-16 rounded-full bg-brand-500/10 flex items-center justify-center">
                  <svg class="h-8 w-8 text-brand-400" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round">
                    <polyline points="8,7 4,12 8,17"></polyline>
                    <polyline points="16,7 20,12 16,17"></polyline>
                  </svg>
                </div>
                <h3 class="text-lg font-semibold text-slate-200">Zero to automation in seconds</h3>
                <p class="text-sm text-slate-300">Install once, automate forever.<br/>No drivers, no config, no headaches.</p>
              </div>
              
              <div class="space-y-4 border border-white/10 pt-4 p-4 rounded-lg">
                <div class="flex items-start gap-3">
                  <div class="h-2 w-2 rounded-full bg-green-400 mt-1.5"></div>
                  <div class="flex-1">
                    <h4 class="text-sm font-medium text-slate-200">Async by design</h4>
                    <p class="text-xs text-slate-400 mt-1">Built for concurrent automation with true async/await support</p>
                  </div>
                </div>
                <div class="flex items-start gap-3">
                  <div class="h-2 w-2 rounded-full bg-blue-400 mt-1.5"></div>
                  <div class="flex-1">
                    <h4 class="text-sm font-medium text-slate-200">Type safe</h4>
                    <p class="text-xs text-slate-400 mt-1">Complete type annotations - your IDE knows exactly what each method returns</p>
                  </div>
                </div>
                <div class="flex items-start gap-3">
                  <div class="h-2 w-2 rounded-full bg-purple-400 mt-1.5"></div>
                  <div class="flex-1">
                    <h4 class="text-sm font-medium text-slate-200">CDP direct</h4>
                    <p class="text-xs text-slate-400 mt-1">No WebDrivers, no compatibility issues - direct Chrome connection</p>
                  </div>
                </div>
                <div class="flex items-start gap-3">
                  <div class="h-2 w-2 rounded-full bg-yellow-400 mt-1.5"></div>
                  <div class="flex-1">
                    <h4 class="text-sm font-medium text-slate-200">Intuitive API</h4>
                    <p class="text-xs text-slate-400 mt-1">Element finding feels like natural language - simple and readable</p>
                  </div>
                </div>
              </div>
            </div>

          </div>
        </div>
      </div>
    </section>


    <!-- Sponsors -->
    <section id="sponsors" class="mx-auto max-w-7xl px-4 py-10 sm:px-6 lg:px-8">
      <div class="reveal rounded-xl border border-white/10 bg-slate-900/60 p-5 sm:p-6">
        <div class="flex flex-col gap-4 sm:flex-row sm:items-center sm:justify-between">
          <div>
            <h2 class="text-2xl font-bold tracking-tight">Sponsors</h2>
            <p class="mt-1 text-sm text-slate-300">Companies and partners supporting Pydoll.</p>
          </div>
          <div>
            <a href="https://github.com/sponsors/thalissonvs" target="_blank" rel="noopener" class="inline-flex items-center gap-2 rounded-md bg-yellow-500 px-3 py-2 text-sm font-semibold text-slate-900 hover:bg-yellow-400">Become a sponsor</a>
          </div>
        </div>
        <ul id="sponsorsGrid" class="mt-6 grid grid-cols-2 sm:grid-cols-3 md:grid-cols-4 lg:grid-cols-5 gap-3 sm:gap-4 items-center"></ul>
      </div>
    </section>


    <!-- FAQ (near footer) -->
    <section id="faq" class="mx-auto max-w-7xl px-4 pt-4 pb-10 sm:px-6 lg:px-8">
        <div class="mb-6">
          <h2 class="text-2xl font-bold tracking-tight">Frequently asked questions</h2>
          <p class="mt-1 text-sm text-slate-300">Top questions about Pydoll, its features and use cases.</p>
        </div>
        <div class="grid gap-3 sm:gap-4 ">
          <details class="group rounded-lg border border-white/10 bg-slate-900/40 p-4 hover:shadow-[0_10px_30px_rgba(99,102,241,0.15)]">
            <summary class="flex cursor-pointer list-none items-center gap-2 font-medium text-slate-200">
              <svg class="h-4 w-4 text-slate-400 group-open:rotate-90 transition-transform" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" aria-hidden="true"><polyline points="9 18 15 12 9 6"/></svg>
              What is Pydoll and why doesn't it use WebDriver?
            </summary>
            <p class="mt-2 text-sm text-slate-300">Pydoll is a Python library that controls the browser via the <strong>Chrome DevTools Protocol (CDP)</strong>, eliminating WebDrivers. This reduces layers, improves reliability and gives direct access to advanced capabilities like page events, network interception and JavaScript execution in the real tab context.</p>
          </details>
          <details class="group rounded-lg border border-white/10 bg-slate-900/40 p-4 hover:shadow-[0_10px_30px_rgba(99,102,241,0.15)]">
            <summary class="flex cursor-pointer list-none items-center gap-2 font-medium text-slate-200">
              <svg class="h-4 w-4 text-slate-400 group-open:rotate-90 transition-transform" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" aria-hidden="true"><polyline points="9 18 15 12 9 6"/></svg>
              How does Pydoll's type safety work in practice?
            </summary>
            <p class="mt-2 text-sm text-slate-300">Every method is fully typed with precise return annotations. Your IDE knows that <code>await tab.find(id='btn')</code> returns <code>WebElement</code>, <code>find_all=True</code> returns <code>list[WebElement]</code>, and <code>raise_exc=False</code> returns <code>WebElement | None</code>. This eliminates guesswork and catches errors before runtime.</p>
          </details>
          <details class="group rounded-lg border border-white/10 bg-slate-900/40 p-4 hover:shadow-[0_10px_30px_rgba(99,102,241,0.15)]">
            <summary class="flex cursor-pointer list-none items-center gap-2 font-medium text-slate-200">
              <svg class="h-4 w-4 text-slate-400 group-open:rotate-90 transition-transform" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" aria-hidden="true"><polyline points="9 18 15 12 9 6"/></svg>
              What are “browser‑context requests” and when to use them?
            </summary>
            <p class="mt-2 text-sm text-slate-300">With <code>tab.request</code> you perform HTTP in the <strong>same context</strong> as the tab: cookies, session, headers and CORS are automatically inherited. Ideal for hybrid automation: log in via UI and then call the app's authenticated APIs with simplicity and speed.</p>
          </details>
          <details class="group rounded-lg border border-white/10 bg-slate-900/40 p-4 hover:shadow-[0_10px_30px_rgba(99,102,241,0.15)]">
            <summary class="flex cursor-pointer list-none items-center gap-2 font-medium text-slate-200">
              <svg class="h-4 w-4 text-slate-400 group-open:rotate-90 transition-transform" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" aria-hidden="true"><polyline points="9 18 15 12 9 6"/></svg>
              What makes Pydoll's setup so simple compared to other tools?
            </summary>
            <p class="mt-2 text-sm text-slate-300">Just <code>pip install pydoll-python</code> and you're ready. No WebDriver downloads, no PATH configuration, no version matching hell. Pydoll connects directly to Chrome via CDP, eliminating the entire driver layer that causes most automation headaches.</p>
          </details>
          <details class="group rounded-lg border border-white/10 bg-slate-900/40 p-4 hover:shadow-[0_10px_30px_rgba(99,102,241,0.15)]">
            <summary class="flex cursor-pointer list-none items-center gap-2 font-medium text-slate-200">
              <svg class="h-4 w-4 text-slate-400 group-open:rotate-90 transition-transform" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" aria-hidden="true"><polyline points="9 18 15 12 9 6"/></svg>
              How does concurrent automation work with multiple tabs?
            </summary>
            <p class="mt-2 text-sm text-slate-300">Pydoll is async-first, so you can run multiple tabs simultaneously with <code>asyncio.gather</code>. Create tabs with <code>await browser.new_tab()</code>, then process them in parallel. Each tab maintains its own session and state, giving you true concurrent automation without complexity.</p>
          </details>
        </div>
      </section>
    
    <!-- Final CTA (full width) -->
    <section class="mx-auto max-w-7xl px-4 pb-10 sm:px-6 lg:px-8">
      <div class="reveal rounded-xl border border-white/10 bg-slate-900/60 p-5 sm:p-6">
        <div class="flex flex-col gap-4 sm:flex-row sm:items-center sm:justify-between">
          <div>
          <h4 class="text-lg font-semibold">Enjoying Pydoll?</h4>
          <p class="mt-1 text-sm text-slate-200/90">Star it, contribute to the repo or sponsor the development.</p>
          </div>
          <div class="flex flex-wrap gap-2">
            <a href="https://github.com/autoscrape-labs/pydoll" target="_blank" rel="noopener" class="inline-flex items-center gap-2 rounded-md bg-yellow-500 px-3 py-2 text-sm font-semibold text-slate-900 hover:bg-yellow-400">⭐ Star</a>
            <a href="https://github.com/autoscrape-labs/pydoll/blob/main/CONTRIBUTING.md" target="_blank" rel="noopener" class="inline-flex items-center gap-2 rounded-md border border-white/10 px-3 py-2 text-sm font-semibold text-white/90 hover:bg-white/5">👩‍💻 Contribute</a>
            <a href="https://github.com/sponsors/thalissonvs" target="_blank" rel="noopener" class="inline-flex items-center gap-2 rounded-md bg-yellow-500 px-3 py-2 text-sm font-semibold text-slate-900 hover:bg-yellow-400">💖 Sponsor</a>
          </div>
        </div>
      </div>
    </section>

    <!-- Footer -->
    <footer class="border-t border-white/10">
      <div class="mx-auto max-w-7xl px-4 py-10 sm:px-6 lg:px-8">
        <div class="flex flex-col items-center justify-between gap-4 sm:flex-row">
          <div class="flex items-center gap-3">
            <img src="https://pydoll.tech/images/logo.png" alt="Pydoll" class="h-6 w-auto" />
            <p class="text-sm text-slate-400">Pydoll - making web automation simple and powerful</p>
          </div>
          <div class="flex items-center gap-3 text-sm text-slate-400">
            <a href="https://github.com/autoscrape-labs/pydoll" target="_blank" rel="noopener" class="hover:text-white">GitHub</a>
            <span aria-hidden="true">·</span>
            <a href="https://pydoll.tech/docs/" class="hover:text-white">Docs</a>
            <span aria-hidden="true">·</span>
            <a href="https://github.com/sponsors/thalissonvs" target="_blank" rel="noopener" class="hover:text-white">Sponsor</a>
          </div>
        </div>
      </div>
    </footer>

    <!-- JS -->
    <script src="https://cdn.jsdelivr.net/npm/prismjs@1.29.0/prism.min.js"></script>
    <script src="https://cdn.jsdelivr.net/npm/prismjs@1.29.0/components/prism-python.min.js"></script>
    <script>
      // Force Prism highlighting after DOM load
      document.addEventListener('DOMContentLoaded', function() {
        if (typeof Prism !== 'undefined') {
          Prism.highlightAll();
        }
      });
    </script>
    <script src="./script.js" defer></script>
  </body>
  </html>


================================================
FILE: public/robots.txt
================================================
User-agent: *
Disallow: /docs/search/
Disallow: /docs/404.html

Sitemap: https://pydoll.tech/sitemap.xml
Sitemap: https://pydoll.tech/docs/sitemap.xml

================================================
FILE: public/script.js
================================================
// Landing-page behaviour. Starts loading GitHub stats (star count, goal
// progress, latest stargazers) in the background and wires the interactive UI
// (cursor glow, copy buttons, reveal-on-scroll, tilt cards, modals, mobile
// menu) immediately, so the page stays usable while the network is slow or
// the GitHub API is unavailable.
(async () => {
  const repo = 'autoscrape-labs/pydoll'
  const apiUrl = `https://api.github.com/repos/${repo}`
  const TTL = 5 * 60 * 1000 // cache lifetime: 5 minutes
  // Evaluated once and shared by the cursor glow and the tilt cards.
  const prefersReducedMotion = window.matchMedia('(prefers-reduced-motion: reduce)').matches
  let repoStarsCount = 0

  // Simple localStorage cache with TTL. Entries are stored as { t, v } where
  // `t` is the write timestamp (ms) and `v` the cached value.
  const cacheGet = (key, maxAgeMs) => {
    try {
      const raw = localStorage.getItem(key)
      if (!raw) return null
      const parsed = JSON.parse(raw)
      if (!parsed || typeof parsed !== 'object') return null
      if (typeof parsed.t !== 'number') return null
      if (Date.now() - parsed.t > maxAgeMs) return null
      return parsed.v
    } catch (_) {
      // Storage unavailable or corrupt entry: treat as a cache miss.
      return null
    }
  }
  const cacheSet = (key, value) => {
    try {
      localStorage.setItem(key, JSON.stringify({ t: Date.now(), v: value }))
    } catch (_) {
      // Best effort: quota exceeded or storage disabled.
    }
  }

  // Stars and goal progress. Leaves the placeholders untouched on failure.
  const loadRepoStats = async () => {
    const cacheKey = `gh:repo:${repo}`
    let data = cacheGet(cacheKey, TTL)
    if (!data) {
      const res = await fetch(apiUrl, { headers: { 'Accept': 'application/vnd.github+json' } })
      if (res.ok) {
        data = await res.json()
        cacheSet(cacheKey, data)
      }
    }
    if (!data) return

    const starsCount = Number(data.stargazers_count ?? 0)
    repoStarsCount = starsCount
    const starsFmt = starsCount.toLocaleString('pt-BR')

    const starCount = document.getElementById('starCount')
    if (starCount) starCount.textContent = `${starsFmt}`

    // Update progress bar towards the 10k goal (clamped to 0-100%).
    const GOAL = 10000
    const pct = Math.max(0, Math.min(100, Math.round((starsCount / GOAL) * 100)))
    const bar = document.getElementById('starsProgressBar')
    const label = document.getElementById('starsProgressLabel')
    const pctLabel = document.getElementById('starsProgressPct')
    if (bar) bar.style.width = `${pct}%`
    if (label) label.textContent = `${starsFmt} / ${GOAL.toLocaleString('pt-BR')}`
    if (pctLabel) pctLabel.textContent = `${pct}%`
  }

  // Latest stargazers (last 10, newest first, filled from the previous page
  // if the last page is not full). The last page is derived from the star
  // count loaded by loadRepoStats; when that is unknown, page 1 is used.
  const loadStargazers = async () => {
    const perPage = 10
    const lastPage = Math.max(1, Math.ceil((repoStarsCount || 1) / perPage))

    const fetchPage = async (page) => {
      const cacheKey = `gh:stargazers:${repo}:p${page}:pp${perPage}`
      let payload = cacheGet(cacheKey, TTL)
      if (!payload) {
        const res = await fetch(`https://api.github.com/repos/${repo}/stargazers?per_page=${perPage}&page=${page}`, {
          headers: { 'Accept': 'application/vnd.github.v3.star+json' }
        })
        if (!res.ok) return []
        payload = await res.json()
        cacheSet(cacheKey, payload)
      }
      if (!Array.isArray(payload)) return []
      if (payload.length && (payload[0]?.user || payload[0]?.starred_at)) {
        return payload
          .map((it) => ({
            login: it?.user?.login,
            avatar_url: it?.user?.avatar_url,
            html_url: it?.user?.html_url || (it?.user?.login ? `https://github.com/${it.user.login}` : '#'),
            starred_at: it?.starred_at ? Date.parse(it.starred_at) : 0
          }))
          .filter((u) => u.login)
      }
      // Fallback if the server ignores star+json and returns plain users.
      return payload
        .map((u) => ({
          login: u?.login,
          avatar_url: u?.avatar_url,
          html_url: u?.html_url || (u?.login ? `https://github.com/${u.login}` : '#'),
          starred_at: 0
        }))
        .filter((u) => u.login)
    }

    let entries = await fetchPage(lastPage)
    if (entries.length < perPage && lastPage > 1) {
      const prev = await fetchPage(lastPage - 1)
      entries = entries.concat(prev)
    }

    // Sort newest first and cap to perPage
    entries.sort((a, b) => b.starred_at - a.starred_at)
    entries = entries.slice(0, perPage)

    // Render
    const list = document.getElementById('stargazersList')
    if (!list) return
    entries.forEach((u) => {
      const li = document.createElement('li')
      li.className = 'flex items-center gap-2'
      const a = document.createElement('a')
      a.href = u.html_url
      a.target = '_blank'
      a.rel = 'noopener'
      a.className = 'group inline-flex items-center gap-2 rounded-full border border-white/10 bg-slate-800/60 px-3 py-1.5 text-sm text-slate-200 hover:bg-slate-800'
      const img = document.createElement('img')
      img.src = u.avatar_url
      img.alt = u.login
      img.width = 22
      img.height = 22
      img.loading = 'lazy'
      img.decoding = 'async'
      img.className = 'h-[22px] w-[22px] rounded-full ring-1 ring-white/10'
      const span = document.createElement('span')
      span.textContent = u.login
      a.appendChild(img)
      a.appendChild(span)
      li.appendChild(a)
      list.appendChild(li)
    })
  }

  // Runs both GitHub steps in order; each one fails independently and
  // silently so the static placeholders stay in place.
  const loadGithubData = async () => {
    try {
      await loadRepoStats()
    } catch (_) {
      // noop: keep placeholders on failure
    }
    try {
      await loadStargazers()
    } catch (_) {
      // ignore
    }
  }

  // Kick off the network work now, but do NOT await it yet: the UI wiring
  // below must not wait for GitHub to answer.
  const githubLoad = loadGithubData()

  // Cursor glow effect (subtle follow)
  const glow = document.getElementById('cursorGlow')
  const hero = document.getElementById('hero')
  if (glow && hero) {
    let raf = 0
    let targetX = 0
    let targetY = 0
    let currentX = 0
    let currentY = 0

    const lerp = (a, b, t) => a + (b - a) * t

    const tick = () => {
      currentX = lerp(currentX, targetX, 0.18)
      currentY = lerp(currentY, targetY, 0.18)
      glow.style.transform = `translate(${currentX}px, ${currentY}px)`
      // Keep animating until the glow has (almost) caught up with the cursor.
      const distance = Math.abs(currentX - targetX) + Math.abs(currentY - targetY)
      raf = distance > 0.5 ? requestAnimationFrame(tick) : 0
    }
    const move = (e) => {
      const r = hero.getBoundingClientRect()
      // Coordinates relative to the hero section, centred on the glow
      targetX = e.clientX - r.left - glow.offsetWidth / 2
      targetY = e.clientY - r.top - glow.offsetHeight / 2
      if (!raf && !prefersReducedMotion) raf = requestAnimationFrame(tick)
    }
    hero.addEventListener('mousemove', move, { passive: true })
  }

  // Copy-to-clipboard buttons. The original label is captured only when no
  // reset is pending, so clicking again while "Copiado!" is showing can no
  // longer leave the button stuck on the feedback text.
  const readRenderedText = (el) => el.innerText || el.textContent || ''
  const bindCopyButton = (btn, source, readText, resetMs) => {
    if (!btn || !source) return
    let resetTimer = 0
    let originalLabel = ''
    btn.addEventListener('click', async () => {
      try {
        await navigator.clipboard.writeText(readText(source))
        if (resetTimer) clearTimeout(resetTimer)
        else originalLabel = btn.textContent
        btn.textContent = 'Copiado!'
        resetTimer = setTimeout(() => {
          btn.textContent = originalLabel
          resetTimer = 0
        }, resetMs)
      } catch (_) {
        // Clipboard unavailable or permission denied: leave the button as is.
      }
    })
  }
  const bindCopy = (btnId, codeElId) => {
    bindCopyButton(document.getElementById(btnId), document.getElementById(codeElId), readRenderedText, 1000)
  }

  // Copy install command
  bindCopyButton(
    document.getElementById('copyBtn'),
    document.getElementById('installCmd'),
    (el) => el.textContent ?? '',
    1200
  )
  // Copy concurrent code (modal)
  bindCopy('copyConcurrentCode', 'concurrentCodeBlock')
  // Copy buttons for vertical cards
  bindCopy('copyConcurrentBtn', 'codeConcurrent')
  bindCopy('copyRequestsBtn', 'codeRequests')
  bindCopy('copyPrefsBtn', 'codePrefs')

  // Reveal on scroll
  const revealEls = Array.from(document.querySelectorAll('.reveal'))
  if (revealEls.length) {
    const io = new IntersectionObserver((entries) => {
      for (const entry of entries) {
        if (entry.isIntersecting) {
          entry.target.classList.add('revealed')
          io.unobserve(entry.target) // reveal once only
        }
      }
    }, { rootMargin: '0px 0px -10% 0px', threshold: 0.12 })
    revealEls.forEach((el) => io.observe(el))
  }

  // Tilt cards
  const tiltCards = Array.from(document.querySelectorAll('.tilt-card'))
  tiltCards.forEach((card) => {
    let frame = 0
    const onMove = (e) => {
      if (prefersReducedMotion) return
      const r = card.getBoundingClientRect()
      const px = (e.clientX - r.left) / r.width
      const py = (e.clientY - r.top) / r.height
      const rotY = (px - 0.5) * 10
      const rotX = (0.5 - py) * 8
      const tx = (px - 0.5) * 8
      const ty = (py - 0.5) * 8
      // At most one style write per animation frame.
      if (!frame) frame = requestAnimationFrame(() => {
        card.style.transform = `perspective(1000px) rotateX(${rotX.toFixed(2)}deg) rotateY(${rotY.toFixed(2)}deg) translate3d(${tx.toFixed(2)}px, ${ty.toFixed(2)}px, 0)`
        frame = 0
      })
    }
    const onLeave = () => {
      card.style.transform = 'perspective(1000px)'
    }
    card.addEventListener('mousemove', onMove)
    card.addEventListener('mouseleave', onLeave)
  })

  // Modals: shown by swapping the `hidden` and `flex` classes; closed by the
  // close button, a click on the backdrop (the modal element itself) or Escape.
  const setModalVisible = (el, show) => {
    if (!el) return
    el.classList.toggle('hidden', !show)
    el.classList.toggle('flex', show)
  }
  const wireModal = (openEl, modalEl, closeEl) => {
    if (!modalEl) return
    if (openEl) openEl.addEventListener('click', () => setModalVisible(modalEl, true))
    if (closeEl) closeEl.addEventListener('click', () => setModalVisible(modalEl, false))
    modalEl.addEventListener('click', (e) => { if (e.target === modalEl) setModalVisible(modalEl, false) })
    document.addEventListener('keydown', (e) => { if (e.key === 'Escape') setModalVisible(modalEl, false) })
  }

  // Modal: concurrent automation
  wireModal(
    document.getElementById('openConcurrentModal'),
    document.getElementById('concurrentModal'),
    document.getElementById('closeConcurrentModal')
  )

  // Mobile menu toggle
  const mobileMenuButton = document.getElementById('mobileMenuButton')
  const mobileMenu = document.getElementById('mobileMenu')
  const iconMenu = document.getElementById('iconMenu')
  const iconClose = document.getElementById('iconClose')
  if (mobileMenuButton && mobileMenu && iconMenu && iconClose) {
    const setExpanded = (expanded) => {
      mobileMenuButton.setAttribute('aria-expanded', String(expanded))
      mobileMenu.classList.toggle('hidden', !expanded)
      iconMenu.classList.toggle('hidden', expanded)
      iconClose.classList.toggle('hidden', !expanded)
    }
    mobileMenuButton.addEventListener('click', () => {
      const isOpen = mobileMenuButton.getAttribute('aria-expanded') === 'true'
      setExpanded(!isOpen)
    })
    // Close on escape and when clicking links
    document.addEventListener('keydown', (e) => {
      if (e.key === 'Escape') setExpanded(false)
    })
    mobileMenu.addEventListener('click', (e) => {
      // closest() also matches clicks on elements nested inside a link
      // (icons, spans), which a plain tagName check on the target misses.
      const target = e.target
      if (target instanceof Element && target.closest('a')) setExpanded(false)
    })
  }

  // (The final CTA needs no additional JS)

  // Feature cards -> modals
  const modalMap = [
    { card: 'cardZeroConfig', modal: 'modalZeroConfig', close: 'closeZeroConfigModal' },
    { card: 'cardAsync', modal: 'modalAsync', close: 'closeAsyncModal' },
    { card: 'cardTypeSafety', modal: 'modalTypeSafety', close: 'closeTypeSafetyModal' },
    { card: 'cardRequests', modal: 'modalRequests', close: 'closeRequestsModal' },
    { card: 'cardIntuitive', modal: 'modalIntuitive', close: 'closeIntuitiveModal' },
    { card: 'cardEvents', modal: 'modalEvents', close: 'closeEventsModal' },
  ]
  modalMap.forEach(({ card, modal, close }) => {
    wireModal(
      document.getElementById(card),
      document.getElementById(modal),
      document.getElementById(close)
    )
  })

  // Finally wait for the background GitHub load (it never rejects).
  await githubLoad
})()


// Sponsor logos rendered by renderSponsors(). To add a sponsor, append a new
// entry to SPONSORS; every logo currently shares the same display box.
const SPONSOR_LOGO_BOX = { width: 200, height: 45 }

const SPONSORS = [
  {
    name: 'The Web Scraping Club',
    url: 'https://substack.thewebscraping.club/p/pydoll-webdriver-scraping?utm_source=github&utm_medium=repo&utm_campaign=pydoll',
    logo: '/images/logo-the-webscraping-club.png',
    ...SPONSOR_LOGO_BOX
  },
  {
    name: 'Thordata',
    url: 'https://www.thordata.com/?ls=github&lk=pydoll',
    logo: '/images/Thordata-logo.png',
    ...SPONSOR_LOGO_BOX
  },
  {
    name: 'LambdaTest',
    url: 'https://www.testmuai.com/?utm_medium=sponsor&utm_source=pydoll',
    logo: '/images/logo-lamda-test.svg',
    ...SPONSOR_LOGO_BOX
  },
  {
    name: 'CapSolver',
    url: 'https://dashboard.capsolver.com/passport/register?inviteCode=WPhTbOsbXEpc',
    logo: '/images/capsolver-logo.png',
    ...SPONSOR_LOGO_BOX
  }
]

/**
 * Replace the contents of the sponsors list with one linked logo per entry
 * in SPONSORS.
 *
 * @param {string} [gridId='sponsorsGrid'] - id of the list element to fill.
 *   Nothing happens when no element with that id exists.
 */
function renderSponsors(gridId = 'sponsorsGrid') {
  const grid = document.getElementById(gridId)
  if (!grid || !Array.isArray(SPONSORS)) return

  // Build <li><a><img></a></li> for a single sponsor.
  const buildItem = (sponsor) => {
    const img = Object.assign(document.createElement('img'), {
      src: sponsor.logo,
      alt: sponsor.name,
      loading: 'lazy',
      decoding: 'async',
      width: sponsor.width || 200,
      height: sponsor.height || 40,
      className: 'mx-auto max-h-10'
    })

    const link = Object.assign(document.createElement('a'), {
      href: sponsor.url,
      target: '_blank',
      rel: 'noopener nofollow sponsored',
      className: 'group block w-full rounded-lg bg-slate-900/40 px-4 py-3 hover:bg-white/5 transition-colors'
    })
    link.appendChild(img)

    const item = document.createElement('li')
    item.className = 'flex items-center justify-center'
    item.appendChild(link)
    return item
  }

  // Assemble off-DOM, then swap the list contents in one go.
  const fragment = document.createDocumentFragment()
  SPONSORS.forEach((sponsor) => fragment.appendChild(buildItem(sponsor)))
  grid.innerHTML = ''
  grid.appendChild(fragment)
}

// Render into the default grid once the document has been parsed.
document.addEventListener('DOMContentLoaded', function onDocumentReady() {
  renderSponsors()
})


================================================
FILE: public/scripts/extra.js
================================================
/**
 * Turn terminal-style code blocks into animated Termynal widgets.
 *
 * - Every `.use-termynal` node is shown and animated immediately.
 * - Every `.termy .highlight code` block is parsed line by line into
 *   Termynal line data and replaced by a widget that starts animating once
 *   it scrolls into view.
 *
 * Line syntax inside a `.termy` block:
 *   `---> 100%`        progress bar
 *   `$ cmd`            typed input
 *   `// text`          comment line
 *   `# prompt $ cmd`   typed input with a custom prompt
 *   anything else      plain output (consecutive lines are grouped)
 */
function setupTermynal() {
    document.querySelectorAll(".use-termynal").forEach(node => {
        node.style.display = "block";
        new Termynal(node, {
            lineDelay: 500
        });
    });
    const progressLiteralStart = "---> 100%";
    const promptLiteralStart = "$ ";
    const customPromptLiteralStart = "# ";
    const termynalActivateClass = "termy";
    let termynals = [];

    // Line values are injected by Termynal as HTML, but they come from
    // `textContent` (plain text), so markup characters must be escaped or
    // snippets such as `pip install "pkg<2"` would be parsed as tags.
    const escapeHtml = text => text
        .replace(/&/g, "&amp;")
        .replace(/</g, "&lt;")
        .replace(/>/g, "&gt;");

    function createTermynals() {
        document
            .querySelectorAll(`.${termynalActivateClass} .highlight code`)
            .forEach(node => {
                const text = node.textContent;
                const lines = text.split("\n");
                const useLines = [];
                let buffer = [];
                // Flush the pending plain-output lines as a single entry.
                function saveBuffer() {
                    if (!buffer.length) {
                        return;
                    }
                    const isBlankSpace = buffer.every(line => !line);
                    // Declared locally: the bare assignment used previously
                    // leaked `dataValue` as an implicit global.
                    const dataValue = {};
                    if (isBlankSpace) {
                        dataValue["delay"] = 0;
                    }
                    if (buffer[buffer.length - 1] === "") {
                        // A last single <br> won't have effect
                        // so put an additional one
                        buffer.push("");
                    }
                    dataValue["value"] = buffer.map(escapeHtml).join("<br>");
                    useLines.push(dataValue);
                    buffer = [];
                }
                for (let line of lines) {
                    if (line === progressLiteralStart) {
                        saveBuffer();
                        useLines.push({
                            type: "progress"
                        });
                    } else if (line.startsWith(promptLiteralStart)) {
                        saveBuffer();
                        const value = line.replace(promptLiteralStart, "").trimEnd();
                        useLines.push({
                            type: "input",
                            value: escapeHtml(value)
                        });
                    } else if (line.startsWith("// ")) {
                        saveBuffer();
                        const value = "💬 " + line.replace("// ", "").trimEnd();
                        useLines.push({
                            value: escapeHtml(value),
                            class: "termynal-comment",
                            delay: 0
                        });
                    } else if (line.startsWith(customPromptLiteralStart)) {
                        const promptStart = line.indexOf(promptLiteralStart);
                        if (promptStart === -1) {
                            // No "$ " delimiter: slicing with -1 would mangle
                            // the line, so keep it as plain output instead.
                            console.error("Custom prompt found but no end delimiter", line)
                            buffer.push(line);
                            continue;
                        }
                        saveBuffer();
                        // The prompt ends up in an attribute, not in element
                        // content, so it is passed through unescaped here.
                        const prompt = line.slice(0, promptStart).replace(customPromptLiteralStart, "")
                        const value = line.slice(promptStart + promptLiteralStart.length);
                        useLines.push({
                            type: "input",
                            value: escapeHtml(value),
                            prompt: prompt
                        });
                    } else {
                        buffer.push(line);
                    }
                }
                saveBuffer();
                const div = document.createElement("div");
                node.replaceWith(div);
                const termynal = new Termynal(div, {
                    lineData: useLines,
                    noInit: true,
                    lineDelay: 500
                });
                termynals.push(termynal);
            });
    }

    // Start every pending widget whose top edge is at or above the bottom of
    // the viewport; widgets further down stay pending.
    function loadVisibleTermynals() {
        termynals = termynals.filter(termynal => {
            if (termynal.container.getBoundingClientRect().top - innerHeight <= 0) {
                termynal.init();
                return false;
            }
            return true;
        });
        if (!termynals.length) {
            // Nothing left to start: drop the listener so repeated calls to
            // setupTermynal() do not pile up scroll handlers.
            window.removeEventListener("scroll", loadVisibleTermynals);
        }
    }
    window.addEventListener("scroll", loadVisibleTermynals);
    createTermynals();
    loadVisibleTermynals();
}

/**
 * Shuffle an array in place (Fisher-Yates) and return the same array.
 *
 * @param {Array} array - Array to shuffle; it is mutated.
 * @returns {Array} The array that was passed in.
 */
function shuffle(array) {
    // Walk the unshuffled prefix from the back, swapping its last slot with
    // a randomly chosen slot inside the prefix.
    for (let remaining = array.length; remaining > 0; remaining--) {
        const pick = Math.floor(Math.random() * remaining);
        const last = remaining - 1;
        [array[last], array[pick]] = [array[pick], array[last]];
    }
    return array;
}

/**
 * Cycle through the children of an announcement group in random order,
 * showing exactly one child at a time.
 *
 * Does nothing when the group element does not exist or has no children.
 *
 * @param {string} groupId - id of the element whose children are rotated.
 * @param {number} timeInterval - Time each child stays visible, in ms.
 */
async function showRandomAnnouncement(groupId, timeInterval) {
    const group = document.getElementById(groupId);
    if (!group) {
        return;
    }
    const children = shuffle(Array.from(group.children));
    if (!children.length) {
        // An empty group would otherwise throw on `children[0].style` and
        // turn the index into NaN via `% 0`.
        return;
    }
    let index = 0;
    const announceRandom = () => {
        children.forEach(el => { el.style.display = "none" });
        children[index].style.display = "block";
        index = (index + 1) % children.length;
    };
    announceRandom();
    setInterval(announceRandom, timeInterval);
}

/**
 * Page entry point: set up the terminal widgets and start both announcement
 * rotations (left every 5 s, right every 10 s).
 */
async function main() {
    setupTermynal();
    const rotations = [
        ['announce-left', 5000],
        ['announce-right', 10000]
    ];
    for (const [groupId, intervalMs] of rotations) {
        showRandomAnnouncement(groupId, intervalMs);
    }
}

// Run main() for every value emitted by the `document$` observable.
document$.subscribe(function onDocument() {
    main();
});

================================================
FILE: public/scripts/termynal.js
================================================
/**
 * termynal.js
 * A lightweight, modern and extensible animated terminal window, using
 * async/await.
 *
 * @author Ines Montani <ines@ines.io>
 * @version 0.0.1
 * @license MIT
 */

'use strict';

/**
 * Generate a terminal widget.
 *
 * Lines come from two sources: child elements of the container carrying the
 * `data-<prefix>` attribute, and `options.lineData` objects converted to
 * elements. The widget animates them in order and adds "fast" and "restart"
 * controls.
 */
class Termynal {
    /**
     * Construct the widget's settings.
     *
     * Each numeric/character setting is resolved as: explicit option, then
     * the container's `data-<prefix>-<name>` attribute, then the default.
     *
     * @param {(string|Node)=} container - Query selector or container element.
     * @param {Object=} options - Custom settings.
     * @param {string} options.prefix - Prefix to use for data attributes.
     * @param {number} options.startDelay - Delay before animation, in ms.
     * @param {number} options.typeDelay - Delay between each typed character, in ms.
     * @param {number} options.lineDelay - Delay between each line, in ms.
     * @param {number} options.progressLength - Number of characters displayed as progress bar.
     * @param {string} options.progressChar - Character to use for progress bar, defaults to █.
     * @param {number} options.progressPercent - Max percent of progress.
     * @param {string} options.cursor - Character to use for cursor, defaults to ▋.
     * @param {Object[]} options.lineData - Dynamically loaded line data objects.
     * @param {boolean} options.noInit - Don't initialise the animation.
     */
    constructor(container = '#termynal', options = {}) {
        this.container = (typeof container === 'string') ? document.querySelector(container) : container;
        this.pfx = `data-${options.prefix || 'ty'}`;
        // The "original" delays are kept so they can be restored after the
        // "fast" control has zeroed the live values.
        this.originalStartDelay = this.startDelay = options.startDelay
            || parseFloat(this.container.getAttribute(`${this.pfx}-startDelay`)) || 600;
        this.originalTypeDelay = this.typeDelay = options.typeDelay
            || parseFloat(this.container.getAttribute(`${this.pfx}-typeDelay`)) || 90;
        this.originalLineDelay = this.lineDelay = options.lineDelay
            || parseFloat(this.container.getAttribute(`${this.pfx}-lineDelay`)) || 1500;
        this.progressLength = options.progressLength
            || parseFloat(this.container.getAttribute(`${this.pfx}-progressLength`)) || 40;
        this.progressChar = options.progressChar
            || this.container.getAttribute(`${this.pfx}-progressChar`) || '█';
        this.progressPercent = options.progressPercent
            || parseFloat(this.container.getAttribute(`${this.pfx}-progressPercent`)) || 100;
        this.cursor = options.cursor
            || this.container.getAttribute(`${this.pfx}-cursor`) || '▋';
        this.lineData = this.lineDataToElements(options.lineData || []);
        this.loadLines()
        if (!options.noInit) this.init()
    }

    /**
     * Collect all lines and append them, hidden, to the container.
     */
    loadLines() {
        // Load all the lines and create the container so that the size is fixed.
        // Otherwise it would be changing and the user's viewport would be
        // constantly moving as they scroll.
        const finish = this.generateFinish()
        finish.style.visibility = 'hidden'
        this.container.appendChild(finish)
        // Appends dynamically loaded lines to existing line elements.
        this.lines = [...this.container.querySelectorAll(`[${this.pfx}]`)].concat(this.lineData);
        for (let line of this.lines) {
            line.style.visibility = 'hidden'
            this.container.appendChild(line)
        }
        const restart = this.generateRestart()
        restart.style.visibility = 'hidden'
        this.container.appendChild(restart)
        this.container.setAttribute('data-termynal', '');
    }

    /**
     * Initialise the widget, get lines, clear container and start animation.
     */
    init() {
        /**
         * Calculates width and height of Termynal container.
         * If container is empty and lines are dynamically loaded, defaults to browser `auto` or CSS.
         */
        const containerStyle = getComputedStyle(this.container);
        this.container.style.width = containerStyle.width !== '0px' ?
            containerStyle.width : undefined;
        this.container.style.minHeight = containerStyle.height !== '0px' ?
            containerStyle.height : undefined;

        this.container.setAttribute('data-termynal', '');
        this.container.innerHTML = '';
        for (let line of this.lines) {
            line.style.visibility = 'visible'
        }
        this.start();
    }

    /**
     * Start the animation and render the lines depending on their data attributes.
     */
    async start() {
        this.addFinish()
        await this._wait(this.startDelay);

        for (let line of this.lines) {
            const type = line.getAttribute(this.pfx);
            const delay = line.getAttribute(`${this.pfx}-delay`) || this.lineDelay;

            if (type == 'input') {
                line.setAttribute(`${this.pfx}-cursor`, this.cursor);
                await this.type(line);
                await this._wait(delay);
            }

            else if (type == 'progress') {
                await this.progress(line);
                await this._wait(delay);
            }

            else {
                this.container.appendChild(line);
                await this._wait(delay);
            }

            line.removeAttribute(`${this.pfx}-cursor`);
        }
        this.addRestart()
        this.finishElement.style.visibility = 'hidden'
        // Undo the effect of the "fast" control for the next run.
        this.lineDelay = this.originalLineDelay
        this.typeDelay = this.originalTypeDelay
        this.startDelay = this.originalStartDelay
    }

    /**
     * Create the "restart" control, which clears the container and replays
     * the animation when clicked.
     * @returns {HTMLAnchorElement} The control element (not yet attached).
     */
    generateRestart() {
        const restart = document.createElement('a')
        restart.onclick = (e) => {
            e.preventDefault()
            this.container.innerHTML = ''
            this.init()
        }
        restart.href = '#'
        restart.setAttribute('data-terminal-control', '')
        restart.innerHTML = "restart ↻"
        return restart
    }

    /**
     * Create the "fast" control, which sets all delays to zero when clicked,
     * and remember it as `this.finishElement`.
     * @returns {HTMLAnchorElement} The control element (not yet attached).
     */
    generateFinish() {
        const finish = document.createElement('a')
        finish.onclick = (e) => {
            e.preventDefault()
            this.lineDelay = 0
            this.typeDelay = 0
            this.startDelay = 0
        }
        finish.href = '#'
        finish.setAttribute('data-terminal-control', '')
        finish.innerHTML = "fast →"
        this.finishElement = finish
        return finish
    }

    /** Append a fresh "restart" control to the container. */
    addRestart() {
        const restart = this.generateRestart()
        this.container.appendChild(restart)
    }

    /** Append a fresh "fast" control to the container. */
    addFinish() {
        const finish = this.generateFinish()
        this.container.appendChild(finish)
    }

    /**
     * Animate a typed line.
     * @param {Node} line - The line element to render.
     */
    async type(line) {
        const chars = [...line.textContent];
        line.textContent = '';
        this.container.appendChild(line);

        for (let char of chars) {
            // Read inside the loop so a click on "fast" takes effect mid-line.
            const delay = line.getAttribute(`${this.pfx}-typeDelay`) || this.typeDelay;
            await this._wait(delay);
            line.textContent += char;
        }
    }

    /**
     * Animate a progress bar.
     * @param {Node} line - The line element to render.
     */
    async progress(line) {
        const progressLength = line.getAttribute(`${this.pfx}-progressLength`)
            || this.progressLength;
        const progressChar = line.getAttribute(`${this.pfx}-progressChar`)
            || this.progressChar;
        const chars = progressChar.repeat(progressLength);
        const progressPercent = line.getAttribute(`${this.pfx}-progressPercent`)
            || this.progressPercent;
        line.textContent = '';
        this.container.appendChild(line);

        for (let i = 1; i < chars.length + 1; i++) {
            await this._wait(this.typeDelay);
            const percent = Math.round(i / chars.length * 100);
            line.textContent = `${chars.slice(0, i)} ${percent}%`;
            // Stop once the configured maximum percentage has been passed.
            if (percent > progressPercent) {
                break;
            }
        }
    }

    /**
     * Helper function for animation delays, called with `await`.
     * @param {number} time - Timeout, in ms.
     */
    _wait(time) {
        return new Promise(resolve => setTimeout(resolve, time));
    }

    /**
     * Converts line data objects into line elements.
     *
     * `line.value` is inserted as HTML, so callers must escape plain text.
     *
     * @param {Object[]} lineData - Dynamically loaded lines.
     * @param {Object} line - Line data object.
     * @returns {Element[]} - Array of line elements.
     */
    lineDataToElements(lineData) {
        return lineData.map(line => {
            let div = document.createElement('div');
            div.innerHTML = `<span ${this._attributes(line)}>${line.value || ''}</span>`;

            return div.firstElementChild;
        });
    }

    /**
     * Helper function for generating attributes string.
     *
     * `type` becomes the bare prefix attribute, `class` a regular class
     * attribute, `value` is skipped, and every other property becomes
     * `<prefix>-<prop>`. Values are always double-quoted and escaped, so
     * multi-class strings and values containing `"` or `&` stay intact.
     *
     * @param {Object} line - Line data object.
     * @returns {string} - String of attributes.
     */
    _attributes(line) {
        const escapeAttr = value => String(value)
            .replace(/&/g, '&amp;')
            .replace(/"/g, '&quot;');
        let attrs = '';
        for (let prop in line) {
            if (prop === 'value') {
                continue
            }
            const value = escapeAttr(line[prop]);
            if (prop === 'class') {
                // Custom add class
                attrs += ` class="${value}" `
            } else if (prop === 'type') {
                attrs += `${this.pfx}="${value}" `
            } else {
                attrs += `${this.pfx}-${prop}="${value}" `
            }
        }

        return attrs;
    }
}

/**
 * HTML API: If the current script has container(s) specified via the
 * `data-termynal-container` attribute (selectors separated by `|`),
 * initialise one Termynal per selector.
 *
 * `document.currentScript` is null when this file is not being executed as
 * a classic <script> element (e.g. loaded as a module), so it is checked
 * before use instead of throwing.
 */
{
    const currentScript = document.currentScript;
    if (currentScript && currentScript.hasAttribute('data-termynal-container')) {
        const containers = currentScript.getAttribute('data-termynal-container');
        containers.split('|')
            .forEach(container => new Termynal(container))
    }
}

================================================
FILE: public/sitemap.xml
================================================
<?xml version="1.0" encoding="UTF-8"?>
<urlset xmlns="http://www.sitemaps.org/schemas/sitemap/0.9">
  <url>
    <loc>https://pydoll.tech/</loc>
    <lastmod>2025-11-04</lastmod>
    <changefreq>weekly</changefreq>
    <priority>1.0</priority>
  </url>
  <url>
    <loc>https://pydoll.tech/docs/</loc>
    <lastmod>2025-11-04</lastmod>
    <changefreq>weekly</changefreq>
    <priority>0.9</priority>
  </url>
  <url>
    <loc>https://pydoll.tech/docs/pt/</loc>
    <lastmod>2025-11-04</lastmod>
    <changefreq>weekly</changefreq>
    <priority>0.8</priority>
  </url>
  <url>
    <loc>https://pydoll.tech/docs/zh/</loc>
    <lastmod>2025-11-04</lastmod>
    <changefreq>weekly</changefreq>
    <priority>0.8</priority>
  </url>
</urlset>


================================================
FILE: public/stylesheets/extra.css
================================================
.termynal-comment {
  color: #4a968f;
  font-style: italic;
  display: block;
}

.termy {
  /* For right to left languages */
  direction: ltr;
}

.termy [data-termynal] {
  white-space: pre-wrap;
}

.termy .linenos {
  display: none;
}

.label-class {
  background-color: #1e88e5;
  color: white;
  padding: 2px 6px;
  font-size: 0.75em;
  border-radius: 4px;
  font-family: monospace;
}

.label-attr {
  background-color: #fb8c00;
  color: white;
  padding: 2px 6px;
  font-size: 0.75em;
  border-radius: 4px;
  font-family: monospace;
}

.label-meth {
  background-color: #43a047;
  color: white;
  padding: 2px 6px;
  font-size: 0.75em;
  border-radius: 4px;
  font-family: monospace;
}


[data-md-color-scheme="default"] {
  --md-primary-fg-color:        #0D141C;
  --md-primary-fg-color--light: #3a7e9d;
  --md-primary-fg-color--dark:  #004059;
  
  --md-accent-fg-color: #0091d0;
  --md-accent-bg-color: rgba(0, 145, 208, 0.1);
  
  /* Custom background color */
  --md-default-bg-color: #E2ECED;
}

[data-md-color-scheme="slate"] {
  --md-primary-fg-color:        #2b1d43;
  --md-primary-fg-color--light: #b4b7bc;
  --md-primary-fg-color--dark:  #2b1d43;

  --md-accent-fg-color: #8caabf;
  --md-accent-bg-color: rgba(140, 170, 191, 0.1);
  
  --md-default-bg-color: #0D141C;
  --md-default-fg-color: #ffffff;
}


/* Links inside h1-h3 headings in dark mode: take the heading's own color. */
[data-md-color-scheme="slate"] .md-content h3 a,
[data-md-color-scheme="slate"] .md-content h2 a,
[data-md-color-scheme="slate"] .md-content h1 a {
  color: inherit !important;
  text-decoration: none;
}

[data-md-color-scheme="slate"] .md-content h3 a:hover,
[data-md-color-scheme="slate"] .md-content h2 a:hover,
[data-md-color-scheme="slate"] .md-content h1 a:hover {
  text-decoration: underline;
  opacity: 0.8;
}

/* Fix links inside headings in light mode */
[data-md-color-scheme="default"] .md-content h3 a,
[data-md-color-scheme="default"] .md-content h2 a,
[data-md-color-scheme="default"] .md-content h1 a {
  color: inherit !important; /* Inherit the color of the parent heading */
  text-decoration: none;
}

[data-md-color-scheme="default"] .md-content h3 a:hover,
[data-md-color-scheme="default"] .md-content h2 a:hover,
[data-md-color-scheme="default"] .md-content h1 a:hover {
  text-decoration: underline;
  opacity: 0.8;
}

/* Basic style for active navigation links - light mode */
/* NOTE(review): later scheme-specific `.md-nav__link--active` rules in this file
   set `color` with `!important`, so this `color` likely only applies outside the
   "default" and "slate" schemes - confirm. */
.md-nav__link--active {
  font-weight: bold;
  color: var(--md-accent-fg-color);
}

/* Override the color for dark mode only */
/* NOTE(review): a later rule with this same selector sets `color` with
   `!important`; this value appears to be superseded - confirm before relying on it. */
[data-md-color-scheme="slate"] .md-nav__link--active {
  color: #b4c0dd; /* Light color for contrast in dark mode */
}

/* Custom logo */
/* Hide the theme's own logo image/svg; the logo is drawn as a background image below. */
.md-header__button.md-logo img,
.md-header__button.md-logo svg {
  display: none;
}

.md-header__button.md-logo {
  background-image: url('../images/logo.png');
  background-size: contain;
  background-repeat: no-repeat;
  background-position: center;
  width: 100px;
  height: 50px;
}

/* Empty pseudo-element that fills the logo button's box. */
.md-header__button.md-logo:before {
  content: '';
  display: block;
  width: 100%;
  height: 100%;
}

/* Hide the site name in the header */
.md-header__topic {
  display: none;
}

/* Automatic theme-based logo for the index page */
/* Hide all logo images by default */
.md-content img[alt="Pydoll Logo"] {
  display: none;
}

/* Light mode - show logo-black.png */
[data-md-color-scheme="default"] .md-content img[alt="Pydoll Logo"] {
  display: block;
  content: url('../images/logo-black.png');
}

/* Dark mode - show logo.png */
[data-md-color-scheme="slate"] .md-content img[alt="Pydoll Logo"] {
  display: block;
  content: url('../images/logo.png');
}

/* ===== LINK IMPROVEMENTS FOR DARK MODE ===== */

/* General content links - dark mode */
[data-md-color-scheme="slate"] .md-content a {
  color: #64b5f6 !important; /* Light blue for good visibility */
  text-decoration: none;
}

[data-md-color-scheme="slate"] .md-content a:hover {
  color: #90caf9 !important; /* Lighter blue on hover */
  text-decoration: underline;
}

/* Sidebar navigation links - dark mode */
[data-md-color-scheme="slate"] .md-nav__link {
  color: #e0e0e0 !important; /* Light grey for normal links */
}

[data-md-color-scheme="slate"] .md-nav__link:hover {
  color: #ffffff !important; /* White on hover */
}

[data-md-color-scheme="slate"] .md-nav__link--active {
  color: #90caf9 !important; /* Light blue for the active link (same value as the content-link hover color) */
  font-weight: bold;
}

/* Links in tables - dark mode */
[data-md-color-scheme="slate"] .md-typeset table a {
  color: #64b5f6 !important;
}

[data-md-color-scheme="slate"] .md-typeset table a:hover {
  color: #90caf9 !important;
}

/* Links in lists - dark mode */
[data-md-color-scheme="slate"] .md-typeset ul a,
[data-md-color-scheme="slate"] .md-typeset ol a {
  color: #64b5f6 !important;
}

[data-md-color-scheme="slate"] .md-typeset ul a:hover,
[data-md-color-scheme="slate"] .md-typeset ol a:hover {
  color: #90caf9 !important;
}

/* Links in admonitions (callout boxes) - dark mode */
[data-md-color-scheme="slate"] .md-typeset .admonition a {
  color: #64b5f6 !important;
}

[data-md-color-scheme="slate"] .md-typeset .admonition a:hover {
  color: #90caf9 !important;
}

/* ===== LINK IMPROVEMENTS FOR LIGHT MODE ===== */

/* General content links - light mode */
[data-md-color-scheme="default"] .md-content a {
  color: #1976d2 !important; /* Dark blue for good visibility */
  text-decoration: none;
}

[data-md-color-scheme="default"] .md-content a:hover {
  color: #1565c0 !important; /* Darker blue on hover */
  text-decoration: underline;
}

/* Sidebar navigation links - light mode */
[data-md-color-scheme="default"] .md-nav__link {
  color: #424242 !important; /* Dark grey for normal links */
}

[data-md-color-scheme="default"] .md-nav__link:hover {
  color: #1976d2 !important; /* Blue on hover */
}

[data-md-color-scheme="default"] .md-nav__link--active {
  color: #2e7d32 !important; /* Dark green for the active link */
  font-weight: bold;
}

/* Links in tables - light mode */
[data-md-color-scheme="default"] .md-typeset table a {
  color: #1976d2 !important;
}

[data-md-color-scheme="default"] .md-typeset table a:hover {
  color: #1565c0 !important;
}


================================================
FILE: public/stylesheets/termynal.css
================================================
/**
 * termynal.js
 *
 * @author Ines Montani <ines@ines.io>
 * @version 0.0.1
 * @license MIT
 */

 /* Palette shared by the terminal widget rules below. */
 :root {
    --color-bg: #252a33;
    --color-text: #eee;
    --color-text-subtle: #a2a2a2;
}

/* The terminal window itself; the large top padding leaves room for the
   pseudo-element "title bar" drawn by :before and :after. */
[data-termynal] {
    width: 750px;
    max-width: 100%;
    background: var(--color-bg);
    color: var(--color-text);
    /* font-size: 18px; */
    font-size: 15px;
    /* font-family: 'Fira Mono', Consolas, Menlo, Monaco, 'Courier New', Courier, monospace; */
    font-family: 'Roboto Mono', 'Fira Mono', Consolas, Menlo, Monaco, 'Courier New', Courier, monospace;
    border-radius: 4px;
    padding: 75px 45px 35px;
    position: relative;
    -webkit-box-sizing: border-box;
            box-sizing: border-box;
    /* Custom line-height */
    line-height: 1.2;
}

[data-termynal]:before {
    content: '';
    position: absolute;
    top: 15px;
    left: 15px;
    display: inline-block;
    width: 15px;
    height: 15px;
    border-radius: 50%;
    /* A little hack to display the window buttons in one pseudo element:
       the element is the first dot, the two box-shadows are the other two. */
    background: #d9515d;
    -webkit-box-shadow: 25px 0 0 #f4c025, 50px 0 0 #3ec930;
            box-shadow: 25px 0 0 #f4c025, 50px 0 0 #3ec930;
}

/* Centered window title text. */
[data-termynal]:after {
    content: 'bash';
    position: absolute;
    color: var(--color-text-subtle);
    top: 5px;
    left: 0;
    width: 100%;
    text-align: center;
}

/* Right-aligned control link for the terminal widget. */
a[data-terminal-control] {
    text-align: right;
    display: block;
    color: #aebbff;
}

/* Each terminal line is its own block. */
[data-ty] {
    display: block;
    line-height: 2;
}

[data-ty]:before {
    /* Set up defaults and ensure empty lines are displayed. */
    content: '';
    display: inline-block;
    vertical-align: middle;
}

/* Spacing and color of the prompt shown before input lines. */
[data-ty="input"]:before,
[data-ty-prompt]:before {
    margin-right: 0.75em;
    color: var(--color-text-subtle);
}

/* Default prompt for input lines. */
[data-ty="input"]:before {
    content: '$';
}

/* Custom prompt taken from the data-ty-prompt attribute. */
[data-ty][data-ty-prompt]:before {
    content: attr(data-ty-prompt);
}

/* Blinking cursor; its glyph comes from the data-ty-cursor attribute. */
[data-ty-cursor]:after {
    content: attr(data-ty-cursor);
    font-family: monospace;
    margin-left: 0.5em;
    -webkit-animation: blink 1s infinite;
            animation: blink 1s infinite;
}


/* Cursor animation: fully transparent at the midpoint of each cycle. */

@-webkit-keyframes blink {
    50% {
        opacity: 0;
    }
}

@keyframes blink {
    50% {
        opacity: 0;
    }
}

================================================
FILE: pydoll/__init__.py
================================================


================================================
FILE: pydoll/browser/__init__.py
================================================
from pydoll.browser.chromium.chrome import Chrome
from pydoll.browser.chromium.edge import Edge

__all__ = ['Chrome', 'Edge']


================================================
FILE: pydoll/browser/chromium/__init__.py
================================================
from pydoll.browser.chromium.chrome import Chrome
from pydoll.browser.chromium.edge import Edge

__all__ = [
    'Edge',
    'Chrome',
]


================================================
FILE: pydoll/browser/chromium/base.py
================================================
from __future__ import annotations

import asyncio
import json
import logging
import os
import shutil
import warnings
from abc import ABC, abstractmethod
from contextlib import suppress
from functools import partial
from random import randint
from typing import TYPE_CHECKING, Any, Awaitable, Callable, Optional, overload
from urllib.parse import urlsplit, urlunsplit

from pydoll.browser.managers import (
    BrowserProcessManager,
    ProxyManager,
    TempDirectoryManager,
)
from pydoll.browser.tab import Tab
from pydoll.commands import (
    BrowserCommands,
    EmulationCommands,
    FetchCommands,
    PageCommands,
    RuntimeCommands,
    StorageCommands,
    TargetCommands,
)
from pydoll.connection import ConnectionHandler
from pydoll.exceptions import (
    BrowserNotRunning,
    FailedToStartBrowser,
    InvalidConnectionPort,
    InvalidWebSocketAddress,
    MissingTargetOrWebSocket,
    NoValidTabFound,
)
from pydoll.protocol.browser.types import DownloadBehavior
from pydoll.protocol.fetch.events import FetchEvent
from pydoll.protocol.fetch.types import AuthChallengeResponseType
from pydoll.utils.user_agent_parser import UserAgentParser

if TYPE_CHECKING:
    from tempfile import TemporaryDirectory

    from pydoll.browser.interfaces import BrowserOptionsManager
    from pydoll.protocol.base import Command, Response, T_CommandParams, T_CommandResponse
    from pydoll.protocol.browser.methods import (
        GetVersionResponse,
        GetVersionResult,
        GetWindowForTargetResponse,
    )
    from pydoll.protocol.browser.types import Bounds, PermissionType
    from pydoll.protocol.fetch.events import RequestPausedEvent
    from pydoll.protocol.fetch.types import HeaderEntry
    from pydoll.protocol.network.types import (
        Cookie,
        CookieParam,
        ErrorReason,
        RequestMethod,
        ResourceType,
    )
    from pydoll.protocol.storage.methods import GetCookiesResponse
    from pydoll.protocol.target.methods import (
        CreateBrowserContextResponse,
        CreateTargetResponse,
        GetBrowserContextsResponse,
        GetTargetsResponse,
    )
    from pydoll.protocol.target.types import TargetInfo

logger = logging.getLogger(__name__)


class Browser(ABC):  # noqa: PLR0904
    """
    Abstract base class for browser automation using Chrome DevTools Protocol.

    Provides comprehensive browser control including lifecycle management,
    context handling, network interception, cookie management, and CDP commands.
    """

    def __init__(
        self,
        options_manager: BrowserOptionsManager,
        connection_port: Optional[int] = None,
    ):
        """
        Set up the managers and bookkeeping a browser session needs.

        Nothing is launched here; call start() to actually run the browser.

        Args:
            options_manager: Supplies the browser options through its
                initialize_options() method.
            connection_port: CDP port to use. When omitted (or otherwise falsy),
                a random port between 9223 and 9322 is picked.
        """
        self._validate_connection_port(connection_port)
        self.options = options_manager.initialize_options()
        self._proxy_manager = ProxyManager(self.options)
        self._connection_port = connection_port or randint(9223, 9322)
        self._browser_process_manager = BrowserProcessManager()
        self._temp_directory_manager = TempDirectoryManager()
        self._connection_handler = ConnectionHandler(self._connection_port)

        # Plain session state, filled in as the browser is used.
        self._ws_address: Optional[str] = None
        self._backup_preferences_dir = ''
        self._tabs_opened: dict[str, Tab] = {}
        self._context_proxy_auth: dict[str, tuple[str, str]] = {}

        headless_flag = getattr(self.options, "headless", None)
        logger.debug(
            f'Browser initialized: port={self._connection_port}, headless={headless_flag}'
        )

    async def __aenter__(self) -> 'Browser':
        """Enter the async context; logs the entry and hands back this instance."""
        logger.debug('Entering browser async context')
        return self

    async def __aexit__(self, exc_type, exc_val, exc_tb):
        """
        Async context manager exit with cleanup.

        Steps, in order:
            1. If a preferences backup path was recorded, copy it back over
               ``<user_data_dir>/Default/Preferences``.
            2. If the browser still answers within 2 seconds, stop it.
            3. Close the connection handler.

        Steps 2 and 3 run even when an earlier step raises, so a failed
        preferences restore (or a failing stop()) cannot leave the browser
        process running or the connection open. The original error still
        propagates; exceptions from the ``async with`` body are never suppressed.
        """
        logger.debug(f'Exiting browser async context: exc_type={exc_type}')
        try:
            if self._backup_preferences_dir:
                logger.debug(
                    f'Restoring backup preferences directory: {self._backup_preferences_dir}'
                )
                user_data_dir = self._get_user_data_dir()
                shutil.copy2(
                    self._backup_preferences_dir,
                    os.path.join(user_data_dir, 'Default', 'Preferences'),
                )
        finally:
            try:
                if await self._is_browser_running(timeout=2):
                    await self.stop()
            finally:
                # Always release the connection, whatever happened above.
                await self._connection_handler.close()

    async def connect(self, ws_address: str) -> Tab:
        """
        Connect to browser using WebSocket address. When we set
        the _ws_address attribute, the connection handler will use
        this address instead of resolving it from the connection port.

        Args:
            ws_address: WebSocket address of the browser.

        Returns:
            The first tab in the list of opened tabs.

        Raises:
            NoValidTabFound: If the browser exposes no page tab to attach to.

        Note:
            You are supposed to use this method only if you want to connect to a browser
            that is already running.
        """
        logger.info(f'Connecting to browser via WebSocket: {ws_address}')
        await self._setup_ws_address(ws_address)
        tabs = await self.get_opened_tabs()
        logger.info(f'Connected. Tabs available: {len(tabs)}')
        if not tabs:
            # Indexing an empty list would surface as an opaque IndexError.
            logger.error('Connected to browser but no page tabs are available')
            raise NoValidTabFound()
        return tabs[0]

    async def start(self, headless: bool = False) -> Tab:
        """
        Start browser process and establish CDP connection.

        The sequence is: resolve the binary, set up the user data directory,
        read proxy credentials, launch the process on the configured port,
        wait until it responds, configure the proxy, then attach a Tab to a
        valid existing target and register it in ``_tabs_opened``.

        Args:
            headless: Deprecated. Use `options.headless = True` instead.
                A truthy value emits a DeprecationWarning and is copied onto
                ``self.options.headless``; a falsy value leaves the options untouched.

        Returns:
            Initial tab for interaction.

        Raises:
            FailedToStartBrowser: If the browser fails to start or connect.
        """
        if headless:
            warnings.warn(
                "The 'headless' parameter is deprecated and will be removed in a future version. "
                'Use `options.headless = True` instead.',
                DeprecationWarning,
                stacklevel=2,
            )
            self.options.headless = headless

        # An explicitly configured binary wins over the subclass default.
        binary_location = self.options.binary_location or self._get_default_binary_location()
        logger.debug('Resolved binary location: %s', binary_location)

        self._setup_user_dir()
        logger.debug('User data directory configured')
        # Read before launch, applied after the browser is responsive (see below).
        # NOTE(review): presumably this also prepares options.arguments for launch - confirm.
        proxy_config = self._proxy_manager.get_proxy_credentials()

        logger.info(f'Starting browser process on port {self._connection_port}')
        self._browser_process_manager.start_browser_process(
            binary_location, self._connection_port, self.options.arguments
        )
        await self._verify_browser_running()
        logger.info('Browser process started and responsive')
        await self._configure_proxy(proxy_config[0], proxy_config[1])

        # Attach to a target the browser already has instead of creating a new one.
        valid_tab_id = await self._get_valid_tab_id(await self.get_targets())
        tab = Tab(self, target_id=valid_tab_id, connection_port=self._connection_port)
        self._tabs_opened[valid_tab_id] = tab
        await self._apply_user_agent_override(tab)
        logger.info(f'Initial tab attached: {valid_tab_id}')
        return tab

    async def stop(self):
        """
        Stop browser process and cleanup resources.

        Sends Browser.close command, terminates process, removes temp directories,
        and closes WebSocket connections.

        Raises:
            BrowserNotRunning: If the browser is not currently running.
        """
        if not await self._is_browser_running():
            logger.error('Stop called but browser is not running')
            raise BrowserNotRunning()

        logger.info('Stopping browser process')
        # Ask the browser to close over CDP first, then stop the process itself.
        await self._execute_command(BrowserCommands.close())
        self._browser_process_manager.stop_process()
        await self._connection_handler.close()
        # Short pause before cleanup, longer on Windows (os.name == 'nt').
        # NOTE(review): presumably gives the process time to release files in the
        # temp directories before they are removed - confirm.
        await asyncio.sleep(0.5 if os.name == 'nt' else 0.1)
        self._temp_directory_manager.cleanup()
        logger.info('Browser process stopped and resources cleaned up')

    async def close(self):
        """
        Close the WebSocket connection held by this browser object.

        Only the connection handler is closed here; this method does not stop
        the browser process (see stop() for that).
        """
        logger.info('Closing browser WebSocket connection')
        handler = self._connection_handler
        await handler.close()

    async def create_browser_context(
        self, proxy_server: Optional[str] = None, proxy_bypass_list: Optional[str] = None
    ) -> str:
        """
        Create isolated browser context (like incognito).

        Browser contexts provide isolated storage and don't share session data.
        Multiple contexts can exist simultaneously.

        Args:
            proxy_server: Optional proxy for this context only (scheme://host:port).
                If it embeds credentials, they are stripped before the proxy is
                sent to the browser and remembered per context in
                ``_context_proxy_auth``.
            proxy_bypass_list: Comma-separated hosts that bypass proxy.

        Returns:
            Browser context ID for use with other methods.
        """
        # If proxy_server contains credentials, strip them and store per-context auth
        sanitized_proxy = proxy_server
        extracted_auth: Optional[tuple[str, str]] = None
        if proxy_server:
            sanitized_proxy, extracted_auth = self._sanitize_proxy_and_extract_auth(proxy_server)
            # Only the sanitized proxy and a boolean are logged, never the credentials.
            logger.debug(
                f'Creating browser context with proxy: {sanitized_proxy} '
                f'(credentials provided={bool(extracted_auth)})'
            )

        response: CreateBrowserContextResponse = await self._execute_command(
            TargetCommands.create_browser_context(
                proxy_server=sanitized_proxy,
                proxy_bypass_list=proxy_bypass_list,
            )
        )
        context_id = response['result']['browserContextId']
        if extracted_auth:
            self._context_proxy_auth[context_id] = extracted_auth
        logger.info(f'Created browser context: {context_id}')
        return context_id

    async def delete_browser_context(self, browser_context_id: str):
        """
        Delete browser context and all associated tabs/resources.

        Removes all storage (cookies, localStorage, etc.) and closes all tabs.
        The default browser context cannot be deleted.

        Args:
            browser_context_id: ID of the context to dispose.

        Returns:
            The response of the dispose command.

        Note:
            Closes all associated tabs immediately. Proxy credentials stored for
            this context by create_browser_context() are discarded once the
            browser has accepted the disposal.
        """
        logger.info(f'Deleting browser context: {browser_context_id}')
        response = await self._execute_command(
            TargetCommands.dispose_browser_context(browser_context_id)
        )
        # The context is gone, so its stored proxy credentials must not linger.
        # pop() with a default is a no-op for contexts created without credentials.
        self._context_proxy_auth.pop(browser_context_id, None)
        return response

    async def get_browser_contexts(self) -> list[str]:
        """Return the IDs of all browser contexts, the default context included."""
        contexts_command = TargetCommands.get_browser_contexts()
        response: GetBrowserContextsResponse = await self._execute_command(contexts_command)
        logger.debug(f'Fetched {len(response["result"]["browserContextIds"])} browser contexts')
        context_ids = response['result']['browserContextIds']
        return context_ids

    async def new_tab(self, url: str = '', browser_context_id: Optional[str] = None) -> Tab:
        """
        Open a new tab and return the Tab object that controls it.

        The new tab is registered in ``_tabs_opened``, gets the user-agent
        override and any per-context proxy auth applied, and is then navigated
        to ``url`` when one is given.

        Args:
            url: Page to load after creation. When empty, no navigation is issued.
            browser_context_id: Context to create tab in (default if None).

        Returns:
            Tab instance for page navigation and element interaction.
        """
        logger.info(f'Creating new tab (context={browser_context_id})')
        create_command = TargetCommands.create_target(browser_context_id=browser_context_id)
        response: CreateTargetResponse = await self._execute_command(create_command)
        target_id = response['result']['targetId']

        tab_kwargs = self._get_tab_kwargs(target_id, browser_context_id)
        tab = Tab(self, **tab_kwargs)
        self._tabs_opened[target_id] = tab

        await self._apply_user_agent_override(tab)
        await self._setup_context_proxy_auth_for_tab(tab, browser_context_id)
        if url:
            await tab.go_to(url)
        logger.info(f'New tab created: {target_id}')
        return tab

    async def get_targets(self) -> list[TargetInfo]:
        """
        Fetch every target the browser currently reports.

        Targets include pages, service workers, shared workers, and browser process.

        Returns:
            The ``targetInfos`` list from the command response.
        """
        targets_command = TargetCommands.get_targets()
        response: GetTargetsResponse = await self._execute_command(targets_command)
        logger.debug(f'Fetched {len(response["result"]["targetInfos"])} targets')
        target_infos = response['result']['targetInfos']
        return target_infos

    async def get_opened_tabs(self) -> list[Tab]:
        """
        Get all opened tabs that are not extensions and have the type 'page'.
        Tabs that are already opened will be returned as is. If a new target is opened,
        a new Tab instance will be created.

        Every newly created Tab is registered in ``_tabs_opened`` under its own
        target id, so later calls return the same instance for that target.

        Returns:
            List of Tab instances: the already-tracked tabs first, followed by
            the newly discovered ones (created in reverse target order).
        """
        targets = await self.get_targets()
        page_target_ids = [
            target['targetId']
            for target in targets
            if target['type'] == 'page' and 'extension' not in target['url']
        ]

        # Snapshot the tracked tabs before awaiting anything else.
        existing_tabs = list(self._tabs_opened.values())
        remaining_target_ids = [
            target_id for target_id in page_target_ids if target_id not in self._tabs_opened
        ]

        # Keep each id paired with the Tab built for it. Zipping the un-reversed
        # id list against tabs built in reversed order would register tabs under
        # the wrong target id as soon as there are two or more new targets.
        created: dict[str, Tab] = {}
        for target_id in reversed(remaining_target_ids):
            tab = Tab(self, **self._get_tab_kwargs(target_id))
            await self._apply_user_agent_override(tab)
            created[target_id] = tab

        new_tabs = list(created.values())
        self._tabs_opened.update(created)
        logger.debug(
            f'Opened tabs resolved: existing={len(existing_tabs)}, new={len(new_tabs)}',
        )
        return existing_tabs + new_tabs

    async def get_tab_by_target(self, target: TargetInfo) -> Tab:
        """
        Build a Tab for the given target and apply the user-agent override to it.

        Args:
            target: Target description; only its ``targetId`` is read here.

        Returns:
            A newly constructed Tab. This method does not add it to ``_tabs_opened``.
        """
        target_id = target['targetId']
        tab_kwargs = self._get_tab_kwargs(target_id)
        tab = Tab(self, **tab_kwargs)
        await self._apply_user_agent_override(tab)
        return tab

    async def set_download_path(self, path: str, browser_context_id: Optional[str] = None):
        """
        Allow downloads and save them under ``path``.

        Shortcut for a download behavior of ``DownloadBehavior.ALLOW`` with the
        given directory.

        Args:
            path: Directory downloads are written to.
            browser_context_id: Context to apply to (default if None).
        """
        logger.info(f'Setting download path: {path} (context={browser_context_id})')
        allow_downloads = BrowserCommands.set_download_behavior(
            behavior=DownloadBehavior.ALLOW,
            download_path=path,
            browser_context_id=browser_context_id,
        )
        return await self._execute_command(allow_downloads)

    async def set_download_behavior(
        self,
        behavior: DownloadBehavior,
        download_path: Optional[str] = None,
        browser_context_id: Optional[str] = None,
        events_enabled: bool = False,
    ):
        """
        Configure download handling.

        Args:
            behavior: ALLOW (save to path), DENY (cancel), or DEFAULT.
            download_path: Required if behavior is ALLOW.
            browser_context_id: Context to apply to (default if None).
            events_enabled: Generate download events for progress tracking.

        Returns:
            The response of the set-download-behavior command.
        """
        # Fields are separated by ", " so the log line stays readable.
        logger.info(
            f'Setting download behavior: behavior={behavior}, '
            f'path={download_path}, context={browser_context_id}, '
            f'events={events_enabled}'
        )
        return await self._execute_command(
            BrowserCommands.set_download_behavior(
                behavior=behavior,
                download_path=download_path,
                browser_context_id=browser_context_id,
                events_enabled=events_enabled,
            )
        )

    async def delete_all_cookies(self, browser_context_id: Optional[str] = None):
        """
        Clear every cookie held by the browser or by a single browser context.

        Args:
            browser_context_id: Context whose cookies are cleared (default if None).
        """
        logger.info(f'Clearing all cookies (context={browser_context_id})')
        clear_command = StorageCommands.clear_cookies(browser_context_id)
        return await self._execute_command(clear_command)

    async def set_cookies(
        self, cookies: list[CookieParam], browser_context_id: Optional[str] = None
    ):
        """
        Store the given cookies in the browser or in a single browser context.

        Args:
            cookies: Cookies to set.
            browser_context_id: Context to apply to (default if None).
        """
        logger.debug(f'Setting {len(cookies)} cookies (context={browser_context_id})')
        set_command = StorageCommands.set_cookies(cookies, browser_context_id)
        return await self._execute_command(set_command)

    async def get_cookies(self, browser_context_id: Optional[str] = None) -> list[Cookie]:
        """Return all cookies of the browser or of a single browser context.

        Args:
            browser_context_id: Context to read from (default if None).

        Note:
            This method does not work with native incognito mode (--incognito flag).
            For incognito mode, use ``tab.get_cookies()`` instead.
        """
        cookies_command = StorageCommands.get_cookies(browser_context_id)
        response: GetCookiesResponse = await self._execute_command(cookies_command)
        logger.debug(
            f'Retrieved {len(response["result"]["cookies"])} cookies (context={browser_context_id})'
        )
        cookies = response['result']['cookies']
        return cookies

    async def get_version(self) -> GetVersionResult:
        """Return the ``result`` payload of the browser's get-version command."""
        version_command = BrowserCommands.get_version()
        response: GetVersionResponse = await self._execute_command(version_command)
        logger.debug(f'Browser version: {response["result"]}')
        version_info = response['result']
        return version_info

    async def get_window_id_for_target(self, target_id: str) -> int:
        """
        Look up the ID of the window that hosts the given target.

        Args:
            target_id: Target whose window is requested.

        Returns:
            The ``windowId`` from the command response.
        """
        window_command = BrowserCommands.get_window_for_target(target_id)
        response: GetWindowForTargetResponse = await self._execute_command(window_command)
        logger.debug(f'Window id for target {target_id}: {response["result"]["windowId"]}')
        window_id = response['result']['windowId']
        return window_id

    async def get_window_id_for_tab(self, tab: Tab) -> int:
        """
        Look up the window ID for a tab.

        The tab's target id is used when set; otherwise the last ``/``-separated
        segment of the tab's WebSocket address stands in for it.

        Raises:
            MissingTargetOrWebSocket: If neither source yields a target id.
        """
        target_id = tab._target_id
        if not target_id:
            ws_address = tab._ws_address
            target_id = ws_address.split('/')[-1] if ws_address else None
        if not target_id:
            logger.error('Missing target id or ws address for tab when getting window id')
            raise MissingTargetOrWebSocket()
        return await self.get_window_id_for_target(target_id)

    async def get_window_id(self) -> int:
        """
        Return the window ID of a valid tab picked from the current targets.

        Raises:
            NoValidTabFound: If no valid attached tab can be found.
        """
        current_targets = await self.get_targets()
        tab_target_id = await self._get_valid_tab_id(current_targets)
        window_id = await self.get_window_id_for_target(tab_target_id)
        return window_id

    async def set_window_maximized(self):
        """Maximize the window returned by get_window_id()."""
        window_id = await self.get_window_id()
        logger.info(f'Maximizing window: id={window_id}')
        maximize_command = BrowserCommands.set_window_maximized(window_id)
        return await self._execute_command(maximize_command)

    async def set_window_minimized(self):
        """Minimize the window returned by get_window_id()."""
        window_id = await self.get_window_id()
        logger.info(f'Minimizing window: id={window_id}')
        minimize_command = BrowserCommands.set_window_minimized(window_id)
        return await self._execute_command(minimize_command)

    async def set_window_bounds(self, bounds: Bounds):
        """
        Apply new bounds to the window returned by get_window_id().

        Args:
            bounds: Properties to modify (left, top, width, height, windowState).
                Only specified properties are changed.
        """
        window_id = await self.get_window_id()
        logger.info(f'Setting window bounds: id={window_id}, bounds={bounds}')
        bounds_command = BrowserCommands.set_window_bounds(window_id, bounds)
        return await self._execute_command(bounds_command)

    async def grant_permissions(
        self,
        permissions: list[PermissionType],
        origin: Optional[str] = None,
        browser_context_id: Optional[str] = None,
    ):
        """
        Grant the listed browser permissions (geolocation, notifications, camera, etc.).

        Lets automated runs skip the usual permission prompts.

        Args:
            permissions: Permissions to grant.
            origin: Origin to grant to (all origins if None).
            browser_context_id: Context to apply to (default if None).
        """
        logger.info(
            f'Granting permissions: {permissions} (origin={origin}, context={browser_context_id})',
        )
        grant_command = BrowserCommands.grant_permissions(permissions, origin, browser_context_id)
        return await self._execute_command(grant_command)

    async def reset_permissions(self, browser_context_id: Optional[str] = None):
        """
        Reset all permissions to their defaults, restoring prompting behavior.

        Args:
            browser_context_id: Context to apply to (default if None).
        """
        logger.info(f'Resetting permissions (context={browser_context_id})')
        reset_command = BrowserCommands.reset_permissions(browser_context_id)
        return await self._execute_command(reset_command)

    @overload
    async def on(
        self, event_name: str, callback: Callable[[Any], Any], temporary: bool = False
    ) -> int: ...
    @overload
    async def on(
        self, event_name: str, callback: Callable[[Any], Awaitable[Any]], temporary: bool = False
    ) -> int: ...
    async def on(self, event_name, callback, temporary: bool = False) -> int:
        """
        Register CDP event listener at browser level.

        Async callbacks run in a background task so they do not block event
        dispatch; sync callbacks are registered as they are. Affects all
        pages/targets.

        Args:
            event_name: CDP event name (e.g., "Network.responseReceived").
            callback: Function called on event (sync or async).
            temporary: Remove after first invocation.

        Returns:
            Callback ID for removal.

        Note:
            For page-specific events, use Tab.on() instead.
        """
        is_async_callback = asyncio.iscoroutinefunction(callback)

        # The event loop keeps only weak references to tasks, so a task nobody
        # references can be garbage-collected before it finishes. Keep strong
        # references on the browser instance until each task is done. The set is
        # created lazily so this method does not depend on __init__ changes.
        background_tasks = getattr(self, '_event_callback_tasks', None)
        if background_tasks is None:
            background_tasks = set()
            self._event_callback_tasks = background_tasks

        async def callback_wrapper(event):
            task = asyncio.create_task(callback(event))
            background_tasks.add(task)
            task.add_done_callback(background_tasks.discard)

        function_to_register = callback_wrapper if is_async_callback else callback
        logger.debug(
            f'Registering callback: event={event_name}, temporary={temporary}, '
            f'async={is_async_callback}'
        )
        return await self._connection_handler.register_callback(
            event_name, function_to_register, temporary
        )

    async def remove_callback(self, callback_id: int):
        """
        Unregister a callback from the browser's connection handler.

        Args:
            callback_id: ID of the callback to remove.
        """
        logger.debug(f'Removing callback: id={callback_id}')
        handler = self._connection_handler
        return await handler.remove_callback(callback_id)

    async def enable_fetch_events(
        self,
        handle_auth_requests: bool = False,
        resource_type: Optional[ResourceType] = None,
    ):
        """
        Turn on request interception through the Fetch domain.

        Matching requests are paused until they are explicitly continued,
        which allows them to be inspected, modified, or blocked first.

        Args:
            handle_auth_requests: Intercept authentication challenges.
            resource_type: Filter by type (XHR, Fetch, Document, etc.). Empty = all.

        Note:
            Paused requests must be continued or they will timeout.
        """
        logger.debug(
            f'Enabling Fetch events: handle_auth={handle_auth_requests}, '
            f'resource_type={resource_type}'
        )
        enable_command = FetchCommands.enable(
            handle_auth_requests=handle_auth_requests,
            resource_type=resource_type,
        )
        return await self._connection_handler.execute_command(enable_command)

    async def disable_fetch_events(self):
        """Turn off request interception and release any paused requests."""
        logger.debug('Disabling Fetch events')
        disable_command = FetchCommands.disable()
        return await self._connection_handler.execute_command(disable_command)

    async def enable_runtime_events(self):
        """
        Turn on Runtime domain events for the browser-level connection.

        Returns:
            The response of the Runtime enable command.
        """
        logger.debug('Enabling Runtime events')
        enable_command = RuntimeCommands.enable()
        return await self._connection_handler.execute_command(enable_command)

    async def disable_runtime_events(self):
        """
        Turn off Runtime domain events for the browser-level connection.

        Returns:
            The response of the Runtime disable command.
        """
        logger.debug('Disabling Runtime events')
        disable_command = RuntimeCommands.disable()
        return await self._connection_handler.execute_command(disable_command)

    async def continue_request(
        self,
        request_id: str,
        url: Optional[str] = None,
        method: Optional[RequestMethod] = None,
        post_data: Optional[str] = None,
        headers: Optional[list[HeaderEntry]] = None,
        intercept_response: Optional[bool] = None,
    ):
        """
        Resume a paused request, optionally overriding parts of it.

        Every optional argument is forwarded unchanged to
        ``FetchCommands.continue_request``; leaving them all as None continues
        the request with no overrides supplied.

        Args:
            request_id: Identifier of the paused request.
            url: Replacement URL, if any.
            method: Replacement HTTP method, if any.
            post_data: Replacement request body, if any.
            headers: Replacement header entries, if any.
            intercept_response: Forwarded as-is to the Fetch command.

        Returns:
            The response of the Fetch continueRequest command.
        """
        logger.debug(f'Continuing request: id={request_id}')
        continue_command = FetchCommands.continue_request(
            request_id=request_id,
            url=url,
            method=method,
            post_data=post_data,
            headers=headers,
            intercept_response=intercept_response,
        )
        return await self._execute_command(continue_command)

    async def fail_request(self, request_id: str, error_reason: ErrorReason):
        """
        Abort a paused request with the given error reason.

        Args:
            request_id: Identifier of the paused request.
            error_reason: Reason reported for the failure.

        Returns:
            The response of the Fetch failRequest command.
        """
        logger.debug(f'Failing request: id={request_id}, reason={error_reason}')
        fail_command = FetchCommands.fail_request(request_id, error_reason)
        return await self._execute_command(fail_command)

    async def fulfill_request(
        self,
        request_id: str,
        response_code: int,
        response_headers: Optional[list[HeaderEntry]] = None,
        body: Optional[str] = None,
        response_phrase: Optional[str] = None,
    ):
        """
        Answer a paused request with a caller-supplied response.

        Args:
            request_id: Identifier of the paused request.
            response_code: HTTP status code of the response.
            response_headers: Header entries for the response, if any.
            body: Response body, if any (forwarded unchanged to the command).
            response_phrase: Status phrase for the response, if any.

        Returns:
            The response of the Fetch fulfillRequest command.
        """
        # Only log whether headers/body were supplied, not their contents.
        has_headers = bool(response_headers)
        has_body = bool(body)
        logger.debug(
            f'Fulfilling request: id={request_id}, code={response_code}, '
            f'headers={has_headers}, body={has_body}'
        )
        fulfill_command = FetchCommands.fulfill_request(
            request_id=request_id,
            response_code=response_code,
            response_headers=response_headers,
            body=body,
            response_phrase=response_phrase,
        )
        return await self._execute_command(fulfill_command)

    @staticmethod
    def _validate_connection_port(connection_port: Optional[int]):
        """Validate connection port."""
        if connection_port and connection_port < 0:
            logger.error(f'Invalid connection port: {connection_port}')
            raise InvalidConnectionPort()

    async def _continue_request_callback(self, event: RequestPausedEvent):
        """
        Event handler that resumes a paused request unchanged.

        Args:
            event: Request-paused event; its ``params.requestId`` identifies
                the request to continue.

        Returns:
            The result of ``continue_request`` for that request.
        """
        paused_request_id = event['params']['requestId']
        logger.debug(f'[Fetch] REQUEST_PAUSED -> continue: id={paused_request_id}')
        outcome = await self.continue_request(paused_request_id)
        return outcome

    async def _continue_request_with_auth_callback(
        self,
        event: RequestPausedEvent,
        proxy_username: Optional[str],
        proxy_password: Optional[str],
    ):
        """
        Event handler that answers an auth challenge with proxy credentials.

        After the credentials are sent, Fetch events are disabled again on the
        browser-level connection.

        Args:
            event: Event whose ``params.requestId`` identifies the challenged
                request.
            proxy_username: Username to provide.
            proxy_password: Password to provide.

        Returns:
            The response of the continueWithAuth command.
        """
        challenged_request_id = event['params']['requestId']
        # Log only whether a username exists, never the credentials themselves.
        logger.debug(
            f'[Fetch] AUTH_REQUIRED -> provide credentials: id={challenged_request_id}, '
            f'user_set={bool(proxy_username)}'
        )
        auth_command = FetchCommands.continue_request_with_auth(
            challenged_request_id,
            auth_challenge_response=AuthChallengeResponseType.PROVIDE_CREDENTIALS,
            proxy_username=proxy_username,
            proxy_password=proxy_password,
        )
        response: Response = await self._execute_command(auth_command)
        await self.disable_fetch_events()
        return response

    @staticmethod
    async def _tab_continue_request_callback(event: RequestPausedEvent, tab: Tab):
        """
        Tab-level event handler that resumes a paused request unchanged.

        Args:
            event: Request-paused event; its ``params.requestId`` identifies
                the request to continue.
            tab: Tab on which the request is continued.

        Returns:
            The result of ``tab.continue_request`` for that request.
        """
        paused_request_id = event['params']['requestId']
        logger.debug(f'[Tab Fetch] REQUEST_PAUSED -> continue: id={paused_request_id}')
        outcome = await tab.continue_request(paused_request_id)
        return outcome

    @staticmethod
    async def _tab_continue_request_with_auth_callback(
        event: RequestPausedEvent,
        tab: Tab,
        proxy_username: Optional[str],
        proxy_password: Optional[str],
    ):
        """
        Tab-level event handler that answers an auth challenge with credentials.

        After the credentials are sent, Fetch events are disabled on the tab.

        Args:
            event: Event whose ``params.requestId`` identifies the challenged
                request.
            tab: Tab on which the challenge is answered.
            proxy_username: Username to provide.
            proxy_password: Password to provide.

        Returns:
            The response of ``tab.continue_with_auth``.
        """
        challenged_request_id = event['params']['requestId']
        # Log only whether a username exists, never the credentials themselves.
        username_present = bool(proxy_username)
        logger.debug(
            f'[Tab Fetch] AUTH_REQUIRED -> provide credentials: id={challenged_request_id}, '
            f'user_set={username_present}'
        )
        response: Response = await tab.continue_with_auth(
            request_id=challenged_request_id,
            auth_challenge_response=AuthChallengeResponseType.PROVIDE_CREDENTIALS,
            proxy_username=proxy_username,
            proxy_password=proxy_password,
        )
        await tab.disable_fetch_events()
        return response

    async def _setup_context_proxy_auth_for_tab(
        self, tab: Tab, browser_context_id: Optional[str]
    ) -> None:
        """
        Enable proxy auth handling for a Tab if its context has credentials stored.

        Does nothing when no context id is given or when no credentials are
        stored for that context in ``self._context_proxy_auth``. Otherwise it
        enables Fetch events on the tab and registers two temporary handlers:
        one that continues paused requests and one that answers the auth
        challenge with the stored credentials.

        Args:
            tab: Tab to configure.
            browser_context_id: Browser context the tab belongs to, if any.
        """
        if not browser_context_id:
            return
        creds = self._context_proxy_auth.get(browser_context_id)
        if not creds:
            return
        username, password = creds
        # Log only whether a username exists, never the credentials themselves.
        logger.debug(
            f'Enabling context-level proxy auth for tab (context={browser_context_id}, '
            f'user_set={bool(username)})'
        )
        await tab.enable_fetch_events(handle_auth=True)
        await tab.on(
            FetchEvent.REQUEST_PAUSED,
            partial(
                self._tab_continue_request_callback,
                tab=tab,
            ),
            temporary=True,
        )
        await tab.on(
            FetchEvent.AUTH_REQUIRED,
            partial(
                self._tab_continue_request_with_auth_callback,
                tab=tab,
                proxy_username=username,
                proxy_password=password,
            ),
            temporary=True,
        )

    async def _apply_user_agent_override(self, tab: Tab) -> None:
        """
        Apply the configured User-Agent to a tab when --user-agent= is set.

        Reads the --user-agent= browser argument, parses it, and sends an
        Emulation.setUserAgentOverride command carrying the parsed platform
        and metadata. When the parser also produced a navigator override
        script, that script is registered to run on new documents (and
        immediately).

        Args:
            tab: Tab that receives the override commands.
        """
        configured_ua = self._get_user_agent_from_options()
        if not configured_ua:
            return

        ua_details = UserAgentParser.parse(configured_ua)
        # Only the first 60 characters of the UA string are logged.
        logger.debug('Applying User-Agent override: %s', configured_ua[:60])

        override_command = EmulationCommands.set_user_agent_override(
            user_agent=configured_ua,
            platform=ua_details.platform,
            user_agent_metadata=ua_details.user_agent_metadata,
        )
        await tab._execute_command(override_command)

        if not ua_details.navigator_override_js:
            return

        script_command = PageCommands.add_script_to_evaluate_on_new_document(
            source=ua_details.navigator_override_js,
            run_immediately=True,
        )
        await tab._execute_command(script_command)

    def _get_user_agent_from_options(self) -> Optional[str]:
        """Extract User-Agent value from --user-agent= browser argument."""
        for arg in self.options.arguments:
            if arg.startswith('--user-agent='):
                return arg[len('--user-agent=') :]
        return None

    async def _verify_browser_running(self):
        """
        Ensure the browser came up within the configured start timeout.

        Raises:
            FailedToStartBrowser: If the browser is not reported as running
                within ``options.start_timeout``.
        """
        logger.debug(f'Verifying browser is running (timeout={self.options.start_timeout})')
        browser_is_up = await self._is_browser_running(self.options.start_timeout)
        if browser_is_up:
            return
        logger.error('Browser failed to start within timeout')
        raise FailedToStartBrowser()

    async def _configure_proxy(
        self, private_proxy: bool, proxy_credentials: tuple[Optional[str], Optional[str]]
    ):
        """
        Install browser-level proxy authentication handlers when required.

        When ``private_proxy`` is false nothing happens. Otherwise Fetch events
        are enabled with auth interception, and two temporary handlers are
        registered: one that continues paused requests and one that answers
        the auth challenge with the given credentials.

        Args:
            private_proxy: Whether the proxy requires authentication.
            proxy_credentials: ``(username, password)`` pair for the proxy.
        """
        if not private_proxy:
            return

        # Log only whether any credential was supplied, never the values.
        credentials_given = bool(proxy_credentials[0] or proxy_credentials[1])
        logger.debug(
            'Configuring proxy authentication: '
            f'credentials provided={credentials_given}'
        )
        await self.enable_fetch_events(handle_auth_requests=True)

        await self.on(
            FetchEvent.REQUEST_PAUSED,
            self._continue_request_callback,
            temporary=True,
        )

        auth_handler = partial(
            self._continue_request_with_auth_callback,
            proxy_username=proxy_credentials[0],
            proxy_password=proxy_credentials[1],
        )
        await self.on(
            FetchEvent.AUTH_REQUIRED,
            auth_handler,
            temporary=True,
        )

    @staticmethod
    def _is_valid_tab(target: TargetInfo) -> bool:
        """Check if target is a valid browser tab (filters out extensions)."""
        return target.get('type') == 'page' and 'chrome-extension://' not in target.get('url', '')

    @staticmethod
    async def _get_valid_tab_id(targets: list[TargetInfo]) -> str:
        """
        Find valid attached tab ID.

        Raises:
            NoValidTabFound: If no valid attached tab is found.
        """
        valid_tab = next(
            (
                tab
                for tab in targets
                if tab.get('type') == 'page' and 'extension' not in tab.get('url', '')
            ),
            None,
        )

        if not valid_tab:
            logger.error(f'No valid tab found among {len(targets)} targets')
            raise NoValidTabFound()

        tab_id = valid_tab.get('targetId')
        if not tab_id:
            logger.error('Valid tab missing targetId')
            raise NoValidTabFound('Tab missing targetId')

        return tab_id

    async def _is_browser_running(self, timeout: int = 10) -> bool:
        """Check if browser process is running and CDP endpoint is responsive."""
        for _ in range(timeout):
            if await self._connection_handler.ping():
                return True
            await asyncio.sleep(1)

        return False

    async def _execute_command(
        self, command: Command[T_CommandParams, T_CommandResponse], timeout: int = 60
    ) -> T_CommandResponse:
        """Execute CDP command and return result (core method for browser communication)."""
        logger.debug(f'Executing command: {command.get("method")} (timeout={timeout})')
        return await self._connection_handler.execute_command(command, timeout=timeout)

    def _setup_user_dir(self):
        """
        Make sure the browser has a user data directory to start with.

        When no --user-data-dir= argument is present, a temporary directory is
        created and appended to the browser arguments. In either case, any
        configured browser preferences are written into the directory in use.
        """
        configured_dir = self._get_user_data_dir()
        if not configured_dir:
            # No directory supplied by the caller: fall back to a temporary one.
            scratch_dir = self._temp_directory_manager.create_temp_dir()
            self.options.arguments.append(f'--user-data-dir={scratch_dir.name}')
            if self.options.browser_preferences:
                self._set_browser_preferences_in_temp_dir(scratch_dir)
        elif self.options.browser_preferences:
            self._set_browser_preferences_in_user_data_dir(configured_dir)
        logger.debug(f'User dir setup complete: {self._get_user_data_dir()}')

    def _set_browser_preferences_in_temp_dir(self, temp_dir: TemporaryDirectory):
        os.mkdir(os.path.join(temp_dir.name, 'Default'))
        preferences = self.options.browser_preferences
        with open(
            os.path.join(temp_dir.name, 'Default', 'Preferences'), 'w', encoding='utf-8'
        ) as json_file:
            json.dump(preferences, json_file)
        logger.debug('Wrote browser preferences to temp user dir')

    def _set_browser_preferences_in_user_data_dir(self, user_data_dir: str):
        """
        Set browser preferences in the user data directory.

        This function will:
        1. Create a backup of the existing Preferences file if it exists
        2. Create Default directory if it doesn't exist
        3. Write the new preferences to the Preferences file

        Args:
            user_data_dir: Path to the user data directory
        """
        default_dir = os.path.join(user_data_dir, 'Default')
        os.makedirs(default_dir, exist_ok=True)

        preferences_path = os.path.join(default_dir, 'Preferences')
        self._backup_preferences_dir = os.path.join(default_dir, 'Preferences.backup')

        if os.path.exists(preferences_path):
            # Backup existing Preferences file
            shutil.copy2(preferences_path, self._backup_preferences_dir)

        preferences = {}
        if os.path.exists(preferences_path):
            with suppress(json.JSONDecodeError):
                with open(preferences_path, 'r', encoding='utf-8') as preferences_file:
                    preferences = json.load(preferences_file)
        preferences.update(self.options.browser_preferences)
        with open(preferences_path, 'w', encoding='utf-8') as json_file:
            json.dump(preferences, json_file, indent=2)
        logger.debug(f'Updated browser preferences in user data dir: {preferences_path}')

    def _get_user_data_dir(self) -> Optional[str]:
        for arg in self.options.arguments:
            if arg.startswith('--user-data-dir='):
                return arg.split('=', 1)[1]
        return None

    @staticmethod
    def _validate_ws_address(ws_address: str):
        """Validate WebSocket address."""
        min_slashes = 4
        if not ws_address.startswith(('ws://', 'wss://')):
            logger.error('Invalid WebSocket address: missing ws:// or wss:// prefix')
            raise InvalidWebSocketAddress('WebSocket address must start with ws:// or wss://')
        if len(ws_address.split('/')) < min_slashes:
            logger.error('Invalid WebSocket address: not enough slashes')
            raise InvalidWebSocketAddress(
                f'WebSocket address must contain at least {min_slashes} slashes'
            )

    async def _setup_ws_address(self, ws_address: str):
        """
        Validate and adopt a WebSocket address for the browser connection.

        The address is stored on both the browser and its connection handler,
        after which the handler is asked to ensure an active connection.

        Args:
            ws_address: Browser-level WebSocket address.

        Raises:
            InvalidWebSocketAddress: If validation of the address fails.
        """
        self._validate_ws_address(ws_address)
        self._ws_address = ws_address
        handler = self._connection_handler
        handler._ws_address = self._ws_address
        await handler._ensure_active_connection()
        # The address itself is intentionally left out of the log message.
        logger.info('WebSocket address set for browser-level connection')

    def _get_tab_kwargs(self, target_id: str, browser_context_id: Optional[str] = None) -> dict:
        """
        Get kwargs for creating a tab based on the WebSocket address.
        If the WebSocket address is set, the tab will be created with the WebSocket address.
        Otherwise, the tab will be created with the connection port and target ID.

        Args:
            target_id: Target ID of the tab.
            browser_context_id: Browser context ID of the tab.

        Returns:
            Dict of kwargs for creating a tab.
        """
        kwargs: dict[str, Any] = {
            'target_id': target_id,
            'browser_context_id': browser_context_id,
        }
        if self._ws_address:
            kwargs['ws_address'] = self._get_tab_ws_address(target_id)
        else:
            kwargs['connection_port'] = self._connection_port
        logger.debug(f'Tab kwargs resolved for {target_id}: using_ws={bool(self._ws_address)}')
        return kwargs

    def _get_tab_ws_address(self, tab_id: str) -> str:
        """
        Get WebSocket address for a specific tab, preserving any query or fragment
        components present in the original browser-level WebSocket URL.

        This ensures authentication tokens passed via query string (e.g.,
        ws://host/devtools/browser/abc?token=XYZ) are retained when switching
        to the page-level endpoint (devtools/page/<tab_id>), which is critical
        for providers like Browserless or authenticated CDP proxies.
        """
        if not self._ws_address:
            raise InvalidWebSocketAddress('WebSocket address is not set')

        parts = urlsplit(self._ws_address)
        # Preserve scheme and netloc; build the page path and keep query/fragment
        page_path = f'/devtools/page/{tab_id}'
        ws = urlunsplit((parts.scheme, parts.netloc, page_path, parts.query, parts.fragment))
        logger.debug(f'Resolved tab WebSocket address: {ws}')
        return ws

    @staticmethod
    def _sanitize_proxy_and_extract_auth(
        proxy_server: str,
    ) -> tuple[str, Optional[tuple[str, str]]]:
        """Strip credentials from a proxy URL and return sanitized URL plus (user, pass).

        Accepts inputs like:
        - username:password@host:port
        - http://username:password@host:port
        - socks5://username:password@host:port
        - host:port (no credentials)
        Returns a (sanitized_proxy, (user, pass) | None).
        Ensures scheme is present in the sanitized URL (defaults to http).
        """
        base = proxy_server if '://' in proxy_server else f'http://{proxy_server}'
        parts = urlsplit(base)
        netloc = parts.netloc
        creds: Optional[tuple[str, str]] = None
        if '@' in netloc:
            cred_part, host_part = netloc.split('@', 1)
            if ':' in cred_part:
                user, pwd = cred_part.split(':', 1)
            else:
                user, pwd = cred_part, ''
            creds = (user, pwd)
            sanitized = urlunsplit((
                parts.scheme,
                host_part,
                parts.path,
                parts.query,
                parts.fragment,
            ))
        else:
            # No creds; ensure scheme
            sanitized = urlunsplit((
                parts.scheme,
                parts.netloc,
                parts.path,
                parts.query,
                parts.fragment,
            ))
        return sanitized, creds

    @abstractmethod
    def _get_default_binary_location(self) -> str:
        """
        Get default browser executable path (implemented by subclasses).

        Returns:
            Path to the browser executable.
        """
        pass


================================================
FILE: pydoll/browser/chromium/chrome.py
================================================
from __future__ import annotations

import logging
import platform
from typing import TYPE_CHECKING, Optional

from pydoll.browser.chromium.base import Browser
from pydoll.browser.managers import ChromiumOptionsManager
from pydoll.exceptions import UnsupportedOS
from pydoll.utils import validate_browser_paths

if TYPE_CHECKING:
    from pydoll.browser.options import ChromiumOptions

logger = logging.getLogger(__name__)


class Chrome(Browser):
    """Google Chrome flavour of the CDP-driven ``Browser``."""

    def __init__(
        self,
        options: Optional[ChromiumOptions] = None,
        connection_port: Optional[int] = None,
    ):
        """
        Create a Chrome browser instance.

        Args:
            options: Chrome configuration options (default if None).
            connection_port: CDP WebSocket port (random if None).
        """
        super().__init__(ChromiumOptionsManager(options), connection_port)

    @staticmethod
    def _get_default_binary_location():
        """
        Resolve the default Chrome executable for the current OS.

        Returns:
            The path returned by ``validate_browser_paths`` for the candidate
            locations of the current OS.

        Raises:
            UnsupportedOS: If OS is not supported.
            ValueError: If executable not found at default location.
        """
        os_name = platform.system()
        logger.debug(f'Resolving default Chrome binary for OS: {os_name}')

        windows_candidates = [
            r'C:\Program Files\Google\Chrome\Application\chrome.exe',
            r'C:\Program Files (x86)\Google\Chrome\Application\chrome.exe',
        ]
        linux_candidates = [
            '/usr/bin/google-chrome',
            '/usr/bin/google-chrome-stable',
        ]
        mac_candidates = [
            '/Applications/Google Chrome.app/Contents/MacOS/Google Chrome',
        ]
        candidates_by_os = {
            'Windows': windows_candidates,
            'Linux': linux_candidates,
            'Darwin': mac_candidates,
        }

        candidates = candidates_by_os.get(os_name)
        if candidates:
            path = validate_browser_paths(candidates)
            logger.debug(f'Using Chrome binary: {path}')
            return path

        logger.error(f'Unsupported OS: {os_name}')
        raise UnsupportedOS(f'Unsupported OS: {os_name}')


================================================
FILE: pydoll/browser/chromium/edge.py
================================================
from __future__ import annotations

import logging
import platform
from typing import TYPE_CHECKING, Optional

from pydoll.browser.chromium.base import Browser
from pydoll.browser.managers import ChromiumOptionsManager
from pydoll.exceptions import UnsupportedOS
from pydoll.utils import validate_browser_paths

if TYPE_CHECKING:
    from pydoll.browser.options import Options

logger = logging.getLogger(__name__)


class Edge(Browser):
    """Edge browser implementation for CDP automation."""

    def __init__(
        self,
        options: Optional[Options] = None,
        connection_port: Optional[int] = None,
    ):
        """
        Initialize Edge browser instance.

        Args:
            options: Edge configuration options (default if None).
            connection_port: CDP WebSocket port (random if None).
        """
        options_manager = ChromiumOptionsManager(options)
        super().__init__(options_manager, connection_port)

    @staticmethod
    def _get_default_binary_location():
        """
        Get default Edge executable path based on OS.

        Returns:
            Path to Edge executable.

        Raises:
            UnsupportedOS: If OS is not supported; the message names the OS,
                matching the Chrome implementation.
            ValueError: If executable not found at default location.
        """
        os_name = platform.system()
        logger.debug(f'Resolving default Edge binary for OS: {os_name}')

        browser_paths = {
            'Windows': [
                r'C:\Program Files\Microsoft\Edge\Application\msedge.exe',
                r'C:\Program Files (x86)\Microsoft\Edge\Application\msedge.exe',
            ],
            'Linux': [
                '/usr/bin/microsoft-edge',
            ],
            'Darwin': [
                '/Applications/Microsoft Edge.app/Contents/MacOS/Microsoft Edge',
            ],
        }

        browser_path = browser_paths.get(os_name)

        if not browser_path:
            logger.error(f'Unsupported OS: {os_name}')
            # Include the OS name so the exception is self-explanatory.
            raise UnsupportedOS(f'Unsupported OS: {os_name}')

        path = validate_browser_paths(browser_path)
        logger.debug(f'Using Edge binary: {path}')
        return path


================================================
FILE: pydoll/browser/interfaces.py
================================================
from abc import ABC, abstractmethod

from pydoll.constants import PageLoadState


class Options(ABC):
    """Abstract description of the options a browser is launched with."""

    @property
    @abstractmethod
    def arguments(self) -> list[str]:
        """Command-line arguments for the browser."""

    @property
    @abstractmethod
    def binary_location(self) -> str:
        """Location of the browser binary."""

    @property
    @abstractmethod
    def start_timeout(self) -> int:
        """Timeout allowed for the browser to start."""

    @abstractmethod
    def add_argument(self, argument: str):
        """Add one command-line argument."""

    @property
    @abstractmethod
    def browser_preferences(self) -> dict:
        """Browser preferences as a dict."""

    @property
    @abstractmethod
    def headless(self) -> bool:
        """Headless flag."""

    @headless.setter
    @abstractmethod
    def headless(self, headless: bool):
        """Set the headless flag."""

    @property
    @abstractmethod
    def page_load_state(self) -> PageLoadState:
        """Configured page load state."""

    @page_load_state.setter
    @abstractmethod
    def page_load_state(self, state: PageLoadState):
        """Set the page load state."""


class BrowserOptionsManager(ABC):
    """Abstract manager responsible for producing browser ``Options``."""

    @abstractmethod
    def initialize_options(self) -> Options:
        """Return the options object to use."""

    @abstractmethod
    def add_default_arguments(self):
        """Add the default arguments to the managed options."""


================================================
FILE: pydoll/browser/managers/__init__.py
================================================
from pydoll.browser.managers.browser_options_manager import (
    ChromiumOptionsManager,
)
from pydoll.browser.managers.browser_process_manager import (
    BrowserProcessManager,
)
from pydoll.browser.managers.proxy_manager import ProxyManager
from pydoll.browser.managers.temp_dir_manager import TempDirectoryManager

__all__ = [
    'ChromiumOptionsManager',
    'BrowserProcessManager',
    'ProxyManager',
    'TempDirectoryManager',
]


================================================
FILE: pydoll/browser/managers/browser_options_manager.py
================================================
from __future__ import annotations

import logging
from typing import TYPE_CHECKING, Optional

from pydoll.browser.interfaces import BrowserOptionsManager
from pydoll.browser.options import ChromiumOptions
from pydoll.exceptions import InvalidOptionsObject

if TYPE_CHECKING:
    from pydoll.browser.options import Options

logger = logging.getLogger(__name__)


class ChromiumOptionsManager(BrowserOptionsManager):
    """
    Options manager for Chromium-based browsers.

    Creates a default ``ChromiumOptions`` when none is supplied, validates the
    type of supplied options, and adds the default launch arguments.
    """

    def __init__(self, options: Optional[Options] = None):
        """
        Store the options to manage.

        Args:
            options: Options supplied by the caller, or None to have defaults
                created by ``initialize_options``.
        """
        self.options = options
        options_type_name = type(options).__name__ if options is not None else "None"
        logger.debug(
            f'ChromiumOptionsManager initialized with options='
            f'{options_type_name}'
        )

    def initialize_options(
        self,
    ) -> ChromiumOptions:
        """
        Produce validated options with the default arguments applied.

        Returns:
            The managed ``ChromiumOptions`` instance.

        Raises:
            InvalidOptionsObject: If provided options is not ChromiumOptions.
        """
        if self.options is None:
            self.options = ChromiumOptions()
            logger.debug('No options provided; created default ChromiumOptions')

        if isinstance(self.options, ChromiumOptions):
            self.add_default_arguments()
            logger.debug('Options initialized and default arguments applied')
            return self.options

        logger.error(f'Invalid options type: {type(self.options)}; expected ChromiumOptions')
        raise InvalidOptionsObject(f'Expected ChromiumOptions, got {type(self.options)}')

    def add_default_arguments(self):
        """Add the default launch arguments to the managed options."""
        logger.debug('Adding default arguments for Chromium-based browsers')
        for default_argument in ('--no-first-run', '--no-default-browser-check'):
            self.options.add_argument(default_argument)


================================================
FILE: pydoll/browser/managers/browser_process_manager.py
================================================
import logging
import subprocess
from typing import Callable, Optional

logger = logging.getLogger(__name__)


class BrowserProcessManager:
    """
    Manages browser process lifecycle for CDP automation.

    Handles process creation, monitoring, and termination with proper
    resource cleanup and graceful shutdown.
    """

    def __init__(
        self,
        process_creator: Optional[Callable[[list[str]], subprocess.Popen]] = None,
    ):
        """
        Initialize browser process manager.

        Args:
            process_creator: Custom function to create browser processes.
                Must accept command list and return subprocess.Popen object.
                Uses default subprocess implementation if None.
        """
        self._process_creator = process_creator or self._default_process_creator
        self._process: Optional[subprocess.Popen] = None
        logger.debug(
            f'BrowserProcessManager initialized; custom process_creator={bool(process_creator)}'
        )

    def start_browser_process(
        self,
        binary_location: str,
        port: int,
        arguments: list[str],
    ) -> subprocess.Popen:
        """
        Launch browser process with CDP debugging enabled.

        Args:
            binary_location: Path to browser executable.
            port: TCP port for CDP WebSocket connections.
            arguments: Additional command-line arguments.

        Returns:
            Started browser process instance.

        Note:
            Automatically adds --remote-debugging-port argument.
        """
        logger.info(f'Starting browser process: {binary_location} on port {port}')
        command = [
            binary_location,
            f'--remote-debugging-port={port}',
            *arguments,
        ]
        logger.debug(f'Command: {command}')
        self._process = self._process_creator(command)
        logger.debug(
            f'Browser process started: pid={self._process.pid if self._process else "unknown"}'
        )
        return self._process

    @staticmethod
    def _default_process_creator(command: list[str]) -> subprocess.Popen:
        """Create browser process with output capture to prevent console clutter."""
        logger.debug(f'Creating process: {command}')
        # NOTE(review): stdout/stderr are piped but nothing visible here reads
        # them; a very chatty child could fill the pipe buffer - confirm
        # whether DEVNULL would be a better fit for callers.
        return subprocess.Popen(command, stdout=subprocess.PIPE, stderr=subprocess.PIPE)

    def stop_process(self):
        """
        Terminate browser process with graceful shutdown.

        Attempts SIGTERM first, then SIGKILL after 15-second timeout. After a
        forced kill the process is waited on so it is reaped and does not
        linger as a zombie. Safe to call even if no process is running.
        """
        if not self._process:
            return

        logger.info(f'Stopping browser process pid={self._process.pid}')
        self._process.terminate()
        try:
            self._process.wait(timeout=15)
            logger.debug('Process terminated gracefully')
        except subprocess.TimeoutExpired:
            logger.warning('Process did not terminate in 15s; sending SIGKILL')
            self._process.kill()
            # Reap the killed child; kill() alone does not collect its status.
            self._process.wait()
            logger.debug('Process killed')


================================================
FILE: pydoll/browser/managers/proxy_manager.py
================================================
from __future__ import annotations

import logging
from typing import TYPE_CHECKING, Optional

if TYPE_CHECKING:
    from pydoll.browser.options import Options

logger = logging.getLogger(__name__)


class ProxyManager:
    """
    Manages proxy configuration and credentials for CDP automation.

    Extracts embedded credentials from proxy URLs, secures authentication
    information, and sanitizes command-line arguments.
    """

    def __init__(self, options: Options):
        """
        Initialize proxy manager with browser options.

        Args:
            options: Browser options potentially containing proxy configuration.
                Will be modified if credentials are found.
        """
        self.options = options
        logger.debug('ProxyManager initialized with options')

    def get_proxy_credentials(self) -> tuple[bool, tuple[Optional[str], Optional[str]]]:
        """
        Extract and secure proxy authentication credentials.

        Searches for proxy settings, extracts embedded credentials,
        and sanitizes options to remove credential exposure.

        Returns:
            Tuple of (has_private_proxy, (username, password)). When no
            credentials are embedded the result is (False, (None, None)).
        """
        proxy_arg = self._find_proxy_argument()
        if proxy_arg is None:
            return False, (None, None)

        index, proxy_value = proxy_arg
        has_credentials, username, password, clean_proxy = self._parse_proxy(proxy_value)
        if not has_credentials:
            logger.debug('Proxy configured without embedded credentials')
            return False, (None, None)

        self._update_proxy_argument(index, clean_proxy)
        logger.debug(f'Proxy credentials extracted (user_set={bool(username)}); argument sanitized')
        return True, (username, password)

    def _find_proxy_argument(self) -> Optional[tuple[int, str]]:
        """
        Find proxy server configuration in browser options.

        Returns:
            Tuple of (index, proxy_url) for the first ``--proxy-server=``
            argument, None when there is none.
        """
        for index, arg in enumerate(self.options.arguments):
            if arg.startswith('--proxy-server='):
                value = arg.split('=', 1)[1]
                # The raw value may still carry user:password, so only the
                # position is logged here, never the value itself.
                logger.debug(f'Found proxy argument at index {index}')
                return index, value
        return None

    @staticmethod
    def _parse_proxy(proxy_value: str) -> tuple[bool, Optional[str], Optional[str], str]:
        """
        Parse proxy URL to extract authentication credentials.

        Args:
            proxy_value: Proxy URL potentially containing username:password@server:port,
                with or without a leading ``scheme://``.

        Returns:
            Tuple of (has_credentials, username, password, clean_proxy_url).
            When no ``user:password`` pair can be extracted, has_credentials is
            False and the original value is returned untouched.
        """
        if '@' not in proxy_value:
            return False, None, None, proxy_value

        scheme, separator, remainder = proxy_value.partition('://')
        if not separator:
            # No scheme: the whole value is "[user:password@]host:port".
            scheme, remainder = '', proxy_value

        # Split on the LAST '@': the server part never contains one, while a
        # password may, so everything before it belongs to the credentials.
        creds_part, _, server_part = remainder.rpartition('@')
        username, colon, password = creds_part.partition(':')
        if not colon:
            # "user@host" (no password separator) is not treated as credentials.
            return False, None, None, proxy_value

        clean_proxy = f'{scheme}://{server_part}' if separator else server_part
        return True, username, password, clean_proxy

    def _update_proxy_argument(self, index: int, clean_proxy: str) -> None:
        """Replace proxy argument with credential-free version."""
        self.options.arguments[index] = f'--proxy-server={clean_proxy}'
        logger.debug(f'Proxy argument updated at index {index}: {clean_proxy}')


================================================
FILE: pydoll/browser/managers/temp_dir_manager.py
================================================
import logging
import os
import shutil
import time
from pathlib import Path
from tempfile import TemporaryDirectory
from typing import Callable

logger = logging.getLogger(__name__)


class TempDirectoryManager:
    """
    Manages temporary directory lifecycle for CDP browser automation.

    Creates isolated temporary directories for browser profiles and handles
    secure cleanup with retry mechanisms for locked files.
    """

    # Exact file names that get a retry when deletion hits PermissionError.
    _LOCKED_FILENAMES = ('CrashpadMetrics-active.pma',)
    # Case-sensitive path fragments that get the same retry treatment.
    _LOCKED_PATH_SUBSTRINGS = ('Safe Browsing', 'Safe Browsing Cookies')
    # Extra patterns commonly locked on Windows; compared against the lowercased path.
    _WINDOWS_LOCKED_SUBSTRINGS = (
        '\\cache\\',
        '/cache/',
        'no_vary_search',
        'journal.baj',
        '\\network\\cookies',
        '/network/cookies',
        'cookies-journal',
        '\\local storage\\',
        '/local storage/',
        '\\local storage\\leveldb\\',
        '/local storage/leveldb/',
        'leveldb',
        'indexeddb',
    )

    def __init__(self, temp_dir_factory: Callable[[], TemporaryDirectory] = TemporaryDirectory):
        """
        Initialize temporary directory manager.

        Args:
            temp_dir_factory: Function to create temporary directories.
                Must return TemporaryDirectory-compatible object.
        """
        self._temp_dir_factory = temp_dir_factory
        self._temp_dirs: list[TemporaryDirectory] = []
        logger.debug('TempDirectoryManager initialized')

    def create_temp_dir(self) -> TemporaryDirectory:
        """
        Create and track new temporary directory for browser use.

        Returns:
            TemporaryDirectory object for browser --user-data-dir argument.
        """
        temp_dir = self._temp_dir_factory()
        self._temp_dirs.append(temp_dir)
        logger.debug(f'Created temp directory: {temp_dir.name}')
        return temp_dir

    @staticmethod
    def retry_process_file(func: Callable[[str], None], path: str, retry_times: int = 10):
        """
        Execute file operation with retry logic for locked files.

        Args:
            func: Function to execute on path.
            path: File or directory path to operate on.
            retry_times: Maximum retry attempts (negative = unlimited).

        Raises:
            PermissionError: If operation fails after all retries. The message
                names the path and the last failure is attached as the cause.
        """
        attempt = 0
        last_error = None
        while retry_times < 0 or attempt < retry_times:
            attempt += 1
            try:
                func(path)
                return
            except PermissionError as exc:
                last_error = exc
                time.sleep(0.1)
                logger.debug(f'Retrying file operation due to PermissionError (attempt {attempt})')
        raise PermissionError(
            f'Could not process locked path after {attempt} attempt(s): {path}'
        ) from last_error

    def _is_known_locked_path(self, path: str) -> bool:
        """Tell whether path matches one of the known lockable browser file patterns."""
        if Path(path).name in self._LOCKED_FILENAMES:
            return True
        if any(fragment in path for fragment in self._LOCKED_PATH_SUBSTRINGS):
            return True
        # The Windows-only patterns are matched case-insensitively.
        path_lc = path.lower()
        return os.name == 'nt' and any(
            fragment in path_lc for fragment in self._WINDOWS_LOCKED_SUBSTRINGS
        )

    def handle_cleanup_error(self, func: Callable[[str], None], path: str, exc_info: tuple):
        """
        Handle errors during directory cleanup with browser-specific workarounds.

        Args:
            func: Original function that failed.
            path: Path that could not be processed.
            exc_info: Exception information tuple (type, value, traceback).

        Raises:
            The original exception value, unless it is a PermissionError on a
            known lockable path (retried, then ignored) or its type is exactly
            OSError (ignored).

        Note:
            Handles Chromium-specific locked files like CrashpadMetrics.
        """
        exc_type, exc_value, _ = exc_info

        if exc_type is PermissionError:
            if self._is_known_locked_path(path):
                try:
                    self.retry_process_file(func, path)
                except PermissionError:
                    logger.warning(f'Ignoring locked Chrome file during cleanup: {path}')
                return
        elif exc_type is OSError:
            return
        raise exc_value

    def cleanup(self):
        """
        Remove all tracked temporary directories with error handling.

        Uses custom error handler for browser-specific file lock issues.
        When a directory survives the first removal pass, up to ten further
        passes are made 0.2s apart before a warning is logged.
        """
        for temp_dir in self._temp_dirs:
            logger.info(f'Cleaning up temp directory: {temp_dir.name}')
            shutil.rmtree(temp_dir.name, onerror=self.handle_cleanup_error)
            remaining = Path(temp_dir.name)
            if not remaining.exists():
                continue

            for attempt in range(10):
                time.sleep(0.2)
                try:
                    shutil.rmtree(temp_dir.name, onerror=self.handle_cleanup_error)
                except Exception as exc:  # noqa: BLE001 - best-effort cleanup
                    # Still best-effort, but leave a trace for diagnosis.
                    logger.debug(f'Cleanup retry #{attempt + 1} failed: {exc!r}')
                if not remaining.exists():
                    logger.debug(
                        f'Temp directory removed after retry #{attempt + 1}: {temp_dir.name}'
                    )
                    break
            if remaining.exists():
                logger.warning(
                    f'Temp directory still present after retries (leftover files may remain): '
                    f'{temp_dir.name}'
                )


================================================
FILE: pydoll/browser/options.py
================================================
from contextlib import suppress

from pydoll.browser.interfaces import Options
from pydoll.constants import PageLoadState
from pydoll.exceptions import (
    ArgumentAlreadyExistsInOptions,
    ArgumentNotFoundInOptions,
    WrongPrefsDict,
)


class ChromiumOptions(Options):
    """
    A class to manage command-line options for a browser instance.

    This class allows the user to specify command-line arguments and
    the binary location of the browser executable, plus the start timeout,
    page load state and a nested dict of browser preferences.
    """

    def __init__(self):
        """
        Initializes the Options instance.

        Sets up an empty list for command-line arguments and a string
        for the binary location of the browser.
        """
        self._arguments = []
        self._binary_location = ''
        self._start_timeout = 10
        self._browser_preferences = {}
        self._headless = False
        self._webrtc_leak_protection = False
        self._page_load_state = PageLoadState.COMPLETE

    @property
    def arguments(self) -> list[str]:
        """
        Gets the list of command-line arguments.

        Returns:
            list: A list of command-line arguments added to the options.
        """
        return self._arguments

    @arguments.setter
    def arguments(self, args_list: list[str]):
        """
        Sets the list of command-line arguments.

        Args:
            args_list (list): A list of command-line arguments.
        """
        self._arguments = args_list

    @property
    def binary_location(self) -> str:
        """
        Gets the location of the browser binary.

        Returns:
            str: The file path to the browser executable.
        """
        return self._binary_location

    @binary_location.setter
    def binary_location(self, location: str):
        """
        Sets the location of the browser binary.

        Args:
            location (str): The file path to the browser executable.
        """
        self._binary_location = location

    @property
    def start_timeout(self) -> int:
        """
        Gets the timeout to verify the browser's running state.

        Returns:
            int: The timeout in seconds.
        """
        return self._start_timeout

    @start_timeout.setter
    def start_timeout(self, timeout: int):
        """
        Sets the timeout to verify the browser's running state.

        Args:
            timeout (int): The timeout in seconds.
        """
        self._start_timeout = timeout

    def add_argument(self, argument: str):
        """
        Adds a command-line argument to the options.

        Args:
            argument (str): The command-line argument to be added.

        Raises:
            ArgumentAlreadyExistsInOptions: If the argument is already in the list of arguments.
        """
        if argument in self._arguments:
            raise ArgumentAlreadyExistsInOptions(f'Argument already exists: {argument}')
        self._arguments.append(argument)

    def remove_argument(self, argument: str):
        """
        Removes a command-line argument from the options.

        Args:
            argument (str): The command-line argument to be removed.

        Raises:
            ArgumentNotFoundInOptions: If the argument is not in the list of arguments.
        """
        if argument not in self._arguments:
            raise ArgumentNotFoundInOptions(f'Argument not found: {argument}')
        self._arguments.remove(argument)

    def _toggle_argument(self, argument: str, enabled: bool):
        """
        Make the presence of a flag in the argument list match ``enabled``.

        Does nothing when the list already agrees with the requested state,
        so it never raises the already-exists / not-found errors itself.

        Args:
            argument: Exact command-line flag to add or remove.
            enabled: Desired presence; any value is coerced with ``bool()``.
        """
        enabled = bool(enabled)
        if enabled == (argument in self.arguments):
            return
        if enabled:
            self.add_argument(argument)
        else:
            self.remove_argument(argument)

    @property
    def browser_preferences(self) -> dict:
        """
        Gets the browser preferences dict.

        Returns:
            dict: The nested preferences accumulated so far.
        """
        return self._browser_preferences

    @browser_preferences.setter
    def browser_preferences(self, preferences: dict):
        """
        Merges new preferences into the existing ones.

        The merge is shallow: a top-level key in ``preferences`` replaces the
        existing value stored under the same key.

        Args:
            preferences (dict): Preferences to merge.

        Raises:
            ValueError: If ``preferences`` is not a dict.
            WrongPrefsDict: If ``preferences`` has a truthy 'prefs' key.
        """
        if not isinstance(preferences, dict):
            raise ValueError('The experimental options value must be a dict.')

        if preferences.get('prefs'):
            raise WrongPrefsDict
        self._browser_preferences = {**self._browser_preferences, **preferences}

    def _set_pref_path(self, path: list, value):
        """
        Safely sets a nested value in self._browser_preferences,
        creating intermediate dicts as needed.

        Arguments:
            path -- List of keys representing the nested
                    path (e.g., ['plugins', 'always_open_pdf_externally'])
            value -- The value to set at the given path
        """
        d = self._browser_preferences
        for key in path[:-1]:
            d = d.setdefault(key, {})
        d[path[-1]] = value

    def _get_pref_path(self, path: list):
        """
        Safely gets a nested value from self._browser_preferences.

        Arguments:
            path -- List of keys representing the nested
                    path (e.g., ['plugins', 'always_open_pdf_externally'])

        Returns:
            The value at the given path, or None if path doesn't exist
        """
        nested_preferences = self._browser_preferences
        # KeyError: missing key; TypeError: an intermediate value is not subscriptable.
        with suppress(KeyError, TypeError):
            for key in path:
                nested_preferences = nested_preferences[key]
            return nested_preferences
        return None

    def set_default_download_directory(self, path: str):
        """
        Set the default directory where downloaded files will be saved.

        Usage: Sets the 'download.default_directory' preference for Chrome.

        Arguments:
            path: Absolute path to the download destination folder.
        """
        self._set_pref_path(['download', 'default_directory'], path)

    def set_accept_languages(self, languages: str):
        """
        Set the accepted languages for the browser.

        Usage: Sets the 'intl.accept_languages' preference.

        Arguments:
            languages: A comma-separated string of language codes (e.g., 'pt-BR,pt,en-US,en').
        """
        self._set_pref_path(['intl', 'accept_languages'], languages)

    @property
    def prompt_for_download(self) -> bool:
        """
        Gets the 'download.prompt_for_download' preference.

        Returns:
            The stored value, or None when the preference has not been set.
        """
        return self._get_pref_path(['download', 'prompt_for_download'])

    @prompt_for_download.setter
    def prompt_for_download(self, enabled: bool):
        """
        Enable or disable download prompt confirmation.

        Usage: Sets the 'download.prompt_for_download' preference.

        Arguments:
            enabled: If True, Chrome will ask for confirmation before downloading.
        """
        self._set_pref_path(['download', 'prompt_for_download'], enabled)

    @property
    def block_popups(self) -> bool:
        """
        Tells whether pop-ups are configured as blocked.

        Returns:
            True only when 'profile.default_content_setting_values.popups' is 0;
            False when it is unset or holds any other value.
        """
        return self._get_pref_path(['profile', 'default_content_setting_values', 'popups']) == 0

    @block_popups.setter
    def block_popups(self, block: bool):
        """
        Block or allow pop-up windows.

        Usage: Sets the 'profile.default_content_setting_values.popups' preference.

        Arguments:
            block: If True, pop-ups will be blocked (value = 0); otherwise allowed (value = 1).
        """
        self._set_pref_path(
            ['profile', 'default_content_setting_values', 'popups'], 0 if block else 1
        )

    @property
    def password_manager_enabled(self) -> bool:
        """
        Gets the 'profile.password_manager_enabled' preference.

        Returns:
            The stored value, or None when the preference has not been set.
        """
        return self._get_pref_path(['profile', 'password_manager_enabled'])

    @password_manager_enabled.setter
    def password_manager_enabled(self, enabled: bool):
        """
        Enable or disable Chrome's password manager.

        Usage: Sets the 'profile.password_manager_enabled' preference and the
        top-level 'credentials_enable_service' preference to the same value.

        Arguments:
            enabled: If True, the password manager is active.
        """
        self._set_pref_path(['profile', 'password_manager_enabled'], enabled)
        self._set_pref_path(['credentials_enable_service'], enabled)

    @property
    def block_notifications(self) -> bool:
        """
        Tells whether site notifications are configured as blocked.

        Returns:
            True only when 'profile.default_content_setting_values.notifications' is 2.
        """
        block_notifications_true_value = 2
        return (
            self._get_pref_path(['profile', 'default_content_setting_values', 'notifications'])
            == block_notifications_true_value
        )

    @block_notifications.setter
    def block_notifications(self, block: bool):
        """
        Block or allow site notifications.

        Usage: Sets the 'profile.default_content_setting_values.notifications' preference.

        Arguments:
            block: If True, notifications will be blocked (value = 2);
            otherwise allowed (value = 1).
        """
        self._set_pref_path(
            ['profile', 'default_content_setting_values', 'notifications'],
            2 if block else 1,
        )

    @property
    def allow_automatic_downloads(self) -> bool:
        """
        Tells whether automatic multiple downloads are configured as allowed.

        Returns:
            True only when
            'profile.default_content_setting_values.automatic_downloads' is 1.
        """
        return (
            self._get_pref_path([
                'profile',
                'default_content_setting_values',
                'automatic_downloads',
            ])
            == 1
        )

    @allow_automatic_downloads.setter
    def allow_automatic_downloads(self, allow: bool):
        """
        Allow or block automatic multiple downloads.

        Usage: Sets the 'profile.default_content_setting_values.automatic_downloads' preference.

        Arguments:
            allow: If True, automatic downloads are allowed (value = 1);
            otherwise blocked (value = 2).
        """
        self._set_pref_path(
            ['profile', 'default_content_setting_values', 'automatic_downloads'],
            1 if allow else 2,
        )

    @property
    def open_pdf_externally(self) -> bool:
        """
        Gets the 'plugins.always_open_pdf_externally' preference.

        Returns:
            The stored value, or None when the preference has not been set.
        """
        return self._get_pref_path(['plugins', 'always_open_pdf_externally'])

    @open_pdf_externally.setter
    def open_pdf_externally(self, enabled: bool):
        """
        Set whether PDFs are always opened externally.

        Usage: Sets the 'plugins.always_open_pdf_externally' preference.

        Arguments:
            enabled: Value stored for the preference.
        """
        self._set_pref_path(['plugins', 'always_open_pdf_externally'], enabled)

    @property
    def headless(self) -> bool:
        """Gets the headless flag as last assigned through the setter."""
        return self._headless

    @headless.setter
    def headless(self, headless: bool):
        """
        Store the headless flag and keep the '--headless' argument in sync.

        Arguments:
            headless: If truthy, '--headless' is added when missing; otherwise
            it is removed when present.
        """
        self._headless = headless
        self._toggle_argument('--headless', headless)

    @property
    def webrtc_leak_protection(self) -> bool:
        """Gets the WebRTC leak protection flag as last assigned through the setter."""
        return self._webrtc_leak_protection

    @webrtc_leak_protection.setter
    def webrtc_leak_protection(self, enabled: bool):
        """
        Store the flag and keep the WebRTC IP handling argument in sync.

        Arguments:
            enabled: If truthy,
            '--force-webrtc-ip-handling-policy=disable_non_proxied_udp' is added
            when missing; otherwise it is removed when present.
        """
        self._webrtc_leak_protection = enabled
        self._toggle_argument(
            '--force-webrtc-ip-handling-policy=disable_non_proxied_udp', enabled
        )

    @property
    def page_load_state(self) -> PageLoadState:
        """Gets the configured page load state (PageLoadState.COMPLETE by default)."""
        return self._page_load_state

    @page_load_state.setter
    def page_load_state(self, state: PageLoadState):
        """
        Sets the page load state.

        Arguments:
            state: The PageLoadState value to store.
        """
        self._page_load_state = state


================================================
FILE: pydoll/browser/requests/__init__.py
================================================
"""
This module provides HTTP client functionality using the browser's fetch API.
It allows making HTTP requests within the browser context, reusing cookies and headers.
"""

from .har_recorder import HarCapture
from .request import Request
from .response import Response

# Names re-exported as the public interface of this package.
__all__ = ['HarCapture', 'Request', 'Response']


================================================
FILE: pydoll/browser/requests/har_recorder.py
================================================
"""HAR network recorder for capturing and replaying browser network traffic.

This module provides the internal recording engine (HarRecorder) and the
user-facing recording object (HarCapture) that together enable HAR 1.2
capture and export from browser sessions.
"""

from __future__ import annotations

import asyncio
import base64
import json
import logging
from datetime import datetime, timezone
from importlib.metadata import version as _pkg_version
from pathlib import Path
from typing import TYPE_CHECKING, Any, Callable, cast
from urllib.parse import parse_qs, urlparse

from pydoll.commands.network_commands import NetworkCommands
from pydoll.protocol.network.events import (
    DataReceivedEvent,
    LoadingFailedEvent,
    LoadingFinishedEvent,
    NetworkEvent,
    RequestWillBeSentEvent,
    RequestWillBeSentExtraInfoEvent,
    ResponseReceivedEvent,
    ResponseReceivedExtraInfoEvent,
)
from pydoll.protocol.network.har_types import (
    Har,
    HarContent,
    HarCookie,
    HarCreator,
    HarEntry,
    HarHeader,
    HarLog,
    HarPostData,
    HarQueryParam,
    HarRequest,
    HarResponse,
    HarTimings,
)
from pydoll.protocol.network.types import ResourceType

if TYPE_CHECKING:
    from pydoll.browser.tab import Tab
    from pydoll.protocol.network.methods import GetResponseBodyResponse
    from pydoll.protocol.network.types import ResourceTiming
    from pydoll.protocol.network.types import Response as CDPResponse

logger = logging.getLogger(__name__)

# Creator name constant; presumably written into the HAR "creator" section — TODO confirm.
_PYDOLL_CREATOR_NAME = 'pydoll'
# HTTP status code 304 (Not Modified).
_HTTP_NOT_MODIFIED = 304


def _get_pydoll_version() -> str:
    """Get the installed pydoll version."""
    try:
        return _pkg_version('pydoll')
    except Exception:
        return 'unknown'


class HarRecorder:
    """Internal engine that listens to CDP network events and builds HAR entries.

    This class registers callbacks for 7 CDP Network events, correlates them
    by requestId, and builds HAR 1.2 entries. It is not intended for direct
    use — instead, use ``tab.request.record()`` which wraps this engine.
    """

    def __init__(self, tab: Tab, resource_types: list[ResourceType] | None = None):
        self._tab = tab
        self._resource_types = frozenset(resource_types) if resource_types else None
        self._callback_ids: list[int] = []
        self._pending: dict[str, dict[str, Any]] = {}
        self._entries: list[HarEntry] = []
        self._start_time: datetime | None = None
        self._network_was_enabled: bool = False
        self._body_tasks: list[asyncio.Task] = []
        self._data_received_sizes: dict[str, int] = {}

    async def start(self) -> None:
        """Begin recording network traffic on the tab.

        Turns network events on when the tab does not have them enabled yet
        (remembering that this recorder did so), stamps the start time in UTC,
        and subscribes one handler per CDP Network event used to build entries.
        """
        if not self._tab.network_events_enabled:
            await self._tab.enable_network_events()
            # Remember that the recorder itself switched network events on.
            self._network_was_enabled = True
            logger.debug('HAR recorder enabled network events')

        self._start_time = datetime.now(tz=timezone.utc)

        handler_type = Callable[[dict], Any]
        subscriptions: list[tuple[str, handler_type]] = [
            (
                NetworkEvent.REQUEST_WILL_BE_SENT,
                cast(handler_type, self._on_request_will_be_sent),
            ),
            (
                NetworkEvent.REQUEST_WILL_BE_SENT_EXTRA_INFO,
                cast(handler_type, self._on_request_extra_info),
            ),
            (
                NetworkEvent.RESPONSE_RECEIVED,
                cast(handler_type, self._on_response_received),
            ),
            (
                NetworkEvent.RESPONSE_RECEIVED_EXTRA_INFO,
                cast(handler_type, self._on_response_extra_info),
            ),
            (
                NetworkEvent.DATA_RECEIVED,
                cast(handler_type, self._on_data_received),
            ),
            (
                NetworkEvent.LOADING_FINISHED,
                cast(handler_type, self._on_loading_finished),
            ),
            (
                NetworkEvent.LOADING_FAILED,
                cast(handler_type, self._on_loading_failed),
            ),
        ]

        for cdp_event, listener in subscriptions:
            registered_id = await self._tab.on(cdp_event, listener)
            self._callback_ids.append(registered_id)

        logger.info('HAR recorder started, registered %d callbacks', len(self._callback_ids))

    async def stop(self) -> None:
        """Stop recording and clean up.

        Removes all registered callbacks, waits for pending body fetches,
        flushes pending entries, and optionally disables network events.
        """
        for callback_id in self._callback_ids:
            await self._tab.remove_callback(callback_id)
        self._callback_ids.clear()

        if self._body_tasks:
            await asyncio.gather(*self._body_tasks, return_exceptions=True)
            self._body_tasks.clear()

        self._flush_pending()

        if self._network_was_enabled:
            await self._tab.disable_network_events()
            self._network_was_enabled = False

        logger.info('HAR recorder stopped, captured %d entries', len(self._entries))

    def _on_request_will_be_sent(self, event: RequestWillBeSentEvent) -> None:
        """Handle Network.requestWillBeSent event."""
        params = event['params']
        request_id = params['requestId']
        request_data = params['request']
        resource_type = params.get('type', '')
        redirect_response = params.get('redirectResponse')

        if self._resource_types and resource_type not in self._resource_types:
            return

        if redirect_response and request_id in self._pending:
            self._finalize_redirect_entry(request_id, redirect_response)

        self._pending[request_id] = {
            'url': request_data.get('url', ''),
            'method': request_data.get('method', 'GET'),
            'request_headers': request_data.get('headers', {}),
            'post_data': request_data.get('postData'),
            'wall_time': params['wallTime'],
            'resource_type': params.get('type', ''),
            'timestamp': params['timestamp'],
        }
        logger.debug('HAR: request will be sent: %s %s', request_id, request_data.get('url', ''))

    def _on_request_extra_info(self, event: RequestWillBeSentExtraInfoEvent) -> None:
        """Handle Network.requestWillBeSentExtraInfo event."""
        params = event['params']
        request_id = params['requestId']
        pending = self._pending.get(request_id)
        if not pending:
            return

        extra_headers = params.get('headers', {})
        if extra_headers:
            pending['request_headers_extra'] = extra_headers
        logger.debug('HAR: request extra info: %s', request_id)

    def _on_response_received(self, event: ResponseReceivedEvent) -> None:
        """Handle Network.responseReceived event."""
        params = event['params']
        request_id = params['requestId']
        pending = self._pending.get(request_id)
        if not pending:
            return

        response = params['response']
        pending['status'] = response['status']
        pending['status_text'] = response['statusText']
        pending['response_headers'] = response.get('headers', {})
        pending['mime_type'] = response['mimeType']
        pending['protocol'] = response.get('protocol', '')
        pending['timing'] = response.get('timing')
        pending['remote_ip'] = response.get('remoteIPAddress', '')
        pending['connection_id'] = str(response.get('connectionId', ''))
        pending['encoded_data_length'] = response.get('encodedDataLength', 0)
        pending['response_timestamp'] = params['timestamp']
        logger.debug('HAR: response received: %s status=%s', request_id, response['status'])

    def _on_response_extra_info(self, event: ResponseReceivedExtraInfoEvent) -> None:
        """Handle Network.responseReceivedExtraInfo event."""
        params = event['params']
        request_id = params['requestId']
        pending = self._pending.get(request_id)
        if not pending:
            return

        extra_headers = params.get('headers', {})
        if extra_headers:
            pending['response_headers_extra'] = extra_headers
        status_code = params.get('statusCode')
        if status_code is not None:
            pending['extra_status_code'] = status_code
        logger.debug('HAR: response extra info: %s', request_id)

    def _on_data_received(self, event: DataReceivedEvent) -> None:
        """Handle Network.dataReceived event.

        Accumulates body chunk bytes per requestId for accurate bodySize.
        """
        params = event['params']
        request_id = params['requestId']
        chunk_size = params['encodedDataLength']
        self._data_received_sizes[request_id] = (
            self._data_received_sizes.get(request_id, 0) + chunk_size
        )

    def _on_loading_finished(self, event: LoadingFinishedEvent) -> None:
        """Handle Network.loadingFinished event."""
        params = event['params']
        request_id = params['requestId']
        pending = self._pending.get(request_id)
        if not pending:
            return

        pending['transfer_size'] = params['encodedDataLength']
        pending['finished_timestamp'] = params['timestamp']
        pending['body_bytes'] = self._data_received_sizes.pop(request_id, -1)

        task = asyncio.create_task(self._finalize_entry(request_id))
        self._body_tasks.append(task)
        task.add_done_callback(
            lambda t: self._body_tasks.remove(t) if t in self._body_tasks else None
        )
        logger.debug('HAR: loading finished: %s', request_id)

    def _on_loading_failed(self, event: LoadingFailedEvent) -> None:
        """Handle Network.loadingFailed event."""
        params = event['params']
        request_id = params['requestId']
        pending = self._pending.pop(request_id, None)
        if not pending:
            return

        self._data_received_sizes.pop(request_id, None)
        pending.setdefault('status', 0)
        pending.setdefault('status_text', params.get('errorText', 'Failed'))
        pending['error_text'] = params['errorText']
        pending['canceled'] = params.get('canceled', False)

        entry = self._build_entry(pending)
        self._entries.append(entry)
        logger.debug('HAR: loading failed: %s error=%s', request_id, params.get('errorText'))

    async def _finalize_entry(self, request_id: str) -> None:
        """Fetch response body and build the final HAR entry."""
        pending = self._pending.pop(request_id, None)
        if not pending:
            return

        body, base64_encoded = await self._fetch_response_body(request_id)
        pending['response_body'] = body
        pending['response_body_base64'] = base64_encoded

        entry = self._build_entry(pending)
        self._entries.append(entry)

    def _finalize_redirect_entry(self, request_id: str, redirect_response: CDPResponse) -> None:
        """Close out the pending record of a request that was redirected.

        The redirect response supplies the status line, headers, MIME type,
        protocol and timing of the hop. The finished entry is appended to the
        recorded entries. Unknown request IDs are ignored.

        Args:
            request_id: CDP request identifier shared by the redirect chain.
            redirect_response: Response data describing the redirect hop.
        """
        hop = self._pending.pop(request_id, None)
        if not hop:
            return

        hop['body_bytes'] = self._data_received_sizes.pop(request_id, -1)
        hop.update({
            'status': redirect_response.get('status', 302),
            'status_text': redirect_response.get('statusText', ''),
            'response_headers': redirect_response.get('headers', {}),
            'mime_type': redirect_response.get('mimeType', ''),
            'protocol': redirect_response.get('protocol', ''),
            'timing': redirect_response.get('timing'),
        })

        self._entries.append(self._build_entry(hop))
        logger.debug(
            'HAR: redirect finalized: %s → %s', request_id, redirect_response.get('status')
        )

    def _flush_pending(self) -> None:
        """Turn every still-pending request into a HAR entry.

        Records that never received a status get ``status`` 0 and the status
        text ``'(pending)'``.
        """
        # Snapshot the keys first: the dict is mutated while we walk it.
        for request_id in tuple(self._pending):
            leftover = self._pending.pop(request_id)
            if 'status' not in leftover:
                leftover['status'] = 0
            if 'status_text' not in leftover:
                leftover['status_text'] = '(pending)'
            self._entries.append(self._build_entry(leftover))
        logger.debug('HAR: flushed pending entries')

    async def _fetch_response_body(self, request_id: str) -> tuple[str, bool]:
        """Retrieve a response body through Network.getResponseBody.

        This is best-effort: any exception raised while issuing the command or
        reading its result is logged at debug level and swallowed.

        Args:
            request_id: CDP request identifier whose body should be fetched.

        Returns:
            Tuple of (body_text, is_base64_encoded). Returns ('', False) on failure.
        """
        try:
            reply: GetResponseBodyResponse = await self._tab._execute_command(
                NetworkCommands.get_response_body(request_id)
            )
            payload = reply['result']
            return payload['body'], payload['base64Encoded']
        except Exception:
            logger.debug('HAR: failed to fetch response body for %s', request_id)
            return '', False

    def _build_entry(self, pending: dict[str, Any]) -> HarEntry:
        """Assemble a HAR entry from the data accumulated for one request.

        Args:
            pending: Accumulated per-request data (headers, URL, protocol,
                timestamps, timing, optional body and connection details).

        Returns:
            The HAR entry, including optional ``serverIPAddress``,
            ``connection`` and ``_resourceType`` fields when the matching
            pending values are truthy.
        """
        # The "extra" header sets take precedence whenever they are non-empty.
        request_headers = pending.get('request_headers_extra') or pending.get(
            'request_headers', {}
        )
        response_headers = pending.get('response_headers_extra') or pending.get(
            'response_headers', {}
        )
        target_url = pending.get('url', '')
        http_version = self._normalize_http_version(pending.get('protocol', ''))

        har_request = self._build_har_request(
            target_url, pending, request_headers, http_version, pending.get('post_data')
        )
        har_response = self._build_har_response(pending, response_headers, http_version)

        # Receive time is only known when both timestamps exist and are ordered.
        headers_at: float = pending.get('response_timestamp', 0)
        done_at: float = pending.get('finished_timestamp', 0)
        receive_ms: float | None
        if headers_at and done_at and done_at > headers_at:
            receive_ms = (done_at - headers_at) * 1000
        else:
            receive_ms = None

        har_timings = self._build_har_timings(pending.get('timing'), receive_ms)
        # Sum without ssl — connect already includes it per HAR 1.2 spec
        counted_phases = ('blocked', 'dns', 'connect', 'send', 'wait', 'receive')
        total_time = sum(
            har_timings[phase]  # type: ignore[literal-required]
            for phase in counted_phases
            if har_timings[phase] > 0  # type: ignore[literal-required]
        )

        entry = HarEntry(
            startedDateTime=self._wall_time_to_iso(pending.get('wall_time', 0)),
            time=round(total_time, 2),
            request=har_request,
            response=har_response,
            cache={},
            timings=har_timings,
        )

        # Optional fields are emitted only when a truthy value was captured.
        optional_fields = {
            'remote_ip': 'serverIPAddress',
            'connection_id': 'connection',
            'resource_type': '_resourceType',
        }
        for source_key, har_field in optional_fields.items():
            captured = pending.get(source_key, '')
            if captured:
                entry[har_field] = captured  # type: ignore[literal-required]

        return entry

    def _build_har_request(
        self,
        url: str,
        pending: dict[str, Any],
        headers: dict[str, str],
        protocol: str,
        post_data_text: str | None,
    ) -> HarRequest:
        """Create the request half of a HAR entry.

        Args:
            url: Request URL; also the source of the parsed query string.
            pending: Accumulated request data; ``method`` is read from it
                (defaulting to ``'GET'``).
            headers: Request headers used for the header list, cookies and
                the post-data MIME type.
            protocol: Already-normalized HTTP version string.
            post_data_text: Request body text, if any.

        Returns:
            The HarRequest, with ``postData`` attached when a body is present.
        """
        if post_data_text:
            body_size = len(post_data_text.encode('utf-8'))
        else:
            body_size = 0

        har_request = HarRequest(
            method=pending.get('method', 'GET'),
            url=url,
            httpVersion=protocol,
            cookies=self._parse_request_cookies(headers),
            headers=self._headers_dict_to_list(headers),
            queryString=self._parse_query_string(url),
            headersSize=-1,
            bodySize=body_size,
        )
        if not post_data_text:
            return har_request

        # Header name may arrive in either capitalisation.
        lowercase_fallback = headers.get('content-type', '')
        content_type = headers.get('Content-Type', lowercase_fallback)
        har_request['postData'] = HarPostData(mimeType=content_type, text=post_data_text)
        return har_request

    def _build_har_response(
        self,
        pending: dict[str, Any],
        headers: dict[str, str],
        protocol: str,
    ) -> HarResponse:
        """Create the response half of a HAR entry.

        Args:
            pending: Accumulated response data (body, base64 flag, status,
                MIME type, received byte count).
            headers: Response headers used for the header list, cookies and
                the redirect URL.
            protocol: Already-normalized HTTP version string.

        Returns:
            The HarResponse with its content, cookies and size fields filled in.
        """
        payload = pending.get('response_body', '')
        is_base64 = pending.get('response_body_base64', False)
        status = pending.get('extra_status_code', pending.get('status', 0))

        # Content size is the decoded byte length of whatever body we hold.
        content_size = 0
        if payload:
            if is_base64:
                try:
                    content_size = len(base64.b64decode(payload))
                except Exception:
                    # Undecodable base64: fall back to the raw text length.
                    content_size = len(payload)
            else:
                content_size = len(payload.encode('utf-8'))

        har_content = HarContent(size=content_size, mimeType=pending.get('mime_type', ''))
        if payload:
            har_content['text'] = payload
            if is_base64:
                har_content['encoding'] = 'base64'

        # bodySize from dataReceived chunks (actual body bytes, no header overhead)
        # For 304 (cache hit), bodySize must be 0 per HAR spec
        # When body_bytes is 0 but content exists (e.g. file:// protocol),
        # fall back to content_size for consistency with content.size/text.
        body_bytes = pending.get('body_bytes', -1)
        if status == _HTTP_NOT_MODIFIED:
            body_size = 0
        else:
            body_size = next(
                (size for size in (body_bytes, content_size) if size > 0),
                -1,
            )

        lowercase_location = headers.get('location', '')
        redirect_url = headers.get('Location', lowercase_location)
        return HarResponse(
            status=status,
            statusText=pending.get('status_text', ''),
            httpVersion=protocol,
            cookies=self._parse_response_cookies(headers),
            headers=self._headers_dict_to_list(headers),
            content=har_content,
            redirectURL=redirect_url,
            headersSize=-1,
            bodySize=body_size,
        )

    @staticmethod
    def _build_har_timings(
        timing: ResourceTiming | None,
        receive_ms: float | None = None,
    ) -> HarTimings:
        """Translate CDP ResourceTiming into HAR timings (milliseconds).

        Args:
            timing: CDP ResourceTiming from responseReceived, or None when
                no timing data was captured.
            receive_ms: Receive duration computed from monotonic timestamps
                (loadingFinished.timestamp - responseReceived.timestamp).
                Used as the ``receive`` value; 0 is reported when omitted.

        Returns:
            HarTimings where phases without data are reported as -1.
        """
        receive = 0 if receive_ms is None else round(receive_ms, 3)

        if not timing:
            return HarTimings(
                blocked=-1,
                dns=-1,
                connect=-1,
                ssl=-1,
                send=0,
                wait=0,
                receive=receive,
            )

        def _optional_span(start_key: str, end_key: str) -> float:
            # -1 marks a phase that did not happen (either bound negative).
            begin: float = timing.get(start_key, -1)
            finish: float = timing.get(end_key, -1)
            if begin < 0 or finish < 0:
                return -1
            return round(max(finish - begin, 0), 3)

        dns_start: float = timing.get('dnsStart', -1)
        connect_start: float = timing.get('connectStart', -1)
        send_start: float = timing.get('sendStart', 0)
        send_end: float = timing.get('sendEnd', 0)
        headers_start: float = timing.get('receiveHeadersStart', 0)

        # "blocked" lasts until the first phase that actually started.
        first_activity = next(
            (start for start in (dns_start, connect_start) if start >= 0),
            send_start,
        )
        return HarTimings(
            blocked=round(max(first_activity, 0), 3),
            dns=_optional_span('dnsStart', 'dnsEnd'),
            connect=_optional_span('connectStart', 'connectEnd'),
            ssl=_optional_span('sslStart', 'sslEnd'),
            send=round(max(send_end - send_start, 0), 3),
            wait=round(max(headers_start - send_end, 0), 3),
            receive=receive,
        )

    @staticmethod
    def _normalize_http_version(protocol: str) -> str:
        """Normalize CDP protocol string to HAR httpVersion format.

        CDP reports protocols like 'h2', 'h3', 'http/1.0', 'http/1.1',
        or non-HTTP strings like 'file'. HAR viewers expect uppercase
        HTTP versions (e.g. 'HTTP/1.1', 'h2', 'h3').
        """
        if not protocol:
            return ''
        lower = protocol.lower()
        if lower in {'h2', 'h3', 'h2c'}:
            return lower
        if lower.startswith('http/'):
            return protocol.upper()
        return ''

    @staticmethod
    def _headers_dict_to_list(headers: dict[str, str]) -> list[HarHeader]:
        """Turn a header mapping into the HAR list-of-headers form.

        Args:
            headers: Header names mapped to their values.

        Returns:
            One HarHeader per mapping item, in the mapping's iteration order.
        """
        har_headers: list[HarHeader] = []
        for header_name in headers:
            har_headers.append(HarHeader(name=header_name, value=headers[header_name]))
        return har_headers

    @staticmethod
    def _parse_query_string(url: str) -> list[HarQueryParam]:
        """Extract the query parameters of a URL as HAR query params.

        Blank values are kept. Parameters are grouped by name, so repeated
        names appear consecutively in the result.

        Args:
            url: URL whose query component should be parsed.

        Returns:
            A list of HarQueryParam items; empty when the URL has no query.
        """
        query = urlparse(url).query
        if not query:
            return []

        grouped = parse_qs(query, keep_blank_values=True)
        return [
            HarQueryParam(name=param_name, value=param_value)
            for param_name, param_values in grouped.items()
            for param_value in param_values
        ]

    @staticmethod
    def _wall_time_to_iso(wall_time: float) -> str:
        """Convert a CDP wallTime (seconds since epoch) to ISO 8601 string."""
        if not wall_time:
            return datetime.now(tz=timezone.utc).isoformat()
        return datetime.fromtimestamp(wall_time, tz=timezone.utc).isoformat()

    @staticmethod
    def _parse_request_cookies(headers: dict[str, str]) -> list[HarCookie]:
        """Split the ``Cookie`` request header into HAR cookies.

        Segments without ``=`` or with an empty name are skipped. Names and
        values are stripped of surrounding whitespace.

        Args:
            headers: Request headers; ``Cookie`` is looked up first, then
                ``cookie``.

        Returns:
            One HarCookie per valid ``name=value`` pair, in header order.
        """
        lowercase_fallback = headers.get('cookie', '')
        cookie_header = headers.get('Cookie', lowercase_fallback)
        if not cookie_header:
            return []

        parsed: list[HarCookie] = []
        for segment in cookie_header.split(';'):
            key, separator, val = segment.strip().partition('=')
            key = key.strip()
            if separator and key:
                parsed.append(HarCookie(name=key, value=val.strip()))
        return parsed

    @staticmethod
    def _parse_response_cookies(headers: dict[str, str]) -> list[HarCookie]:
        """Parse response cookies from Set-Cookie headers.

        The header value is split on newlines, one cookie per line. Each line
        is ``name=value`` followed by optional ``;``-separated attributes, of
        which ``HttpOnly``, ``Secure``, ``Path`` and ``Domain`` are recorded.
        Attribute names are matched case-insensitively, but attribute values
        keep their original case.

        Args:
            headers: Response headers; ``Set-Cookie`` is looked up first,
                then ``set-cookie``.

        Returns:
            One HarCookie per well-formed line. Lines whose first segment has
            no ``=`` or an empty name are skipped.
        """
        set_cookie = headers.get('Set-Cookie', headers.get('set-cookie', ''))
        if not set_cookie:
            return []

        cookies: list[HarCookie] = []
        for raw_line in set_cookie.split('\n'):
            name_value, *attrs = raw_line.strip().split(';')
            # Look for '=' in the name/value segment itself. A line such as
            # 'foo; Path=/' has '=' only in an attribute and must be skipped
            # rather than crash the unpack.
            name, separator, value = name_value.partition('=')
            name = name.strip()
            if not separator or not name:
                continue

            cookie = HarCookie(name=name, value=value.strip())
            for raw_attr in attrs:
                attr = raw_attr.strip()
                attr_lower = attr.lower()
                if attr_lower == 'httponly':
                    cookie['httpOnly'] = True
                elif attr_lower == 'secure':
                    cookie['secure'] = True
                elif attr_lower.startswith('path='):
                    # Take the value from the original text so its case is kept.
                    cookie['path'] = attr.split('=', 1)[1]
                elif attr_lower.startswith('domain='):
                    cookie['domain'] = attr.split('=', 1)[1]
            cookies.append(cookie)
        return cookies


class HarCapture:
    """Handle yielded by the ``tab.request.record()`` context manager.

    Wraps a recorder and exposes its entries, sorted by start time, along
    with helpers to build and save a HAR 1.2 document.
    """

    def __init__(self, recorder: HarRecorder):
        """Bind the capture to the recorder whose entries it exposes.

        Args:
            recorder: Recorder that accumulates the HAR entries.
        """
        self._recorder = recorder

    @property
    def entries(self) -> list[HarEntry]:
        """Return a new list of recorded entries ordered by ``startedDateTime``."""
        ordered = list(self._recorder._entries)
        ordered.sort(key=lambda item: item['startedDateTime'])
        return ordered

    def to_dict(self) -> Har:
        """Assemble the complete HAR 1.2 document for the recording.

        Returns:
            A complete HAR 1.2 dict ready for JSON serialization.
        """
        creator = HarCreator(
            name=_PYDOLL_CREATOR_NAME,
            version=_get_pydoll_version(),
        )
        log = HarLog(
            version='1.2',
            creator=creator,
            pages=[],
            entries=self.entries,
        )
        return Har(log=log)

    def save(self, path: str | Path) -> None:
        """Write the recording to disk as a HAR 1.2 JSON file.

        Missing parent directories are created.

        Args:
            path: File path to write the HAR file to.
        """
        document = self.to_dict()
        target = Path(path)
        target.parent.mkdir(parents=True, exist_ok=True)
        with target.open('w', encoding='utf-8') as handle:
            json.dump(document, handle, indent=2, ensure_ascii=False)
        logger.info('HAR recording saved to %s (%d entries)', path, len(self._recorder._entries))


================================================
FILE: pydoll/browser/requests/request.py
================================================
"""
This module provides a Request class that mimics the behavior of requests.
It allows making HTTP requests using the browser's fetch API.
"""

from __future__ import annotations

import json as jsonlib
import logging
from collections.abc import AsyncIterator
from contextlib import asynccontextmanager
from typing import TYPE_CHECKING, Any, Callable, Optional, Union, cast
from urllib.parse import parse_qs, urlencode, urlparse, urlunparse

from pydoll.browser.requests.har_recorder import HarCapture, HarRecorder
from pydoll.browser.requests.response import Response
from pydoll.commands.runtime_commands import RuntimeCommands
from pydoll.constants import Scripts
from pydoll.exceptions import HTTPError
from pydoll.protocol.fetch.types import HeaderEntry
from pydoll.protocol.network.events import (
    NetworkEvent,
    RequestWillBeSentEvent,
    RequestWillBeSentExtraInfoEvent,
    ResponseReceivedEvent,
    ResponseReceivedExtraInfoEvent,
    ResponseReceivedExtraInfoEventParams,
)
from pydoll.protocol.network.types import CookieParam, ResourceType

# Module-level logger shared by the helpers in this file.
logger = logging.getLogger(__name__)

# Runtime aliases: these unions are passed to ``cast`` when network events
# are collected, so they must exist outside the TYPE_CHECKING block.
# Events describing a received response (regular and "extra info" variants).
RequestReceivedEvent = Union[
    ResponseReceivedEvent,
    ResponseReceivedExtraInfoEvent,
]
# Events describing an outgoing request (regular and "extra info" variants).
RequestSentEvent = Union[
    RequestWillBeSentEvent,
    RequestWillBeSentExtraInfoEvent,
]

# Names below are needed only for annotations; they are imported under
# TYPE_CHECKING so they are not imported at runtime.
if TYPE_CHECKING:
    from pydoll.browser.tab import Tab
    from pydoll.protocol.network.events import (
        RequestWillBeSentEventParams,
        RequestWillBeSentExtraInfoEventParams,
        ResponseReceivedEventParams,
    )
    from pydoll.protocol.runtime.methods import EvaluateResponse

    # ``params`` payload types matching the event unions above.
    RequestReceivedEventParams = Union[
        ResponseReceivedEventParams,
        ResponseReceivedExtraInfoEventParams,
    ]
    RequestSentEventParams = Union[
        RequestWillBeSentEventParams,
        RequestWillBeSentExtraInfoEventParams,
    ]


class Request:
    """High-level interface for making HTTP requests using the browser's fetch API.

    This class provides a requests-like interface that executes HTTP requests in the
    browser's JavaScript context. All requests inherit the browser's current session
    state including cookies, authentication headers, and other automatic browser
    behaviors. This allows for seamless interaction with websites that require
    authentication or have complex cookie management.

    Key Features:
    - Executes requests in the browser's JavaScript context using fetch API
    - Automatically includes browser cookies and session state
    - Preserves browser's security context and CORS policies
    - Captures both request and response headers for analysis
    - Supports all standard HTTP methods (GET, POST, PUT, DELETE, etc.)

    Note:
    - Headers passed to methods are additional headers, not replacements
    - Browser's automatic headers (User-Agent, Accept, etc.) are preserved
    - Cookies are managed automatically by the browser
    """

    def __init__(self, tab: Tab):
        """Create a request helper tied to one browser tab.

        Args:
            tab: Tab in which requests are executed. It provides the
                JavaScript execution context and carries the browser's
                session state (cookies, authentication, etc.).
        """
        # Captured network events and the IDs of the listeners that fill them.
        self._requests_received: list[RequestReceivedEvent] = []
        self._requests_sent: list[RequestSentEvent] = []
        self._callback_ids: list[int] = []
        # True only while this helper itself has switched network events on.
        self._network_events_enabled = False
        self.tab = tab
        logger.debug('Request helper initialized for tab')

    async def request(
        self,
        method: str,
        url: str,
        params: Optional[dict[str, str]] = None,
        data: Optional[Union[dict, list, tuple, str, bytes]] = None,
        json: Optional[dict[str, Any]] = None,
        headers: Optional[list[HeaderEntry]] = None,
        **kwargs,
    ) -> Response:
        """Perform an HTTP request through the browser's fetch API.

        The request runs in the tab's JavaScript context, so it carries the
        browser's cookies, authentication and security context exactly as a
        request issued by the page itself would.

        Args:
            method: HTTP method (GET, POST, PUT, DELETE, etc.). It is
                upper-cased before being sent.
            url: Target URL for the request. Can be relative or absolute.
            params: Query parameters merged into the URL's query string.
            data: Request body data. Behavior depends on type:
                - dict/list/tuple: URL-encoded as form data
                  (application/x-www-form-urlencoded)
                - str/bytes: Sent as-is with no Content-Type modification
                Ignored when 'json' is given.
            json: Data to be JSON-serialized as request body. Sets
                Content-Type to application/json unless already provided.
            headers: Additional headers to include. These are ADDED to the
                browser's automatic headers, not replacements.
                Format: [{'name': 'X-Custom', 'value': 'value'}]
            **kwargs: Additional fetch API options (e.g., credentials, mode, cache).

        Returns:
            Response object containing status, headers, content, and cookies
            from both the request and response phases.

        Raises:
            HTTPError: If executing the fetch or building the response fails.

        Note:
            Network listeners registered for the request are always removed
            afterwards, whether it succeeded or failed.
        """
        final_url = self._build_url_with_params(url, params)
        fetch_options = self._build_request_options(method, headers, json, data, **kwargs)
        logger.info(f'Executing request: method={method.upper()}, url={final_url}')
        logger.debug(
            f'Executing request: method={method.upper()}, url={final_url}, '
            f'headers={bool(headers)}, json={json is not None}, data={data is not None}'
        )
        try:
            fetch_result = await self._execute_fetch_request(final_url, fetch_options)
            # Arguments are evaluated in order: received, sent, then cookies.
            return self._build_response(
                fetch_result,
                self._extract_received_headers(),
                self._extract_sent_headers(),
                self._extract_set_cookies(),
            )

        except Exception as exc:
            logger.error(f'Request failed: {exc}')
            raise HTTPError(f'Request failed: {str(exc)}') from exc

        finally:
            await self._clear_callbacks()

    async def get(
        self,
        url: str,
        params: Optional[dict[str, str]] = None,
        **kwargs,
    ) -> Response:
        """Execute a GET request for retrieving data.

        Args:
            url: Target URL to retrieve data from.
            params: Query parameters to append to URL.
            **kwargs: Additional fetch options.

        Returns:
            Response object with retrieved data.
        """
        return await self.request('GET', url, params=params, **kwargs)

    async def post(
        self,
        url: str,
        data: Optional[Union[dict, list, tuple, str, bytes]] = None,
        json: Optional[dict[str, Any]] = None,
        **kwargs,
    ) -> Response:
        """Execute a POST request for creating or submitting data.

        Args:
            url: Target URL for data submission.
            data: Form data to submit (URL-encoded).
            json: JSON data to submit.
            **kwargs: Additional fetch options.

        Returns:
            Response object with server's response to the submission.
        """
        return await self.request('POST', url, data=data, json=json, **kwargs)

    async def put(
        self,
        url: str,
        data: Optional[Union[dict, list, tuple, str, bytes]] = None,
        json: Optional[dict[str, Any]] = None,
        **kwargs,
    ) -> Response:
        """Execute a PUT request for updating/replacing resources.

        Args:
            url: Target URL of resource to update.
            data: Form data for the update.
            json: JSON data for the update.
            **kwargs: Additional fetch options.

        Returns:
            Response object confirming the update operation.
        """
        return await self.request('PUT', url, data=data, json=json, **kwargs)

    async def patch(
        self,
        url: str,
        data: Optional[Union[dict, list, tuple, str, bytes]] = None,
        json: Optional[dict[str, Any]] = None,
        **kwargs,
    ) -> Response:
        """Execute a PATCH request for partial resource updates.

        Args:
            url: Target URL of resource to partially update.
            data: Form data with changes to apply.
            json: JSON data with changes to apply.
            **kwargs: Additional fetch options.

        Returns:
            Response object confirming the partial update.
        """
        return await self.request('PATCH', url, data=data, json=json, **kwargs)

    async def delete(self, url: str, **kwargs) -> Response:
        """Execute a DELETE request for removing resources.

        Args:
            url: Target URL of resource to delete.
            **kwargs: Additional fetch options.

        Returns:
            Response object confirming the deletion.
        """
        return await self.request('DELETE', url, **kwargs)

    async def head(self, url: str, **kwargs) -> Response:
        """Execute a HEAD request to retrieve only response headers.

        Useful for checking resource existence, size, or modification date
        without downloading the full content.

        Args:
            url: Target URL to check headers for.
            **kwargs: Additional fetch options.

        Returns:
            Response object with headers but no body content.
        """
        return await self.request('HEAD', url, **kwargs)

    async def options(self, url: str, **kwargs) -> Response:
        """Execute an OPTIONS request to check allowed methods and capabilities.

        Used for CORS preflight checks and discovering server capabilities.

        Args:
            url: Target URL to check options for.
            **kwargs: Additional fetch options.

        Returns:
            Response object with allowed methods and CORS headers.
        """
        return await self.request('OPTIONS', url, **kwargs)

    @asynccontextmanager
    async def record(
        self,
        resource_types: list[ResourceType] | None = None,
    ) -> AsyncIterator[HarCapture]:
        """Capture the tab's network traffic as a HAR recording.

        Async context manager: the recorder is started on entry and stopped
        on exit, including when the body raises. The yielded HarCapture stays
        usable after the block ends.

        Args:
            resource_types: Optional list of resource types to capture.
                When provided, only requests matching these types are
                recorded. When None (default), all resource types are
                captured.

        Usage::

            async with tab.request.record() as capture:
                await tab.go_to('https://example.com')
            capture.save('flow.har')

            # Record only fetch and XHR requests
            async with tab.request.record(
                resource_types=[ResourceType.FETCH, ResourceType.XHR]
            ) as capture:
                await tab.go_to('https://example.com')
            capture.save('api_calls.har')

        Yields:
            HarCapture: Object with .save(), .to_dict(), and .entries.
        """
        har_recorder = HarRecorder(self.tab, resource_types=resource_types)
        har_capture = HarCapture(har_recorder)
        await har_recorder.start()
        try:
            yield har_capture
        finally:
            # Always stop recording, even if the body raised.
            await har_recorder.stop()

    @staticmethod
    def _build_url_with_params(url: str, params: Optional[dict[str, str]]) -> str:
        """Build the final URL by merging ``params`` into its query string.

        Existing query parameters are preserved, including those with blank
        values. A key present in ``params`` replaces every existing value for
        that key.

        Args:
            url: Base URL, optionally already carrying a query string.
            params: Query parameters to merge in. When empty or None the URL
                is returned unchanged.

        Returns:
            The URL with the merged, URL-encoded query string.
        """
        logger.debug('Building URL with params: url=%s, params=%s', url, params)
        if not params:
            return url

        parsed = urlparse(url)
        # keep_blank_values=True: without it parse_qs drops parameters such as
        # "?flag=" that are already in the URL, so merging would lose them.
        query = parse_qs(parsed.query, keep_blank_values=True)
        query.update((key, [value]) for key, value in params.items())

        return urlunparse(parsed._replace(query=urlencode(query, doseq=True)))

    def _build_request_options(
        self,
        method: str,
        headers: Optional[list[HeaderEntry]],
        json: Optional[dict[str, Any]],
        data: Optional[Union[dict, list, tuple, str, bytes]],
        **kwargs,
    ) -> dict[str, Any]:
        """Assemble the options dictionary for the fetch call.

        Args:
            method: HTTP method; stored upper-cased.
            headers: Extra headers as name/value entries, or None.
            json: JSON body, if any (takes precedence over ``data``).
            data: Form or raw body, if any.
            **kwargs: Additional fetch options merged into the result; they
                override ``method``/``headers`` on key collision.

        Returns:
            Options dict with ``method``, ``headers``, any extra options and,
            when a body was supplied, ``body``.
        """
        if headers:
            header_map = self._convert_header_entries_to_dict(headers)
        else:
            header_map = {}

        options: dict[str, Any] = {'method': method.upper(), 'headers': header_map}
        options.update(kwargs)
        # Logged before the body is attached.
        logger.debug(f'Building request options: options={options}')
        self._add_request_body(options, json, data)
        return options

    def _add_request_body(
        self,
        options: dict[str, Any],
        json: Optional[dict[str, Any]],
        data: Optional[Union[dict, list, tuple, str, bytes]],
    ) -> None:
        """Add request body and appropriate Content-Type header."""
        if json is not None:
            self._handle_json_options(options, json)
        elif data is not None:
            self._handle_data_options(options, data)

    @staticmethod
    def _handle_json_options(options: dict[str, Any], json: Optional[dict[str, Any]]) -> None:
        """Serialize ``json`` as the request body and default the Content-Type.

        Args:
            options: Fetch options dict, updated in place. Its ``headers``
                entry gets ``Content-Type: application/json`` unless that
                exact key is already set.
            json: Value to serialize with ``json.dumps``.
        """
        serialized = jsonlib.dumps(json)
        options['body'] = serialized
        header_map = options['headers']
        if 'Content-Type' not in header_map:
            header_map['Content-Type'] = 'application/json'
        logger.debug('Request JSON body set and content-type applied')

    @staticmethod
    def _handle_data_options(
        options: dict[str, Any], data: Optional[Union[dict, list, tuple, str, bytes]]
    ) -> None:
        """Attach ``data`` as the request body.

        dict/list/tuple values are form-encoded and default the Content-Type
        to ``application/x-www-form-urlencoded``. Any other value is stored
        untouched.

        Args:
            options: Fetch options dict, updated in place.
            data: Body payload.
        """
        if not isinstance(data, (dict, list, tuple)):
            # NOTE(review): a bytes payload is stored as-is here, but the
            # options dict is later passed through jsonlib.dumps in
            # _execute_fetch_request. Confirm bytes bodies are actually
            # supported end to end.
            options['body'] = data
            logger.debug('Request data set as raw payload')
            return

        options['body'] = urlencode(data, doseq=True)
        header_map = options['headers']
        if 'Content-Type' not in header_map:
            header_map['Content-Type'] = 'application/x-www-form-urlencoded'
        logger.debug('Request data encoded as form-urlencoded')

    async def _execute_fetch_request(self, url: str, options: dict[str, Any]) -> EvaluateResponse:
        """Run the fetch script in the tab and return the evaluation result.

        The URL and options are JSON-encoded into the request script, the
        network listeners are registered, and the script is evaluated with
        the promise awaited and the result returned by value.

        Args:
            url: Final request URL.
            options: Fetch options dict; must be JSON-serializable.

        Returns:
            The raw Runtime.evaluate response.
        """
        encoded_url = jsonlib.dumps(url)
        encoded_options = jsonlib.dumps(options)
        script = Scripts.MAKE_REQUEST.format(url=encoded_url, options=encoded_options)

        # Listeners must be in place before the fetch starts.
        await self._register_callbacks()
        logger.debug('Registered network callbacks and executing fetch via Runtime.evaluate')

        evaluate_command = RuntimeCommands.evaluate(
            expression=script,
            return_by_value=True,
            await_promise=True,
        )
        return await self.tab._execute_command(evaluate_command)

    @staticmethod
    def _build_response(
        result: EvaluateResponse,
        response_headers: list[HeaderEntry],
        request_headers: list[HeaderEntry],
        cookies: list[CookieParam],
    ) -> Response:
        """Turn the evaluated fetch result into a Response.

        Args:
            result: Runtime.evaluate response; the fetch data is read from
                ``result['result']['result']['value']``.
            response_headers: Headers captured for the response.
            request_headers: Headers captured for the request.
            cookies: Cookies extracted from the response.

        Returns:
            A Response populated from the fetch data and captured metadata.
        """
        result_value = result['result']['result']['value']
        logger.debug(f'Building response: result_value={result_value}')
        response_fields = {
            'status_code': result_value['status'],
            # A missing 'content' entry yields empty bytes.
            'content': bytes(result_value.get('content', b'')),
            'text': result_value['text'],
            'json': result_value['json'],
            'response_headers': response_headers,
            'request_headers': request_headers,
            'cookies': cookies,
            'url': result_value['url'],
        }
        return Response(**response_fields)

    async def _register_callbacks(self) -> None:
        """Register network event listeners to capture request/response metadata.

        Subscribes to the request-sent and response-received events (regular
        and "extra info" variants) and appends every event to the matching
        buffer, which is later used for header and cookie extraction.

        Each listener ID is recorded as soon as its registration succeeds, so
        a failure part-way through still leaves ``_clear_callbacks`` able to
        remove the listeners that were already installed.

        Note:
            Network events are only enabled if not already active on the tab.
        """
        if not self.tab.network_events_enabled:
            await self.tab.enable_network_events()
            self._network_events_enabled = True
            logger.debug('Network events enabled on tab for request capture')

        def append_received_request(event: dict) -> None:
            self._requests_received.append(cast(RequestReceivedEvent, event))
            # Lazy formatting: avoids rendering whole events when debug is off.
            logger.debug('Appended received request: event=%s', event)

        def append_sent_request(event: dict) -> None:
            self._requests_sent.append(cast(RequestSentEvent, event))
            logger.debug('Appended sent request: event=%s', event)

        subscriptions = (
            (NetworkEvent.REQUEST_WILL_BE_SENT, append_sent_request),
            (NetworkEvent.REQUEST_WILL_BE_SENT_EXTRA_INFO, append_sent_request),
            (NetworkEvent.RESPONSE_RECEIVED, append_received_request),
            (NetworkEvent.RESPONSE_RECEIVED_EXTRA_INFO, append_received_request),
        )

        # Start from a fresh list and record IDs incrementally rather than
        # assigning once at the end.
        self._callback_ids = []
        for event_name, handler in subscriptions:
            callback_id = await self.tab.on(event_name, callback=handler)
            self._callback_ids.append(callback_id)

    async def _clear_callbacks(self) -> None:
        """Remove this helper's network listeners and undo its monitoring.

        Only the callbacks registered by this request instance are removed,
        so other listeners (e.g. HarRecorder) are not affected. Network
        events are disabled again only if this helper was the one that
        enabled them.
        """
        registered_ids = self._callback_ids
        for callback_id in registered_ids:
            await self.tab.remove_callback(callback_id)
        registered_ids.clear()

        if not self._network_events_enabled:
            return
        await self.tab.disable_network_events()
        self._network_events_enabled = False
        logger.debug('Network events disabled on tab after request')

    def _extract_received_headers(self) -> list[HeaderEntry]:
        """Collect headers from the captured response events.

        Each event in ``self._requests_received`` is dispatched on a key found
        in its params: 'response' selects the main response extractor and
        'blockedCookies' selects the extra-info extractor.

        Returns:
            Headers gathered from the captured response events.
        """
        return self._extract_headers_from_events(
            self._requests_received,
            {
                'response': self._extract_response_received_headers,
                'blockedCookies': self._extract_response_received_extra_info_headers,
            },
        )

    def _extract_sent_headers(self) -> list[HeaderEntry]:
        """Collect headers from the captured request events.

        Each event in ``self._requests_sent`` is dispatched on a key found in
        its params: 'request' selects the main request extractor and
        'associatedCookies' selects the extra-info extractor.

        Returns:
            Headers gathered from the captured request events.
        """
        return self._extract_headers_from_events(
            self._requests_sent,
            {
                'request': self._extract_request_sent_headers,
                'associatedCookies': self._extract_request_sent_extra_info_headers,
            },
        )

    @staticmethod
    def _extract_headers_from_events(
        events: Union[list[RequestSentEvent], list[RequestReceivedEvent]],
        event_extractors: dict[str, Callable[[Any], list[HeaderEntry]]],
    ) -> list[HeaderEntry]:
        """Run the matching extractor on every event and merge the results.

        Args:
            events: Captured network events; each must carry a 'params' entry.
            event_extractors: Maps a key expected in the event params to the
                function that turns those params into header entries.

        Returns:
            Headers from all events, in first-seen order, without repeated
            (name, value) pairs.

        Note:
            For each event only the first extractor (in mapping order) whose
            key is present in the params is applied; events matching no key
            contribute nothing.
        """
        collected: list[HeaderEntry] = []
        known_pairs = set()
        logger.debug(f'Extracting headers from events: events={events}')
        for event in events:
            params = event['params']
            extractor = next(
                (fn for key, fn in event_extractors.items() if key in params),
                None,
            )
            if extractor is None:
                continue

            extracted_headers = extractor(params)
            logger.debug(f'Extracted headers: extracted_headers={extracted_headers}')
            for header in extracted_headers:
                identity = (header['name'], header['value'])
                logger.debug(f'Identity: identity={identity}')
                if identity in known_pairs:
                    continue
                collected.append(header)
                known_pairs.add(identity)
                logger.debug(f'Added header: header={header}')

        logger.debug(f'Headers extracted: headers={collected}')
        return collected

    def _extract_request_sent_headers(
        self, params: RequestWillBeSentEventParams
    ) -> list[HeaderEntry]:
        """Build header entries from the 'request' object of a request event.

        Args:
            params: Event parameters; must contain a 'request' entry.

        Returns:
            Header entries built from the request's 'headers' mapping, or an
            empty list when that mapping is absent.
        """
        request = params['request']
        logger.debug(f'Extracting request sent headers: request={request}')
        raw_headers = request.get('headers', {})
        return self._convert_dict_to_header_entries(raw_headers)

    def _extract_request_sent_extra_info_headers(
        self, params: RequestWillBeSentExtraInfoEventParams
    ) -> list[HeaderEntry]:
        """Build header entries from a request extra-info event.

        Unlike the main request event, the headers are read from the top
        level of the params rather than from a nested 'request' object.

        Args:
            params: Extra-info event parameters.

        Returns:
            Header entries built from the params' 'headers' mapping, or an
            empty list when that mapping is absent.
        """
        logger.debug(f'Extracting request sent extra info headers: params={params}')
        raw_headers = params.get('headers', {})
        return self._convert_dict_to_header_entries(raw_headers)

    def _extract_response_received_headers(
        self, params: ResponseReceivedEventParams
    ) -> list[HeaderEntry]:
        """Build header entries from the 'response' object of a response event.

        Args:
            params: Event parameters; must contain a 'response' entry.

        Returns:
            Header entries built from the response's 'headers' mapping, or an
            empty list when that mapping is absent.
        """
        response = params['response']
        logger.debug(f'Extracting response received headers: response={response}')
        raw_headers = response.get('headers', {})
        return self._convert_dict_to_header_entries(raw_headers)

    def _extract_response_received_extra_info_headers(
        self, params: ResponseReceivedExtraInfoEventParams
    ) -> list[HeaderEntry]:
        """Build header entries from a response extra-info event.

        Unlike the main response event, the headers are read from the top
        level of the params rather than from a nested 'response' object.

        Args:
            params: Extra-info event parameters.

        Returns:
            Header entries built from the params' 'headers' mapping, or an
            empty list when that mapping is absent.
        """
        logger.debug(f'Extracting response received extra info headers: params={params}')
        raw_headers = params.get('headers', {})
        return self._convert_dict_to_header_entries(raw_headers)

    @staticmethod
    def _convert_dict_to_header_entries(headers_dict: dict) -> list[HeaderEntry]:
        """Turn a name-to-value header mapping into a list of HeaderEntry items.

        Args:
            headers_dict: Mapping of header names to header values.

        Returns:
            One HeaderEntry (with 'name' and 'value') per mapping item, in the
            mapping's iteration order.
        """
        logger.debug(f'Converting dictionary to header entries: headers_dict={headers_dict}')
        entries: list[HeaderEntry] = []
        for header_name, header_value in headers_dict.items():
            entries.append(HeaderEntry(name=header_name, value=header_value))
        return entries

    def _extract_set_cookies(self) -> list[CookieParam]:
        """Extract and parse all Set-Cookie headers from response events.

        Walks the captured response extra-info events, picks every header whose
        name is Set-Cookie (compared case-insensitively) and parses each value
        into cookie objects. A single header value may hold several
        newline-separated cookie declarations; those are split by
        ``_parse_set_cookie_header``.

        Returns:
            List of unique cookies extracted from Set-Cookie headers, in the
            order they were first seen.
        """
        cookies: list[CookieParam] = []
        logger.debug(f'Extracting set cookies: cookies={cookies}')
        response_extra_info_events = self._filter_response_extra_info_events()
        logger.debug(
            f'Filtering response extra info events: '
            f'response_extra_info_events={response_extra_info_events}'
        )
        for event in response_extra_info_events:
            params = cast(ResponseReceivedExtraInfoEventParams, event['params'])
            # Tolerate a missing 'headers' entry, like the sibling extra-info extractor does.
            headers = self._convert_dict_to_header_entries(params.get('headers', {}))
            logger.debug(f'Converting dictionary to header entries: headers={headers}')
            # Header names are case-insensitive and HTTP/2 sends them lowercased
            # ('set-cookie'), so an exact match on 'Set-Cookie' would drop those cookies.
            set_cookie_headers = [
                header['value'] for header in headers if header['name'].lower() == 'set-cookie'
            ]
            logger.debug(f'Set cookie headers: set_cookie_headers={set_cookie_headers}')
            for set_cookie_header in set_cookie_headers:
                self._add_unique_cookies(cookies, self._parse_set_cookie_header(set_cookie_header))
        logger.debug(f'Set cookies extracted: cookies={cookies}')
        return cookies

    def _filter_response_extra_info_events(self) -> list[RequestReceivedEvent]:
        """Select the captured response events that are extra-info events.

        Returns:
            Events from ``self._requests_received`` whose 'method' equals
            NetworkEvent.RESPONSE_RECEIVED_EXTRA_INFO, in capture order.
        """
        logger.debug(
            f'Filtering response extra info events: requests_received={self._requests_received}'
        )
        extra_info_events: list[RequestReceivedEvent] = []
        for candidate in self._requests_received:
            if candidate['method'] == NetworkEvent.RESPONSE_RECEIVED_EXTRA_INFO:
                extra_info_events.append(candidate)
        return extra_info_events

    def _parse_set_cookie_header(self, set_cookie_header: str) -> list[CookieParam]:
        """Split a Set-Cookie header value into cookies, one per line.

        The value is split on newline characters and every line is handed to
        ``_parse_cookie_line``; lines that do not yield a cookie are skipped.

        Args:
            set_cookie_header: Raw Set-Cookie header value.

        Returns:
            Parsed cookies (name and value only), in line order.
        """
        parsed_cookies = []
        segments = set_cookie_header.split('\n')
        logger.debug(f'Parsing set cookie header: set_cookie_header={set_cookie_header}')
        for segment in segments:
            parsed = self._parse_cookie_line(segment)
            if not parsed:
                continue
            logger.debug(f'Parsed cookie: cookie={parsed}')
            parsed_cookies.append(parsed)
        logger.debug(f'Parsed cookies: cookies={parsed_cookies}')
        return parsed_cookies

    @staticmethod
    def _parse_cookie_line(line: str) -> Optional[CookieParam]:
        """Pull the cookie name and value out of one Set-Cookie line.

        The name is the text before the first '='; the value is the text
        between that '=' and the first following ';' (or the end of the line).
        Both are stripped of surrounding whitespace. Anything after the first
        ';' (cookie attributes) is discarded.

        Args:
            line: Single line from a Set-Cookie header.

        Returns:
            CookieParam with name and value, or None when the line has no '='
            or the name is empty.
        """
        raw_name, separator, remainder = line.partition('=')
        if not separator:
            return None

        name = raw_name.strip()
        # A cookie without a name is rejected.
        if not name:
            return None

        value = remainder.partition(';')[0].strip()
        return CookieParam(name=name, value=value)

    @staticmethod
    def _add_unique_cookies(cookies: list[CookieParam], new_cookies: list[CookieParam]) -> None:
        """Append to ``cookies`` every new cookie that is not already in it.

        The target list is modified in place; membership is decided by
        equality with the cookies already present.

        Args:
            cookies: List that receives the additions.
            new_cookies: Candidate cookies to add.
        """
        logger.debug(f'Adding unique cookies: cookies={cookies}, new_cookies={new_cookies}')
        for candidate in new_cookies:
            if candidate in cookies:
                continue
            cookies.append(candidate)
            logger.debug(f'Added unique cookie: cookie={candidate}')
        logger.debug(f'Unique cookies added: cookies={cookies}')

    @staticmethod
    def _convert_header_entries_to_dict(headers: list[HeaderEntry]) -> dict[str, str]:
        """Flatten HeaderEntry items into a plain name-to-value dictionary.

        Args:
            headers: Header entries, each with 'name' and 'value' keys.

        Returns:
            Dictionary mapping header names to values. When a name occurs more
            than once, the value of the last entry wins.
        """
        logger.debug(f'Converting header entries to dictionary: headers={headers}')
        mapping: dict[str, str] = {}
        for entry in headers:
            header_name = entry['name']
            mapping[header_name] = entry['value']
        return mapping


================================================
FILE: pydoll/browser/requests/response.py
================================================
from __future__ import annotations

import json as jsonlib
import logging
from typing import TYPE_CHECKING, Any, Optional, Union

from pydoll.exceptions import HTTPError

if TYPE_CHECKING:
    from pydoll.protocol.fetch.types import HeaderEntry
    from pydoll.protocol.network.types import CookieParam

# Module-level logger, named after this module.
logger = logging.getLogger(__name__)

# Status codes treated as "ok" by Response: 200 through 399 inclusive.
STATUS_CODE_RANGE_OK = range(200, 400)


class Response:
    """HTTP response object for browser-based fetch requests.

    This class provides a standardized interface for handling HTTP responses
    obtained through the browser's fetch API. It mimics the requests.Response
    interface while keeping the request headers, response headers and cookies
    that were captured alongside the response.

    Key Features:
    - Interface modelled on requests.Response for easy migration
    - Keeps both request and response headers for analysis
    - Carries the cookies extracted from Set-Cookie headers
    - Lazy JSON parsing with caching
    - Content available in multiple formats (text, bytes, JSON)
    """

    # Status ranges used only to pick the label in raise_for_status() messages.
    _CLIENT_ERROR_RANGE = range(400, 500)
    _SERVER_ERROR_RANGE = range(500, 600)

    def __init__(
        self,
        status_code: int,
        content: bytes = b'',
        text: str = '',
        json: Optional[dict[str, Any]] = None,
        response_headers: Optional[list[HeaderEntry]] = None,
        request_headers: Optional[list[HeaderEntry]] = None,
        cookies: Optional[list[CookieParam]] = None,
        url: str = '',
    ):
        """Initialize a new Response instance with browser fetch results.

        Args:
            status_code: HTTP status code returned by the server (e.g., 200, 404, 500).
            content: Raw response body as bytes.
            text: Response body as a string. When empty, the ``text`` property
                decodes it from ``content`` on demand.
            json: Pre-parsed JSON data. If None, ``json()`` parses it from the
                text on demand.
            response_headers: Headers received from the server. None becomes an
                empty list.
            request_headers: Headers sent with the request. None becomes an
                empty list.
            cookies: Cookies extracted from the response's Set-Cookie headers.
                None becomes an empty list.
            url: URL associated with the response (the final URL after any
                redirects, per the caller's contract).
        """
        self._status_code = status_code
        self._content = content
        self._text = text
        self._json = json
        self._response_headers = response_headers or []
        self._request_headers = request_headers or []
        self._cookies = cookies or []
        self._url = url
        # Computed once: the status code never changes after construction.
        self._ok = status_code in STATUS_CODE_RANGE_OK
        logger.debug(
            f'Response initialized: status={status_code}, url={url}, '
            f'headers={len(self._response_headers)}, cookies={len(self._cookies)}'
        )

    @property
    def ok(self) -> bool:
        """Check if the request succeeded (2xx or 3xx status code).

        Returns:
            True if the status code is in the 200-399 range, False otherwise.

        Note:
            3xx (redirection) codes count as "ok" here, in addition to 2xx.
        """
        return self._ok

    @property
    def cookies(self) -> list[CookieParam]:
        """Get cookies that were set by the server during this response.

        Returns:
            List of cookies supplied at construction (extracted by the caller
            from Set-Cookie headers); empty if none were given.
        """
        return self._cookies

    @property
    def request_headers(self) -> list[HeaderEntry]:
        """Get the headers that were sent in the HTTP request.

        Returns:
            List of request headers supplied at construction; empty if none
            were given.
        """
        return self._request_headers

    @property
    def headers(self) -> list[HeaderEntry]:
        """Get the headers received from the server in the HTTP response.

        Returns:
            List of response headers supplied at construction; empty if none
            were given.
        """
        return self._response_headers

    @property
    def status_code(self) -> int:
        """Get the HTTP status code returned by the server.

        Returns:
            Integer status code (e.g., 200 for OK, 404 for Not Found, 500 for Server Error).
        """
        return self._status_code

    @property
    def text(self) -> str:
        """Get the response content as a decoded string.

        Returns:
            The text given at construction. If that text is empty and raw
            content is available, the content is decoded as UTF-8 on first
            access and the result is cached.

        Note:
            Decoding uses 'replace' error handling to avoid crashes on
            invalid UTF-8 sequences.
        """
        if not self._text and self.content:
            self._text = self.content.decode('utf-8', errors='replace')
        return self._text

    @property
    def content(self) -> bytes:
        """Get the raw response content as bytes.

        Returns:
            Response body bytes exactly as supplied at construction.
        """
        return self._content

    @property
    def url(self) -> str:
        """Get the URL associated with this response.

        Returns:
            The URL supplied at construction.
        """
        return self._url

    def json(self) -> Union[dict[str, Any], list]:
        """Parse and return the response content as JSON data.

        Returns:
            Parsed JSON data. A value supplied at construction, or one parsed
            by an earlier call, is returned without parsing again.

        Raises:
            ValueError: If the response text is not valid JSON.
        """
        if self._json is not None:
            return self._json

        try:
            self._json = jsonlib.loads(self.text)
            return self._json
        except jsonlib.JSONDecodeError as exc:
            logger.debug('Failed to decode response as JSON')
            raise ValueError('Response is not valid JSON') from exc

    def raise_for_status(self) -> None:
        """Raise an HTTPError if the response status is outside the ok range.

        Status codes in the 200-399 range (success and redirection) do not
        raise. Any other status code raises, with a message labelled
        'Client Error' for 4xx, 'Server Error' for 5xx and plain 'Error'
        for anything else.

        Raises:
            HTTPError: If the status code is not in the 200-399 range.

        Note:
            This method mirrors requests.Response.raise_for_status() for
            easy migration from the requests library.
        """
        if self.status_code in STATUS_CODE_RANGE_OK:
            return

        logger.error(f'HTTP error status encountered: status={self.status_code}, url={self._url}')
        # Pick a label that matches the status class instead of always saying
        # 'Client Error', which was wrong for 5xx responses.
        if self.status_code in self._CLIENT_ERROR_RANGE:
            label = 'Client Error'
        elif self.status_code in self._SERVER_ERROR_RANGE:
            label = 'Server Error'
        else:
            label = 'Error'
        raise HTTPError(f'{self.status_code} {label}: for url {self._url}')


================================================
FILE: pydoll/browser/tab.py
================================================
from __future__ import annotations

import asyncio
import base64 as _b64
import contextlib
import io
import logging
import shutil
import warnings
import zipfile
from contextlib import asynccontextmanager
from functools import partial
from pathlib import Path
from tempfile import mkdtemp
from typing import (
    TYPE_CHECKING,
    Any,
    AsyncGenerator,
    Awaitable,
    Callable,
    Optional,
    TypeAlias,
    Union,
    cast,
    overload,
)

import aiofiles

from pydoll.browser.requests import Request
from pydoll.commands import (
    DomCommands,
    FetchCommands,
    NetworkCommands,
    PageCommands,
    RuntimeCommands,
    StorageCommands,
    TargetCommands,
)
from pydoll.connection import ConnectionHandler
from pydoll.constants import By, PageLoadState
from pydoll.elements.mixins import FindElementsMixin
from pydoll.elements.shadow_root import ShadowRoot
from pydoll.elements.web_element import WebElement
from pydoll.exceptions import (
    CommandExecutionTimeout,
    DownloadTimeout,
    IFrameNotFound,
    InvalidFileExtension,
    InvalidIFrame,
    InvalidScriptWithElement,
    InvalidTabInitialization,
    MissingScreenshotPath,
    NetworkEventsNotEnabled,
    NoDialogPresent,
    NotAnIFrame,
    PageLoadTimeout,
    TopLevelTargetRequired,
    WaitElementTimeout,
    WebSocketConnectionClosed,
)
from pydoll.interactions import KeyboardAPI, MouseAPI, ScrollAPI
from pydoll.interactions.iframe import IFrameContext
from pydoll.protocol.browser.types import DownloadBehavior, DownloadProgressState
from pydoll.protocol.dom.types import Node, ShadowRootType
from pydoll.protocol.network.types import ResourceType
from pydoll.protocol.page.events import PageEvent
from pydoll.protocol.page.types import FrameResourceTree, ScreenshotFormat
from pydoll.protocol.runtime.methods import (
    CallFunctionOnResponse,
    EvaluateResponse,
    SerializationOptions,
)
from pydoll.protocol.runtime.types import CallArgument
from pydoll.protocol.target.types import TargetInfo
from pydoll.utils import (
    decode_base64_to_bytes,
    has_return_outside_function,
)
from pydoll.utils.bundle import (
    build_asset_filename,
    collect_frame_resources,
    filter_fetchable_resources,
    inline_all_assets,
    rewrite_html_urls,
)

if TYPE_CHECKING:
    from pydoll.browser.chromium.base import Browser
    from pydoll.protocol.base import EmptyResponse, Response
    from pydoll.protocol.browser.events import (
        DownloadProgressEvent,
        DownloadWillBeginEvent,
    )
    from pydoll.protocol.dom.methods import (
        DescribeNodeResponse,
        GetDocumentResponse,
        ResolveNodeResponse,
    )
    from pydoll.protocol.fetch.types import AuthChallengeResponseType, HeaderEntry, RequestStage
    from pydoll.protocol.network.events import RequestWillBeSentEvent
    from pydoll.protocol.network.methods import GetCookiesResponse as NetworkGetCookiesResponse
    from pydoll.protocol.network.methods import GetResponseBodyResponse
    from pydoll.protocol.network.types import (
        Cookie,
        CookieParam,
        ErrorReason,
        RequestMethod,
    )
    from pydoll.protocol.page.events import FileChooserOpenedEvent
    from pydoll.protocol.page.methods import (
        CaptureScreenshotResponse,
        GetResourceContentResponse,
        GetResourceTreeResponse,
        PrintToPDFResponse,
    )
    from pydoll.protocol.runtime.methods import CallFunctionOnResponse, EvaluateResponse
    from pydoll.protocol.storage.methods import GetCookiesResponse as StorageGetCookiesResponse
    from pydoll.protocol.target.methods import AttachToTargetResponse, GetTargetsResponse

# Module-level logger, named after this module.
logger = logging.getLogger(__name__)

# Alias for Tab, written as a string because Tab is defined further down.
IFrame: TypeAlias = 'Tab'

# Host used to recognise Cloudflare challenge iframes.
_CLOUDFLARE_CHALLENGE_DOMAIN = 'challenges.cloudflare.com'
# CSS selector matching iframes whose src contains the challenge domain.
_CLOUDFLARE_IFRAME_SELECTOR = f'iframe[src*="{_CLOUDFLARE_CHALLENGE_DOMAIN}"]'
# CSS selector presumably targeting the challenge checkbox; its use is outside this view.
_CLOUDFLARE_CHECKBOX_SELECTOR = 'span.cb-i'


class Tab(FindElementsMixin):
    """
    Controls a browser tab via Chrome DevTools Protocol.

    Primary interface for web page automation including navigation, DOM manipulation,
    JavaScript execution, event handling, network monitoring, and specialized tasks
    like Cloudflare bypass.
    """

    def __init__(
        self,
        browser: Browser,
        connection_port: Optional[int] = None,
        target_id: Optional[str] = None,
        browser_context_id: Optional[str] = None,
        ws_address: Optional[str] = None,
    ):
        """
        Set up a controller bound to an existing browser tab.

        At least one of connection_port, target_id or ws_address must be given.

        Args:
            browser: Browser instance that created this tab.
            connection_port: CDP WebSocket port.
            target_id: CDP target identifier for this tab.
            browser_context_id: Optional browser context ID.
            ws_address: Optional WebSocket address for this tab.

        Raises:
            InvalidTabInitialization: If connection_port, target_id and
                ws_address are all falsy.
        """
        if not (connection_port or target_id or ws_address):
            raise InvalidTabInitialization()

        # Connection details; the handler is created last, once they are all set.
        self._browser = browser
        self._connection_port = connection_port
        self._target_id = target_id
        self._ws_address = ws_address
        self._browser_context_id = browser_context_id
        self._connection_handler = self._get_connection_handler()

        # Every event domain and the file chooser interception start disabled.
        self._page_events_enabled = False
        self._network_events_enabled = False
        self._fetch_events_enabled = False
        self._dom_events_enabled = False
        self._runtime_events_enabled = False
        self._intercept_file_chooser_dialog_enabled = False
        self._cloudflare_captcha_callback_id: Optional[int] = None

        # request/scroll/keyboard helpers are created on first use; mouse is created now.
        self._request: Optional[Request] = None
        self._scroll: Optional[ScrollAPI] = None
        self._keyboard: Optional[KeyboardAPI] = None
        self._mouse: MouseAPI = MouseAPI(self)

        init_summary = (
            f'Tab initialized: target_id={self._target_id}, '
            f'ws_address_set={bool(self._ws_address)}, '
            f'context_id={self._browser_context_id}, port={self._connection_port}'
        )
        logger.debug(init_summary)

    @property
    def page_events_enabled(self) -> bool:
        """Whether CDP Page domain events are enabled."""
        return self._page_events_enabled

    @property
    def network_events_enabled(self) -> bool:
        """Whether CDP Network domain events are enabled."""
        return self._network_events_enabled

    @property
    def fetch_events_enabled(self) -> bool:
        """Whether CDP Fetch domain events (request interception) are enabled."""
        return self._fetch_events_enabled

    @property
    def dom_events_enabled(self) -> bool:
        """Whether CDP DOM domain events are enabled."""
        return self._dom_events_enabled

    @property
    def runtime_events_enabled(self) -> bool:
        """Whether CDP Runtime domain events are enabled."""
        return self._runtime_events_enabled

    @property
    def request(self) -> Request:
        """
        Access the tab's Request helper for HTTP calls through the browser's fetch API.

        The helper is created on first access and reused afterwards.

        Returns:
            Request: The Request instance bound to this tab.
        """
        cached = self._request
        if cached is not None:
            return cached
        self._request = Request(self)
        return self._request

    @property
    def scroll(self) -> ScrollAPI:
        """
        Access the tab's scroll API for controlling page scroll behavior.

        The API object is created on first access and reused afterwards.

        Returns:
            ScrollAPI: The ScrollAPI instance bound to this tab.
        """
        cached = self._scroll
        if cached is not None:
            return cached
        self._scroll = ScrollAPI(self)
        return self._scroll

    @property
    def keyboard(self) -> KeyboardAPI:
        """
        Access the tab's keyboard API for page-level keyboard input.

        The API object is created on first access and reused afterwards.

        Returns:
            KeyboardAPI: The KeyboardAPI instance bound to this tab.
        """
        cached = self._keyboard
        if cached is not None:
            return cached
        self._keyboard = KeyboardAPI(self)
        return self._keyboard

    @property
    def mouse(self) -> MouseAPI:
        """
        Access the tab's mouse API for controlling mouse input.

        Returns:
            MouseAPI: The MouseAPI instance held by this tab.
        """
        mouse_api = self._mouse
        return mouse_api

    @property
    def intercept_file_chooser_dialog_enabled(self) -> bool:
        """Whether file chooser dialog interception is active."""
        return self._intercept_file_chooser_dialog_enabled

    @property
    async def current_url(self) -> str:
        """
        Get the current page URL by evaluating ``window.location.href`` in the page.

        Returns:
            str: The value produced by the evaluation.
        """
        command = RuntimeCommands.evaluate('window.location.href')
        response: EvaluateResponse = await self._execute_command(command)
        return response['result']['result']['value']

    @property
    async def page_source(self) -> str:
        """
        Get the page HTML by evaluating ``document.documentElement.outerHTML``.

        Returns:
            str: The value produced by the evaluation.
        """
        command = RuntimeCommands.evaluate('document.documentElement.outerHTML')
        response: EvaluateResponse = await self._execute_command(command)
        return response['result']['result']['value']

    @property
    async def title(self) -> str:
        """
        Get the current page title by evaluating ``document.title`` in the page.

        Returns:
            str: The value produced by the evaluation, or an empty string
            when the evaluation result carries no 'value' entry.
        """
        command = RuntimeCommands.evaluate('document.title')
        response: EvaluateResponse = await self._execute_command(command)
        evaluation = response['result']['result']
        return evaluation.get('value', '')

    async def enable_page_events(self):
        """
        Enable CDP Page domain events (load, navigation, dialogs, etc.).

        Sends the Page enable command and then marks Page events as enabled
        on this tab.

        Returns:
            The response returned by the command execution.
        """
        logger.debug('Enabling Page events')
        enable_command = PageCommands.enable()
        result = await self._execute_command(enable_command)
        self._page_events_enabled = True
        logger.debug('Page events enabled')
        return result

    async def enable_network_events(self):
        """
        Enable CDP Network domain events (requests, responses, etc.).

        Sends the Network enable command and then marks Network events as
        enabled on this tab.

        Returns:
            The response returned by the command execution.
        """
        logger.debug('Enabling Network events')
        enable_command = NetworkCommands.enable()
        result = await self._execute_command(enable_command)
        self._network_events_enabled = True
        logger.debug('Network events enabled')
        return result

    async def enable_fetch_events(
        self,
        handle_auth: bool = False,
        resource_type: Optional[ResourceType] = None,
        request_stage: Optional[RequestStage] = None,
    ):
        """
        Enable the CDP Fetch domain for request interception.

        Sends the Fetch enable command with the given filters and then marks
        Fetch events as enabled on this tab.

        Args:
            handle_auth: Intercept authentication challenges.
            resource_type: Filter by resource type (all if None).
            request_stage: When to intercept (Request/Response).

        Returns:
            The response returned by the command execution.

        Note:
            Intercepted requests must be explicitly continued or timeout.
        """
        logger.debug(
            f'Enabling Fetch events: handle_auth={handle_auth}, resource_type={resource_type}, '
            f'stage={request_stage}'
        )
        enable_command = FetchCommands.enable(
            handle_auth_requests=handle_auth,
            resource_type=resource_type,
            request_stage=request_stage,
        )
        response: Response[EmptyResponse] = await self._execute_command(enable_command)
        self._fetch_events_enabled = True
        logger.debug('Fetch events enabled')
        return response

    async def enable_dom_events(self):
        """
        Enable CDP DOM domain events (document structure changes).

        Sends the DOM enable command and then marks DOM events as enabled on
        this tab.

        Returns:
            The response returned by the command execution.
        """
        logger.debug('Enabling DOM events')
        enable_command = DomCommands.enable()
        result = await self._execute_command(enable_command)
        self._dom_events_enabled = True
        logger.debug('DOM events enabled')
        return result

    async def enable_runtime_events(self):
        """
        Enable CDP Runtime domain events.

        Sends the Runtime enable command and then marks Runtime events as
        enabled on this tab.

        Returns:
            The response returned by the command execution.
        """
        logger.debug('Enabling Runtime events')
        enable_command = RuntimeCommands.enable()
        result = await self._execute_command(enable_command)
        self._runtime_events_enabled = True
        logger.debug('Runtime events enabled')
        return result

    async def enable_intercept_file_chooser_dialog(self):
        """
        Start intercepting file chooser dialogs.

        Sends the Page command that switches interception on, records the
        enabled state on this tab and returns the command response.

        Note:
            Use expect_file_chooser context manager for convenience.
        """
        logger.info('Enabling file chooser interception')
        intercept_command = PageCommands.set_intercept_file_chooser_dialog(True)
        result = await self._execute_command(intercept_command)
        self._intercept_file_chooser_dialog_enabled = True
        logger.debug('File chooser interception enabled')
        return result

    async def enable_auto_solve_cloudflare_captcha(
        self,
        custom_selector: Optional[tuple[By, str]] = None,
        time_before_click: Optional[float] = None,
        time_to_wait_captcha: float = 5,
    ):
        """
        Register a page-load callback that bypasses Cloudflare Turnstile captchas.

        Page events are enabled first when they are not already active, then
        the bypass handler is attached to the page load event and its callback
        id is stored on the tab.

        Args:
            custom_selector: Deprecated — ignored. Passing a value only emits a
                DeprecationWarning.
            time_before_click: Deprecated — ignored. Passing a value only emits
                a DeprecationWarning.
            time_to_wait_captcha: Timeout for captcha detection, forwarded to
                the bypass handler (default 5s).
        """
        deprecated_arguments = (
            (
                custom_selector,
                'custom_selector is deprecated and ignored. Cloudflare Turnstile is now '
                'detected automatically via shadow root inspection.',
            ),
            (
                time_before_click,
                'time_before_click is deprecated and ignored. The checkbox is now '
                'located via shadow root polling and clicked immediately.',
            ),
        )
        for supplied_value, message in deprecated_arguments:
            if supplied_value is not None:
                # Warn from this frame directly so stacklevel=2 keeps pointing at the caller.
                warnings.warn(message, DeprecationWarning, stacklevel=2)

        logger.info('Enabling Cloudflare captcha auto-solve')
        if not self.page_events_enabled:
            await self.enable_page_events()

        bypass_handler = partial(
            self._bypass_cloudflare,
            time_to_wait_captcha=time_to_wait_captcha,
        )
        registered_id = await self.on(PageEvent.LOAD_EVENT_FIRED, bypass_handler)
        self._cloudflare_captcha_callback_id = registered_id
        logger.debug(
            f'Cloudflare auto-solve callback registered: id={self._cloudflare_captcha_callback_id}'
        )

    async def disable_fetch_events(self):
        """
        Turn off the CDP Fetch domain.

        Sends the Fetch disable command, marks Fetch events as disabled on this
        tab and returns the command response.
        """
        logger.debug('Disabling Fetch events')
        disable_command = FetchCommands.disable()
        result = await self._execute_command(disable_command)
        self._fetch_events_enabled = False
        logger.debug('Fetch events disabled')
        return result

    async def disable_page_events(self):
        """
        Turn off CDP Page domain events.

        Sends the Page disable command, marks Page events as disabled on this
        tab and returns the command response.
        """
        logger.debug('Disabling Page events')
        disable_command = PageCommands.disable()
        result = await self._execute_command(disable_command)
        self._page_events_enabled = False
        logger.debug('Page events disabled')
        return result

    async def disable_network_events(self):
        """
        Turn off CDP Network domain events.

        Sends the Network disable command, marks Network events as disabled on
        this tab and returns the command response.
        """
        logger.debug('Disabling Network events')
        disable_command = NetworkCommands.disable()
        result = await self._execute_command(disable_command)
        self._network_events_enabled = False
        logger.debug('Network events disabled')
        return result

    async def disable_dom_events(self):
        """
        Turn off CDP DOM domain events.

        Sends the DOM disable command, marks DOM events as disabled on this tab
        and returns the command response.
        """
        logger.debug('Disabling DOM events')
        disable_command = DomCommands.disable()
        result = await self._execute_command(disable_command)
        self._dom_events_enabled = False
        logger.debug('DOM events disabled')
        return result

    async def disable_runtime_events(self):
        """
        Turn off CDP Runtime domain events.

        Sends the Runtime disable command, marks Runtime events as disabled on
        this tab and returns the command response.
        """
        logger.debug('Disabling Runtime events')
        disable_command = RuntimeCommands.disable()
        result = await self._execute_command(disable_command)
        self._runtime_events_enabled = False
        logger.debug('Runtime events disabled')
        return result

    async def disable_intercept_file_chooser_dialog(self):
        """
        Stop intercepting file chooser dialogs.

        Sends the Page command that switches interception off, records the
        disabled state on this tab and returns the command response.
        """
        logger.info('Disabling file chooser interception')
        intercept_command = PageCommands.set_intercept_file_chooser_dialog(False)
        result = await self._execute_command(intercept_command)
        self._intercept_file_chooser_dialog_enabled = False
        logger.debug('File chooser interception disabled')
        return result

    async def disable_auto_solve_cloudflare_captcha(self):
        """
        Disable automatic Cloudflare Turnstile captcha bypass.

        Removes the page-load callback whose id was stored by
        enable_auto_solve_cloudflare_captcha and clears the stored id.
        When no callback id is stored (auto-solve was never enabled, or was
        already disabled) the call is a no-op instead of asking the connection
        handler to remove a ``None`` callback id.
        """
        logger.info('Disabling Cloudflare captcha auto-solve')
        callback_id = self._cloudflare_captcha_callback_id
        if callback_id is None:
            # This method resets the id to None, so a repeated call lands here.
            logger.debug('Cloudflare auto-solve is not enabled; nothing to disable')
            return

        await self._connection_handler.remove_callback(callback_id)
        self._cloudflare_captcha_callback_id = None

    async def close(self):
        """
        Close this browser tab.

        Sends the Page close command and then drops this tab from the owning
        browser's registry of opened tabs.

        Returns:
            The response of the Page close command.

        Note:
            Tab instance becomes invalid after calling this method.
        """
        logger.info(f'Closing tab: target_id={self._target_id}')
        result = await self._execute_command(PageCommands.close())
        # The page is already closed at this point; a tab that is missing from
        # the registry must not turn a successful close into a KeyError.
        self._browser._tabs_opened.pop(self._target_id, None)
        logger.debug('Tab closed and removed from browser registry')
        return result

    async def get_frame(self, frame: 'WebElement') -> IFrame:
        """
        .. deprecated:: ?.?.?
            Use iframe `WebElement` instances directly; this method will be removed in
            a future version.

        Return the Tab bound to the browser target that backs an iframe element.

        The iframe's ``src`` attribute is matched against the URLs of the
        browser's targets. An already tracked tab for that target is reused;
        otherwise a new Tab is created and registered on the browser.

        Args:
            frame: WebElement for the ``<iframe>`` tag.

        Returns:
            Tab instance bound to the iframe's target.

        Raises:
            NotAnIFrame: If element is not an iframe.
            InvalidIFrame: If iframe lacks valid src attribute.
            IFrameNotFound: If iframe target not found in browser.
        """
        warnings.warn(
            'Tab.get_frame() is deprecated and will be removed in a future version. '
            'Interact with iframe WebElements directly.',
            DeprecationWarning,
            stacklevel=2,
        )
        logger.debug(f'Resolving iframe: tag={frame.tag_name}')
        if frame.tag_name != 'iframe':
            raise NotAnIFrame

        frame_url = frame.get_attribute('src')
        logger.debug(f'Iframe src resolved: {frame_url}')
        if not frame_url:
            raise InvalidIFrame('The iframe does not have a valid src attribute')

        # The first target whose URL equals the iframe src wins.
        iframe_target = None
        for candidate in await self._browser.get_targets():
            if candidate['url'] == frame_url:
                iframe_target = candidate
                break
        if not iframe_target:
            raise IFrameNotFound('The target for the iframe was not found')

        target_id = iframe_target['targetId']
        tracked_tabs = self._browser._tabs_opened
        if target_id in tracked_tabs:
            logger.debug(f'Iframe tab already tracked: {target_id}')
            return tracked_tabs[target_id]

        iframe_tab = Tab(
            self._browser,
            target_id=target_id,
            connection_port=self._connection_port,
        )
        tracked_tabs[target_id] = iframe_tab
        logger.debug(f'Iframe tab created and registered: {target_id}')
        return iframe_tab

    async def find_shadow_roots(self, deep: bool = False, timeout: float = 0) -> list[ShadowRoot]:
        """
        Return every shadow root discovered in the page.

        The whole DOM tree is fetched and walked, so shadow roots are found
        even when the selector of their host element is unknown or dynamic
        (e.g., Cloudflare challenge pages).

        Args:
            deep: If True, shadow roots inside cross-origin iframes (OOPIFs)
                are collected as well.
            timeout: Maximum seconds to wait for shadow roots to appear. A
                falsy value performs a single collection and returns its
                result, even when empty. Otherwise the DOM is polled every
                0.5s until at least one shadow root is found or the timeout
                has elapsed.

        Returns:
            List of ShadowRoot instances found in the page.

        Raises:
            WaitElementTimeout: If timeout > 0 and no shadow roots are found
                within the specified duration.
        """
        logger.debug('Finding all shadow roots in page (timeout=%s)', timeout)

        if not timeout:
            return await self._collect_all_shadow_roots(deep)

        started_at = asyncio.get_event_loop().time()
        while not (found := await self._collect_all_shadow_roots(deep)):
            elapsed = asyncio.get_event_loop().time() - started_at
            if elapsed > timeout:
                raise WaitElementTimeout(
                    f'Timed out after {timeout}s waiting for shadow roots in page'
                )
            await asyncio.sleep(0.5)
        return found

    async def _collect_all_shadow_roots(self, deep: bool) -> list[ShadowRoot]:
        """
        Build ShadowRoot objects for the main document and, optionally, OOPIFs.

        The full document tree is fetched (piercing shadow DOM), every shadow
        root entry in it is resolved to a remote object and paired with its
        host element when that can be resolved. Entries that cannot be
        resolved are skipped; a host that cannot be resolved becomes None.

        Args:
            deep: When True, shadow roots found in OOPIF targets are appended.

        Returns:
            The ShadowRoot instances that could be resolved.
        """
        document: GetDocumentResponse = await self._execute_command(
            DomCommands.get_document(depth=-1, pierce=True)
        )
        dom_root = document.get('result', {}).get('root', {})

        entries: list[tuple[Node, int | None]] = []
        self._collect_shadow_roots_from_tree(dom_root, entries)

        # Failures that are tolerated per entry instead of aborting the whole scan.
        tolerated = (CommandExecutionTimeout, WebSocketConnectionClosed, KeyError)

        shadow_roots: list[ShadowRoot] = []
        for shadow_data, host_backend_id in entries:
            backend_node_id = shadow_data.get('backendNodeId')
            if not backend_node_id:
                continue

            try:
                resolved: ResolveNodeResponse = await self._execute_command(
                    DomCommands.resolve_node(backend_node_id=backend_node_id)
                )
                shadow_object_id = resolved['result']['object']['objectId']
            except tolerated:
                logger.debug(f'Failed to resolve shadow root: backend_node_id={backend_node_id}')
                continue

            host_element = None
            try:
                host_element = await self._resolve_shadow_host(host_backend_id)
            except tolerated:
                logger.debug(f'Failed to resolve shadow host: backend_node_id={host_backend_id}')

            shadow_root = ShadowRoot(
                object_id=shadow_object_id,
                connection_handler=self._connection_handler,
                mode=ShadowRootType(shadow_data.get('shadowRootType', 'open')),
                host_element=host_element,
            )
            shadow_roots.append(shadow_root)

        if deep:
            shadow_roots += await self._collect_oopif_shadow_roots()

        logger.debug(f'Found {len(shadow_roots)} shadow roots')
        return shadow_roots

    async def _resolve_shadow_host(self, host_backend_id: int | None) -> WebElement | None:
        """Resolve the host element for a shadow root (best-effort)."""
        if not host_backend_id:
            return None

        host_response: ResolveNodeResponse = await self._execute_command(
            DomCommands.resolve_node(backend_node_id=host_backend_id)
        )
        host_object_id = host_response['result']['object']['objectId']
        host_attrs = await self._get_object_attributes(object_id=host_object_id)
        return WebElement(
            host_object_id, self._connection_handler, attributes_list=host_attrs, mouse=self._mouse
        )

    async def _collect_oopif_shadow_roots(self) -> list[ShadowRoot]:
        """
        Collect shadow roots from every target of type ``iframe``.

        A new ConnectionHandler on this tab's connection port is used to list
        the targets and is handed to the per-target collection step.

        Returns:
            Shadow roots found across all iframe targets; empty when there
            are no such targets.
        """
        browser_handler = ConnectionHandler(connection_port=self._connection_port)
        listing: GetTargetsResponse = await browser_handler.execute_command(
            TargetCommands.get_targets()
        )

        iframe_targets = [
            info
            for info in listing.get('result', {}).get('targetInfos', [])
            if info.get('type') == 'iframe'
        ]
        if not iframe_targets:
            logger.debug('No OOPIF targets found')
            return []

        shadow_roots: list[ShadowRoot] = []
        for iframe_target in iframe_targets:
            shadow_roots += await self._collect_shadow_roots_from_oopif_target(
                iframe_target, browser_handler
            )

        logger.debug(f'Found {len(shadow_roots)} shadow roots in OOPIFs')
        return shadow_roots

    async def _collect_shadow_roots_from_oopif_target(
        self,
        target: TargetInfo,
        browser_handler: ConnectionHandler,
    ) -> list[ShadowRoot]:
        """
        Collect the shadow roots of one OOPIF target.

        Attaches to the target in flattened mode, fetches its document through
        the resulting session and resolves every shadow root entry found.

        Args:
            target: Target info of the iframe target.
            browser_handler: Connection used for the attach and session commands.

        Returns:
            The resolved shadow roots; empty when attaching or fetching the
            document fails, or when no session id is returned.
        """
        connection_errors = (CommandExecutionTimeout, WebSocketConnectionClosed)
        target_id = target.get('targetId', '')

        try:
            attached: AttachToTargetResponse = await browser_handler.execute_command(
                TargetCommands.attach_to_target(target_id=target_id, flatten=True)
            )
        except connection_errors:
            logger.debug(f'Failed to attach to OOPIF target: {target_id}')
            return []
        session_id = attached.get('result', {}).get('sessionId')
        if not session_id:
            return []

        try:
            document_command = DomCommands.get_document(depth=-1, pierce=True)
            # Route the command to the attached iframe session.
            document_command['sessionId'] = session_id
            document: GetDocumentResponse = await browser_handler.execute_command(
                document_command
            )
            dom_root = document.get('result', {}).get('root', {})
        except connection_errors:
            logger.debug(f'Failed to get document from OOPIF target: {target_id}')
            return []

        entries: list[tuple[Node, int | None]] = []
        self._collect_shadow_roots_from_tree(dom_root, entries)

        iframe_context = IFrameContext(
            frame_id=target_id,
            session_handler=browser_handler,
            session_id=session_id,
        )

        # Entries are resolved one after another, in tree order.
        resolved_entries = [
            await self._resolve_oopif_shadow_entry(
                shadow_data, host_backend_id, browser_handler, session_id, iframe_context
            )
            for shadow_data, host_backend_id in entries
        ]
        return [shadow_root for shadow_root in resolved_entries if shadow_root]

    async def _resolve_oopif_shadow_entry(
        self,
        shadow_data: Node,
        host_backend_id: int | None,
        browser_handler: ConnectionHandler,
        session_id: str,
        iframe_context: IFrameContext,
    ) -> ShadowRoot | None:
        """Resolve a single shadow root entry from an OOPIF."""
        backend_node_id = shadow_data.get('backendNodeId')
        if not backend_node_id:
            return None

        try:
            resolve_command = DomCommands.resolve_node(backend_node_id=backend_node_id)
            resolve_command['sessionId'] = session_id
            resolve_response: ResolveNodeResponse = await browser_handler.execute_command(
                resolve_command
            )
            shadow_object_id = resolve_response['result']['object']['objectId']
        except (CommandExecutionTimeout, WebSocketConnectionClosed, KeyError):
            logger.debug(f'Failed to resolve OOPIF shadow root: backend_node_id={backend_node_id}')
            return None

        host_element = await self._resolve_oopif_shadow_host(
            host_backend_id, browser_handler, session_id
        )

        if host_element:
            host_element._iframe_context = iframe_context

        mode = ShadowRootType(shadow_data.get('shadowRootType', 'open'))
        sr = ShadowRoot(
            object_id=shadow_object_id,
            connection_handler=self._connection_handler,
            mode=mode,
            host_element=host_element,
        )

        if not host_element:
            sr._iframe_context = iframe_context

        return sr

    async def _resolve_oopif_shadow_host(
        self,
        host_backend_id: int | None,
        browser_handler: ConnectionHandler,
        session_id: str,
    ) -> WebElement | None:
        """Resolve the host element for a shadow root inside an OOPIF (best-effort)."""
        if not host_backend_id:
            return None

        try:
            resolve_command = DomCommands.resolve_node(backend_node_id=host_backend_id)
            resolve_command['sessionId'] = session_id
            host_response: ResolveNodeResponse = await browser_handler.execute_command(
                resolve_command
            )
            host_object_id = host_response['result']['object']['objectId']

            describe_command = DomCommands.describe_node(object_id=host_object_id)
            describe_command['sessionId'] = session_id
            describe_response: DescribeNodeResponse = await browser_handler.execute_command(
                describe_command
            )
            node_info = describe_response.get('result', {}).get('node', {})
            attributes = node_info.get('attributes', [])
            tag_name = node_info.get('nodeName', '').lower()
            attributes.extend(['tag_name', tag_name])

            return WebElement(
                host_object_id,
                self._connection_handler,
                attributes_list=attributes,
                mouse=self._mouse,
            )
        except (CommandExecutionTimeout, WebSocketConnectionClosed, KeyError):
            logger.debug(f'Failed to resolve OOPIF shadow host: backend_node_id={host_backend_id}')
            return None

    @staticmethod
    def _collect_shadow_roots_from_tree(node: Node, results: list[tuple[Node, int | None]]) -> None:
        """Recursively walk a DOM tree collecting shadow root entries."""
        host_backend_id = node.get('backendNodeId')
        for shadow_root in node.get('shadowRoots', []):
            results.append((shadow_root, host_backend_id))
            Tab._collect_shadow_roots_from_tree(shadow_root, results)

        for child in node.get('children', []):
            Tab._collect_shadow_roots_from_tree(child, results)

        content_doc = node.get('contentDocument')
        if content_doc:
            Tab._collect_shadow_roots_from_tree(content_doc, results)

    async def bring_to_front(self):
        """Send the Page bring-to-front command and return its response."""
        logger.info('Bringing page to front')
        front_command = PageCommands.bring_to_front()
        result = await self._execute_command(front_command)
        return result

    async def get_cookies(self) -> list[Cookie]:
        """
        Return the cookies for this tab.

        When the tab has a browser context id, cookies are read through the
        Storage domain for that context; otherwise the Network domain is used.
        """
        logger.debug('Fetching cookies for current page')
        if not self._browser_context_id:
            network_reply: NetworkGetCookiesResponse = await self._execute_command(
                NetworkCommands.get_cookies()
            )
            page_cookies = network_reply['result']['cookies']
            logger.debug(f'Fetched {len(page_cookies)} cookies')
            return page_cookies

        storage_reply: StorageGetCookiesResponse = await self._execute_command(
            StorageCommands.get_cookies(self._browser_context_id)
        )
        context_cookies = storage_reply['result']['cookies']
        logger.debug(f'Fetched {len(context_cookies)} cookies')
        return context_cookies

    async def get_network_response_body(self, request_id: str) -> str:
        """
        Fetch the body of the response that belongs to a request.

        Args:
            request_id: Identifier of the request whose response body is wanted.

        Returns:
            The ``body`` field of the command result.

        Raises:
            NetworkEventsNotEnabled: If network events are not enabled.
        """
        if not self.network_events_enabled:
            raise NetworkEventsNotEnabled('Network events must be enabled to get response body')

        body_command = NetworkCommands.get_response_body(request_id)
        reply: GetResponseBodyResponse = await self._execute_command(body_command)
        logger.debug(f'Retrieved network response body for request_id={request_id}')
        return reply['result']['body']

    async def get_network_logs(self, filter: Optional[str] = None) -> list[RequestWillBeSentEvent]:
        """
        Return the network logs held by the connection handler.

        Args:
            filter: Substring that must occur in the request URL of a log
                entry for it to be kept. A falsy value returns all logs.

        Returns:
            The (optionally filtered) network logs.

        Raises:
            NetworkEventsNotEnabled: If network events are not enabled.
        """
        if not self.network_events_enabled:
            raise NetworkEventsNotEnabled('Network events must be enabled to get network logs')

        def request_url(entry) -> str:
            # Entries without a request or URL count as having an empty URL.
            return entry['params'].get('request', {}).get('url', '')

        entries = self._connection_handler.network_logs
        if filter:
            entries = [entry for entry in entries if filter in request_url(entry)]
        logger.debug(f'Returning {len(entries)} network logs (filtered={bool(filter)})')
        return entries

    async def set_cookies(self, cookies: list[CookieParam]):
        """
        Set several cookies through the Storage domain.

        The cookies are sent together with this tab's browser context id.

        Args:
            cookies: Cookie parameters (name/value required, others optional).

        Returns:
            The response of the Storage set-cookies command.

        Note:
            Defaults to current page's domain if not specified.
        """
        logger.info(f'Setting {len(cookies)} cookies on current page')
        set_command = StorageCommands.set_cookies(cookies, self._browser_context_id)
        result = await self._execute_command(set_command)
        return result

    async def delete_all_cookies(self):
        """
        Clear all cookies of this tab's browser context.

        Returns:
            The response of the Storage clear-cookies command.
        """
        logger.info('Clearing all cookies from current browser context')
        clear_command = StorageCommands.clear_cookies(self._browser_context_id)
        result = await self._execute_command(clear_command)
        return result

    async def go_to(self, url: str, timeout: int = 300):
        """
        Navigate the tab to a URL and wait until the page has loaded.

        If ``_refresh_if_url_not_changed`` reports that the URL matches the
        current page, the method returns right after that refresh and no
        navigate command is sent.

        Args:
            url: Target URL to navigate to.
            timeout: Maximum seconds to wait for page load (default 300).

        Raises:
            PageLoadTimeout: If page doesn't finish loading within timeout.
        """
        logger.info(f'Navigating to URL: {url} (timeout={timeout}s)')
        already_on_url = await self._refresh_if_url_not_changed(url)
        if already_on_url:
            logger.debug('URL matches current page; refreshing instead')
            return

        async with self._wait_page_load(timeout=timeout):
            navigate_command = PageCommands.navigate(url)
            await self._execute_command(navigate_command)
        logger.info(f'Navigation complete: {url}')

    async def refresh(
        self,
        ignore_cache: bool = False,
        script_to_evaluate_on_load: Optional[str] = None,
    ):
        """
        Reload the current page and wait until it has loaded again.

        Args:
            ignore_cache: Bypass browser cache if True.
            script_to_evaluate_on_load: JavaScript forwarded to the reload
                command for evaluation on load.

        Raises:
            PageLoadTimeout: If page doesn't finish loading within timeout.
        """
        has_script = bool(script_to_evaluate_on_load)
        logger.info(
            f'Reloading page (ignore_cache={ignore_cache}, '
            f'script_on_load={has_script})'
        )
        async with self._wait_page_load():
            reload_command = PageCommands.reload(
                ignore_cache=ignore_cache,
                script_to_evaluate_on_load=script_to_evaluate_on_load,
            )
            await self._execute_command(reload_command)
        logger.info('Page reloaded successfully')

    async def take_screenshot(
        self,
        path: Optional[str | Path] = None,
        quality: int = 100,
        beyond_viewport: bool = False,
        as_base64: bool = False,
    ) -> Optional[str]:
        """
        Capture a screenshot of the current page.

        The image format is derived from the extension of ``path`` (``jpg`` is
        treated as ``jpeg``); without a path the JPEG format is used.

        Args:
            path: File path for screenshot (extension determines format).
            quality: Image quality 0-100 (default 100).
            beyond_viewport: Forwarded to the capture command as
                ``capture_beyond_viewport`` to capture content beyond the viewport.
            as_base64: Return as base64 string instead of saving file.

        Returns:
            Base64 screenshot data if as_base64=True, None otherwise.

        Raises:
            InvalidFileExtension: If file extension not supported.
            MissingScreenshotPath: If path is None and as_base64 is False.
            TopLevelTargetRequired: If the command result carries no image data.
        """
        if not (path or as_base64):
            raise MissingScreenshotPath()

        if path and isinstance(path, str):
            extension = path.rsplit('.', 1)[-1]
        elif path and isinstance(path, Path):
            extension = path.suffix.lstrip('.')
        else:
            extension = ScreenshotFormat.JPEG

        # Normalize jpg to jpeg (CDP only accepts jpeg)
        if extension == 'jpg':
            extension = 'jpeg'

        if not ScreenshotFormat.has_value(extension):
            raise InvalidFileExtension(f'{extension} extension is not supported.')

        image_format = ScreenshotFormat.get_value(extension)

        logger.info(
            f'Taking screenshot: path={path}, quality={quality}, '
            f'beyond_viewport={beyond_viewport}, as_base64={as_base64}'
        )
        capture_command = PageCommands.capture_screenshot(
            format=image_format,
            quality=quality,
            capture_beyond_viewport=beyond_viewport,
        )
        reply: CaptureScreenshotResponse = await self._execute_command(capture_command)

        try:
            encoded_image = reply['result']['data']
        except KeyError:
            raise TopLevelTargetRequired(
                'Command can only be executed on top-level targets. Please use '
                'take_screenshot method on the WebElement object instead.'
            )

        if as_base64:
            logger.info('Screenshot captured and returned as base64')
            return encoded_image

        if path:
            image_bytes = decode_base64_to_bytes(encoded_image)
            async with aiofiles.open(str(path), 'wb') as image_file:
                await image_file.write(image_bytes)
            logger.info(f'Screenshot saved to: {path}')

        return None

    async def print_to_pdf(
        self,
        path: Optional[str | Path] = None,
        landscape: bool = False,
        display_header_footer: bool = False,
        print_background: bool = True,
        scale: float = 1.0,
        as_base64: bool = False,
    ) -> Optional[str]:
        """
        Generate PDF of current page.

        Args:
            path: File path for PDF output. Required if as_base64=False.
            landscape: Use landscape orientation.
            display_header_footer: Include header/footer.
            print_background: Include background graphics.
            scale: Scale factor (0.1-2.0).
            as_base64: Return as base64 string instead of saving.

        Returns:
            Base64 PDF data if as_base64=True, None otherwise.

        Raises:
            ValueError: If path is not provided when as_base64=False.
        """
        logger.info(
            f'Generating PDF: path={path}, landscape={landscape}, '
            f'header_footer={display_header_footer}, print_bg={print_background}, '
            f'scale={scale}, as_base64={as_base64}'
        )
        response: PrintToPDFResponse = await self._execute_command(
            PageCommands.print_to_pdf(
                landscape=landscape,
                display_header_footer=display_header_footer,
                print_background=print_background,
                scale=scale,
            )
        )
        pdf_data = response['result']['data']
        if as_base64:
            logger.info('PDF generated and returned as base64')
            return pdf_data

        if path is None:
            raise ValueError('path is required when as_base64=False')

        pdf_bytes = decode_base64_to_bytes(pdf_data)
        async with aiofiles.open(path, 'wb') as file:
            await file.write(pdf_bytes)
        logger.info(f'PDF saved to: {path}')

        return None

    async def save_bundle(self, path: str | Path, inline_assets: bool = False) -> None:
        """
        Write the current page and its assets to a ``.zip`` archive.

        The archive always contains an ``index.html``. By default the assets
        are stored under ``assets/`` and the HTML is rewritten to reference
        them; with ``inline_assets`` the assets are embedded into the HTML and
        no separate asset files are written. Page events are enabled for the
        duration of the call when they were not already enabled, and disabled
        again afterwards.

        Args:
            path: Destination path for the ``.zip`` file.
            inline_assets: When True, embed all assets directly into
                ``index.html`` instead of saving them as separate files.

        Raises:
            InvalidFileExtension: If path does not end with ``.zip``.
        """
        path = Path(path)
        if path.suffix.lower() != '.zip':
            raise InvalidFileExtension(f'Expected .zip extension, got {path.suffix!r}')

        logger.info(f'Saving page bundle: path={path}, inline={inline_assets}')

        enabled_here = not self.page_events_enabled
        if enabled_here:
            await self.enable_page_events()

        try:
            tree_reply: GetResourceTreeResponse = await self._execute_command(
                PageCommands.get_resource_tree()
            )
            frame_tree: FrameResourceTree = tree_reply['result']['frameTree']
            page_url = frame_tree['frame']['url']
            html = await self._fetch_document_html(frame_tree)
            asset_map = await self._fetch_bundle_assets(frame_tree, page_url)

            if inline_assets:
                index_html = inline_all_assets(html, asset_map)
                asset_files = []
            else:
                index_html = rewrite_html_urls(html, asset_map)
                asset_files = [
                    (f'assets/{filename}', data)
                    for filename, data, _mime, _rtype in asset_map.values()
                ]

            # The archive is assembled in memory and written out in one go.
            archive = io.BytesIO()
            with zipfile.ZipFile(archive, 'w', zipfile.ZIP_DEFLATED) as bundle:
                bundle.writestr('index.html', index_html.encode('utf-8'))
                for archive_name, data in asset_files:
                    bundle.writestr(archive_name, data)

            async with aiofiles.open(path, 'wb') as out_file:
                await out_file.write(archive.getvalue())
            logger.info(f'Page bundle saved to: {path}')
        finally:
            # Only undo what this call switched on.
            if enabled_here:
                await self.disable_page_events()

    async def _fetch_document_html(self, frame_tree: FrameResourceTree) -> str:
        """
        Return the HTML of the frame tree's top frame.

        The content is requested via the Page resource-content command and
        base64-decoded when flagged as such. If that fails for any reason, the
        document's ``outerHTML`` is read through a script instead.
        """
        top_frame = frame_tree['frame']
        frame_id = top_frame['id']
        page_url = top_frame['url']
        try:
            content_command = PageCommands.get_resource_content(frame_id, page_url)
            reply: GetResourceContentResponse = await self._execute_command(content_command)
            payload = reply['result']
            document_html = payload['content']
            if payload.get('base64Encoded'):
                document_html = _b64.b64decode(document_html).decode('utf-8', errors='replace')
            return document_html
        except Exception:
            # Deliberately broad: any failure switches to the script fallback.
            logger.debug('getResourceContent failed for document, falling back to JS')
            script_reply = await self.execute_script('return document.documentElement.outerHTML')
            return cast(str, script_reply['result']['result']['value'])

    async def _fetch_bundle_assets(
        self,
        frame_tree: FrameResourceTree,
        page_url: str,
    ) -> dict[str, tuple[str, bytes, str, ResourceType]]:
        """
        Download every bundleable resource of the frame tree.

        All content requests are issued concurrently. Resources whose request
        raised, or whose response has no ``result``, are logged and left out.

        Args:
            frame_tree: Resource tree to take the resources from.
            page_url: URL of the page, passed to the fetchable-resource filter.

        Returns:
            Mapping of resource URL to ``(filename, data, mime_type, type)``.
        """
        fetchable = filter_fetchable_resources(collect_frame_resources(frame_tree), page_url)

        pending: list[Awaitable[GetResourceContentResponse]] = [
            self._execute_command(PageCommands.get_resource_content(frame_id, resource['url']))
            for frame_id, resource in fetchable
        ]
        # Exceptions are returned in place so one failure does not cancel the rest.
        outcomes = await asyncio.gather(*pending, return_exceptions=True)

        asset_map: dict[str, tuple[str, bytes, str, ResourceType]] = {}
        for position, (entry, outcome) in enumerate(zip(fetchable, outcomes)):
            resource = entry[1]
            if isinstance(outcome, BaseException):
                logger.warning(f'Failed to fetch resource {resource["url"]}: {outcome}')
                continue

            reply: GetResourceContentResponse = outcome
            payload = reply.get('result')
            if payload is None:
                logger.warning(f'No result for resource {resource["url"]}: {reply.get("error")}')
                continue

            text: str = payload['content']
            if payload.get('base64Encoded', False):
                data = _b64.b64decode(text)
            else:
                data = text.encode('utf-8')
            # The position keeps its gaps for skipped resources.
            filename = build_asset_filename(resource['url'], resource['mimeType'], position)
            asset_map[resource['url']] = (filename, data, resource['mimeType'], resource['type'])
        return asset_map

    async def has_dialog(self) -> bool:
        """
        Report whether a JavaScript dialog is currently recorded as open.

        The answer is derived from the connection handler's ``dialog`` value.

        Note:
            Page events must be enabled to detect dialogs.
        """
        if not self._connection_handler.dialog:
            return False

        logger.debug('Dialog present')
        return True

    async def get_dialog_message(self) -> str:
        """
        Return the message text of the JavaScript dialog that is currently open.

        Raises:
            NoDialogPresent: If no dialog is currently displayed.
        """
        dialog_open = await self.has_dialog()
        if dialog_open:
            message = self._connection_handler.dialog['params']['message']
            logger.debug(f'Dialog message retrieved: {message}')
            return message

        raise NoDialogPresent()

    async def handle_dialog(self, accept: bool, prompt_text: Optional[str] = None):
        """
        Answer the JavaScript dialog that is currently open.

        Args:
            accept: True to accept/confirm the dialog, False to dismiss/cancel it.
            prompt_text: Text for prompt dialogs (ignored for alert/confirm).

        Returns:
            The response of the ``handle_javascript_dialog`` command.

        Raises:
            NoDialogPresent: If no dialog is currently displayed.

        Note:
            Page events must be enabled to handle dialogs.
        """
        dialog_open = await self.has_dialog()
        if not dialog_open:
            raise NoDialogPresent()

        logger.info(f'Handling dialog: accept={accept}, has_prompt_text={bool(prompt_text)}')
        dialog_command = PageCommands.handle_javascript_dialog(
            accept=accept, prompt_text=prompt_text
        )
        return await self._execute_command(dialog_command)

    @overload
    async def execute_script(
        self,
        script: str,
        *,
        object_group: Optional[str] = None,
        include_command_line_api: Optional[bool] = None,
        silent: Optional[bool] = None,
        context_id: Optional[int] = None,
        return_by_value: Optional[bool] = None,
        generate_preview: Optional[bool] = None,
        user_gesture: Optional[bool] = None,
        await_promise: Optional[bool] = None,
        throw_on_side_effect: Optional[bool] = None,
        timeout: Optional[float] = None,
        disable_breaks: Optional[bool] = None,
        repl_mode: Optional[bool] = None,
        allow_unsafe_eval_blocked_by_csp: Optional[bool] = None,
        unique_context_id: Optional[str] = None,
        serialization_options: Optional[SerializationOptions] = None,
    ) -> EvaluateResponse: ...

    @overload
    async def execute_script(
        self,
        script: str,
        element: WebElement,
        *,
        arguments: Optional[list[CallArgument]] = None,
        silent: Optional[bool] = None,
        return_by_value: Optional[bool] = None,
        generate_preview: Optional[bool] = None,
        user_gesture: Optional[bool] = None,
        await_promise: Optional[bool] = None,
        execution_context_id: Optional[int] = None,
        object_group: Optional[str] = None,
        throw_on_side_effect: Optional[bool] = None,
        unique_context_id: Optional[str] = None,
        serialization_options: Optional[SerializationOptions] = None,
    ) -> CallFunctionOnResponse: ...

    async def execute_script(
        self,
        script: str,
        element: Optional[WebElement] = None,
        *,
        arguments: Optional[list[CallArgument]] = None,
        object_group: Optional[str] = None,
        include_command_line_api: Optional[bool] = None,
        silent: Optional[bool] = None,
        context_id: Optional[int] = None,
        return_by_value: Optional[bool] = None,
        generate_preview: Optional[bool] = None,
        user_gesture: Optional[bool] = None,
        await_promise: Optional[bool] = None,
        execution_context_id: Optional[int] = None,
        throw_on_side_effect: Optional[bool] = None,
        timeout: Optional[float] = None,
        disable_breaks: Optional[bool] = None,
        repl_mode: Optional[bool] = None,
        allow_unsafe_eval_blocked_by_csp: Optional[bool] = None,
        unique_context_id: Optional[str] = None,
        serialization_options: Optional[SerializationOptions] = None,
    ) -> Union[EvaluateResponse, CallFunctionOnResponse]:
        """
        Run JavaScript in the page, or (deprecated) against a specific element.

        Without ``element`` the script is sent through the evaluate command. A
        script that has a ``return`` outside of any function is first wrapped in
        an immediately-invoked function expression. With ``element`` a
        ``DeprecationWarning`` is emitted and the call is delegated to
        ``element.execute_script``; the evaluate-only options
        (``include_command_line_api``, ``context_id``, ``timeout``,
        ``disable_breaks``, ``repl_mode``, ``allow_unsafe_eval_blocked_by_csp``)
        are not forwarded on that path.

        Args:
            script (str): JavaScript code to execute.
            element (Optional[WebElement]): Deprecated. Element to run the script on.
            arguments (Optional[list[CallArgument]]): Function arguments (element path only).
            object_group (Optional[str]): Symbolic group name for the result.
            include_command_line_api (Optional[bool]): Whether to include the command
                line API (page path only).
            silent (Optional[bool]): Whether to silence exceptions.
            context_id (Optional[int]): Execution context to evaluate in (page path only).
            return_by_value (Optional[bool]): Return the result by value instead of
                by reference.
            generate_preview (Optional[bool]): Whether to generate a preview for the result.
            user_gesture (Optional[bool]): Treat the evaluation as initiated by a user gesture.
            await_promise (Optional[bool]): Whether to await a promise result.
            execution_context_id (Optional[int]): Execution context to call the function
                in (element path only).
            throw_on_side_effect (Optional[bool]): Throw if a side effect cannot be ruled out.
            timeout (Optional[float]): Evaluation timeout (page path only).
            disable_breaks (Optional[bool]): Disable breakpoints during evaluation
                (page path only).
            repl_mode (Optional[bool]): Execute in REPL mode (page path only).
            allow_unsafe_eval_blocked_by_csp (Optional[bool]): Allow unsafe evaluation
                (page path only).
            unique_context_id (Optional[str]): Unique context ID for the evaluation.
            serialization_options (Optional[SerializationOptions]): Serialization options
                for the result.

        Returns:
            Union[EvaluateResponse, CallFunctionOnResponse]: The result of the script execution.

        Raises:
            InvalidScriptWithElement: If script uses 'argument' keyword but no element is provided.

        Examples:
            # Log a message from the page
            await page.execute_script('console.log("Hello World")')

            # Read the page title
            await page.execute_script('return document.title')

            # Deprecated element form: click the element
            await page.execute_script('argument.click()', element)

            # Deprecated element form: set the element value
            await page.execute_script('argument.value = "Hello"', element)
        """
        logger.debug(f'Executing script: with_element={bool(element)}, length={len(script)}')

        if element is None:
            # A bare top-level `return` is only valid inside a function body.
            if has_return_outside_function(script):
                script = f'(function(){{ {script} }})()'

            command = self._get_evaluate_command(
                script,
                object_group=object_group,
                include_command_line_api=include_command_line_api,
                silent=silent,
                context_id=context_id,
                return_by_value=return_by_value,
                generate_preview=generate_preview,
                user_gesture=user_gesture,
                await_promise=await_promise,
                throw_on_side_effect=throw_on_side_effect,
                timeout=timeout,
                disable_breaks=disable_breaks,
                repl_mode=repl_mode,
                allow_unsafe_eval_blocked_by_csp=allow_unsafe_eval_blocked_by_csp,
                unique_context_id=unique_context_id,
                serialization_options=serialization_options,
            )
            logger.debug(f'Executing script without element: length={len(script)}')
            result: Union[EvaluateResponse, CallFunctionOnResponse] = await self._execute_command(
                command
            )
            self._validate_argument_error(result)
            return result

        warnings.warn(
            'Passing a WebElement to Tab.execute_script() is deprecated. '
            'Use WebElement.execute_script() instead.',
            DeprecationWarning,
            stacklevel=2,
        )
        return await element.execute_script(
            script,
            arguments=arguments,
            object_group=object_group,
            silent=silent,
            return_by_value=return_by_value,
            generate_preview=generate_preview,
            user_gesture=user_gesture,
            await_promise=await_promise,
            execution_context_id=execution_context_id,
            throw_on_side_effect=throw_on_side_effect,
            unique_context_id=unique_context_id,
            serialization_options=serialization_options,
        )

    # TODO: think about how to remove these duplications with the base class
    async def continue_request(
        self,
        request_id: str,
        url: Optional[str] = None,
        method: Optional[RequestMethod] = None,
        post_data: Optional[str] = None,
        headers: Optional[list[HeaderEntry]] = None,
        intercept_response: Optional[bool] = None,
    ):
        """
        Continue a paused request, optionally overriding parts of it.

        Every argument is forwarded unchanged to ``FetchCommands.continue_request``;
        arguments left as ``None`` are passed as ``None``.

        Returns:
            The response of the executed command.
        """
        logger.debug(f'Continue request on tab: id={request_id}')
        continue_command = FetchCommands.continue_request(
            request_id=request_id,
            url=url,
            method=method,
            post_data=post_data,
            headers=headers,
            intercept_response=intercept_response,
        )
        return await self._execute_command(continue_command)

    async def fail_request(self, request_id: str, error_reason: ErrorReason):
        """Fail the request identified by ``request_id`` with ``error_reason``."""
        logger.debug(f'Fail request on tab: id={request_id}, reason={error_reason}')
        failure_command = FetchCommands.fail_request(request_id, error_reason)
        return await self._execute_command(failure_command)

    async def fulfill_request(
        self,
        request_id: str,
        response_code: int,
        response_headers: Optional[list[HeaderEntry]] = None,
        body: Optional[str] = None,
        response_phrase: Optional[str] = None,
    ):
        """
        Fulfill the request identified by ``request_id`` with the given response data.

        All arguments are forwarded unchanged to ``FetchCommands.fulfill_request``.
        Only whether headers/body were supplied is logged, not their content.
        """
        logger.debug(
            f'Fulfill request on tab: id={request_id}, code={response_code}, '
            f'headers_set={bool(response_headers)}, body_set={bool(body)}'
        )
        fulfill_command = FetchCommands.fulfill_request(
            request_id=request_id,
            response_code=response_code,
            response_headers=response_headers,
            body=body,
            response_phrase=response_phrase,
        )
        return await self._execute_command(fulfill_command)

    async def continue_with_auth(
        self,
        request_id: str,
        auth_challenge_response: AuthChallengeResponseType,
        proxy_username: Optional[str] = None,
        proxy_password: Optional[str] = None,
    ):
        """Answer an authentication challenge for a paused request and continue it.

        Useful for proxy auth (407) or server auth (401) when Fetch is enabled
        with handle_auth=True. The password is never logged; only whether a
        username was supplied is.
        """
        logger.debug(
            f'Continue with auth on tab: id={request_id}, response={auth_challenge_response}, '
            f'user_set={bool(proxy_username)}'
        )
        auth_command = FetchCommands.continue_request_with_auth(
            request_id=request_id,
            auth_challenge_response=auth_challenge_response,
            proxy_username=proxy_username,
            proxy_password=proxy_password,
        )
        return await self._execute_command(auth_command)

    @asynccontextmanager
    async def expect_file_chooser(
        self, files: str | Path | list[str | Path]
    ) -> AsyncGenerator[None, None]:
        """
        Context manager for automatic file upload handling.

        While the block is active, page events and file-chooser interception
        are enabled (if they were not already) and a one-shot listener for
        ``PageEvent.FILE_CHOOSER_OPENED`` assigns ``files`` to the input that
        opened the chooser.

        On exit, interception is disabled and page events are disabled again if
        this context manager enabled them. The teardown runs even when the body
        of the ``async with`` block raises.

        Args:
            files: File path(s) for upload.
        """

        async def event_handler(event: FileChooserOpenedEvent):
            logger.info('File chooser opened; setting files')
            file_list = [str(file) for file in files] if isinstance(files, list) else [str(files)]
            await self._execute_command(
                DomCommands.set_file_input_files(
                    files=file_list,
                    backend_node_id=event['params']['backendNodeId'],
                )
            )
            logger.debug(f'Files set on input: {file_list}')

        # Remember the prior state so only what was enabled here is undone.
        _before_page_events_enabled = self.page_events_enabled is not False
        if not _before_page_events_enabled:
            await self.enable_page_events()

        try:
            if self.intercept_file_chooser_dialog_enabled is False:
                await self.enable_intercept_file_chooser_dialog()

            logger.info('Waiting for file chooser to open')
            await self.on(
                PageEvent.FILE_CHOOSER_OPENED,
                cast(Callable[[dict], Any], event_handler),
                temporary=True,
            )

            yield
        finally:
            # An exception raised inside the `async with` body is re-raised at
            # the `yield`; without this `finally` the teardown would be skipped.
            try:
                if self.intercept_file_chooser_dialog_enabled is True:
                    await self.disable_intercept_file_chooser_dialog()
            finally:
                if not _before_page_events_enabled:
                    await self.disable_page_events()

    @asynccontextmanager
    async def expect_and_bypass_cloudflare_captcha(
        self,
        custom_selector: Optional[tuple[By, str]] = None,
        time_before_click: Optional[float] = None,
        time_to_wait_captcha: float = 5,
    ) -> AsyncGenerator[None, None]:
        """
        Context manager that attempts a Cloudflare captcha bypass on page load.

        A listener for ``PageEvent.LOAD_EVENT_FIRED`` runs the bypass routine.
        After the body of the ``async with`` block finishes, the context waits
        until one bypass attempt has completed, then removes the listener and
        restores the previous page-events state.

        Args:
            custom_selector: Deprecated — ignored. Cloudflare Turnstile is now
                detected automatically via shadow root inspection.
            time_before_click: Deprecated — ignored. The checkbox is now
                located via shadow root polling and clicked immediately.
            time_to_wait_captcha: Timeout for captcha detection (default 5s).
        """
        deprecated_arguments = (
            (
                custom_selector,
                'custom_selector is deprecated and ignored. Cloudflare Turnstile is now '
                'detected automatically via shadow root inspection.',
            ),
            (
                time_before_click,
                'time_before_click is deprecated and ignored. The checkbox is now '
                'located via shadow root polling and clicked immediately.',
            ),
        )
        for supplied_value, deprecation_message in deprecated_arguments:
            if supplied_value is not None:
                warnings.warn(deprecation_message, DeprecationWarning, stacklevel=2)

        captcha_processed = asyncio.Event()

        async def bypass_cloudflare(load_event: dict):
            # Always signal completion so the context exit cannot wait on a
            # bypass attempt that failed.
            try:
                await self._bypass_cloudflare(
                    load_event,
                    time_to_wait_captcha=time_to_wait_captcha,
                )
            finally:
                captcha_processed.set()

        page_events_were_enabled = self.page_events_enabled
        if not page_events_were_enabled:
            await self.enable_page_events()

        logger.info('Expecting and bypassing Cloudflare captcha if present')
        callback_id = await self.on(PageEvent.LOAD_EVENT_FIRED, bypass_cloudflare)

        try:
            yield
            await captcha_processed.wait()
        finally:
            await self._connection_handler.remove_callback(callback_id)
            if not page_events_were_enabled:
                await self.disable_page_events()

    @asynccontextmanager
    async def expect_download(
        self,
        keep_file_at: Optional[Union[str, Path]] = None,
        timeout: Optional[float] = None,
    ) -> AsyncGenerator[_DownloadHandle, None]:
        """
        Context manager that captures a file download started inside the block.

        Behavior:
        - With ``keep_file_at``, the browser saves into that directory (created
          if missing) and the file is kept.
        - Without it, a temporary directory is used and cleaned up afterwards.

        After the body finishes, the context waits for the download to complete
        and then always runs the download cleanup.

        Args:
            keep_file_at: Directory to persist the file. If None, uses a temporary
                directory and cleans it up afterwards.
            timeout: Max seconds to wait for download completion. Defaults to 60.

        Yields:
            _DownloadHandle: Handle to read the downloaded file (bytes/base64) and check its path.

        Raises:
            DownloadTimeout: If the download does not complete within the timeout.
        """
        download_timeout = float(timeout) if timeout is not None else 60.0

        if keep_file_at is not None:
            download_dir = str(Path(keep_file_at))
            Path(download_dir).mkdir(parents=True, exist_ok=True)
            cleanup_dir = False
        else:
            download_dir = mkdtemp(prefix='pydoll-download-')
            cleanup_dir = True

        logger.info(f'Expecting download (dir={download_dir}, timeout={download_timeout}s)')
        await self._browser.set_download_behavior(
            behavior=DownloadBehavior.ALLOW,
            download_path=download_dir,
            browser_context_id=self._browser_context_id,
        )

        _page_events_was_enabled = bool(self._page_events_enabled)
        if not _page_events_was_enabled:
            await self.enable_page_events()

        loop = asyncio.get_event_loop()
        will_begin: asyncio.Future[bool] = loop.create_future()
        done: asyncio.Future[bool] = loop.create_future()
        # Shared between the event handlers and the handle given to the caller.
        state: dict[str, Any] = {
            'guid': None,
            'url': None,
            'suggestedFilename': None,
            'filePath': None,
            'dir': download_dir,
        }

        async def on_will_begin(event: DownloadWillBeginEvent):
            params = event['params']
            state['guid'] = params['guid']
            state['url'] = params['url']
            state['suggestedFilename'] = params['suggestedFilename']
            if not will_begin.done():
                will_begin.set_result(True)
            logger.info(
                f'Download will begin: url={state["url"]}, filename={state["suggestedFilename"]}'
            )

        async def on_progress(event: DownloadProgressEvent):
            params = event['params']
            guid = params['guid']
            # Skip progress reported for a different download than the tracked one.
            if state.get('guid') and guid != state['guid']:
                return
            # Only the completion notification matters here.
            if params['state'] != DownloadProgressState.COMPLETED:
                return
            file_path = params.get('filePath')
            if not file_path:
                file_path = str(Path(download_dir) / state['suggestedFilename'])
            state['filePath'] = file_path
            if not done.done():
                done.set_result(True)
            logger.info(f'Download completed: {file_path}')

        await self.on(
            PageEvent.DOWNLOAD_WILL_BEGIN,
            cast(Callable[[dict], Awaitable[Any]], on_will_begin),
            temporary=True,
        )
        cb_id_progress = await self.on(
            PageEvent.DOWNLOAD_PROGRESS,
            cast(Callable[[dict], Awaitable[Any]], on_progress),
            temporary=False,
        )

        handle = _DownloadHandle(
            state=state,
            will_begin_future=will_begin,
            done_future=done,
            timeout=download_timeout,
        )

        try:
            yield handle
            try:
                await asyncio.wait_for(done, timeout=download_timeout)
            except asyncio.TimeoutError as exc:
                raise DownloadTimeout() from exc
        finally:
            await self._cleanup_download_context(
                cb_id_progress,
                _page_events_was_enabled,
                cleanup_dir,
                state,
                download_dir,
            )

    async def _cleanup_download_context(
        self,
        cb_id_progress: int,
        page_events_was_enabled: bool,
        cleanup_dir: bool,
        state: dict[str, Any],
        download_dir: str,
    ) -> None:
        """
        Undo everything ``expect_download`` set up.

        Removes the progress callback, resets the download behavior to
        ``DownloadBehavior.DEFAULT``, deletes the temporary download directory
        when one was created, and disables page events if they were enabled
        only for the download.

        Args:
            cb_id_progress: ID of the download-progress callback to remove.
            page_events_was_enabled: Whether page events were already enabled
                before the download context started.
            cleanup_dir: True when ``download_dir`` is a temporary directory
                that must be deleted.
            state: Shared download state; its ``filePath`` entry, if set, is the
                downloaded file.
            download_dir: Directory the download was written to.
        """
        try:
            await self.remove_callback(cb_id_progress)
            await self._browser.set_download_behavior(
                behavior=DownloadBehavior.DEFAULT,
                browser_context_id=self._browser_context_id,
            )
        finally:
            if cleanup_dir:
                file_path = state.get('filePath')
                if file_path:
                    # Best effort: the directory removal below is the backstop.
                    with contextlib.suppress(OSError):
                        Path(file_path).unlink(missing_ok=True)
                # Remove the temporary directory even when no file was ever
                # recorded (e.g. the download timed out), so it is not leaked.
                shutil.rmtree(download_dir, ignore_errors=True)

            # Restore page events regardless of whether a file was downloaded.
            if not page_events_was_enabled:
                await self.disable_page_events()

    @overload
    async def on(
        self, event_name: str, callback: Callable[[dict], Any], temporary: bool = False
    ) -> int: ...
    @overload
    async def on(
        self, event_name: str, callback: Callable[[dict], Awaitable[Any]], temporary: bool = False
    ) -> int: ...
    async def on(
        self,
        event_name,
        callback,
        temporary=False,
    ) -> int:
        """
        Register CDP event listener.

        A coroutine-function callback is started as a background task for each
        event so it does not block event dispatch; any other callable is
        registered as-is. The tab keeps a reference to every running background
        task until it finishes, because the event loop itself only holds weak
        references to tasks.

        Args:
            event_name: CDP event name (e.g., 'Page.loadEventFired').
            callback: Function called on event (sync or async).
            temporary: Remove after first invocation.

        Returns:
            Callback ID for removal.

        Note:
            Corresponding domain must be enabled before events fire.
        """
        is_async_callback = asyncio.iscoroutinefunction(callback)

        if is_async_callback:
            # Created lazily so this method does not depend on __init__.
            background_tasks = getattr(self, '_callback_tasks', None)
            if background_tasks is None:
                background_tasks = set()
                self._callback_tasks = background_tasks

            async def callback_wrapper(event):
                task = asyncio.create_task(callback(event))
                # Hold a strong reference until completion; otherwise the task
                # may be garbage-collected while it is still running.
                background_tasks.add(task)
                task.add_done_callback(background_tasks.discard)

            function_to_register = callback_wrapper
        else:
            function_to_register = callback

        logger.debug(
            f'Registering callback on tab: event={event_name}, temporary={temporary}, '
            f'async={is_async_callback}'
        )
        return await self._connection_handler.register_callback(
            event_name, function_to_register, temporary
        )

    async def remove_callback(self, callback_id: int):
        """Unregister the callback with ``callback_id`` via the connection handler."""
        logger.debug(f'Removing callback from tab: id={callback_id}')
        removal_result = await self._connection_handler.remove_callback(callback_id)
        return removal_result

    async def clear_callbacks(self):
        """Ask the connection handler to drop every registered event callback."""
        logger.debug('Clearing all callbacks from tab')
        handler = self._connection_handler
        await handler.clear_callbacks()

    def _get_connection_handler(self) -> ConnectionHandler:
        """
        Build the connection handler for this tab.

        A WebSocket address, when set, takes precedence; otherwise the handler
        is created from the connection port and target id.
        """
        if not self._ws_address:
            logger.debug(
                'Using port/target for connection handler: '
                f'port={self._connection_port}, target_id={self._target_id}'
            )
            return ConnectionHandler(self._connection_port, self._target_id)

        logger.debug('Using WebSocket address for connection handler')
        return ConnectionHandler(ws_address=self._ws_address)

    @staticmethod
    def _get_evaluate_command(
        script: str,
        *,
        object_group: Optional[str] = None,
        include_command_line_api: Optional[bool] = None,
        silent: Optional[bool] = None,
        context_id: Optional[int] = None,
        return_by_value: Optional[bool] = None,
        generate_preview: Optional[bool] = None,
        user_gesture: Optional[bool] = None,
        await_promise: Optional[bool] = None,
        throw_on_side_effect: Optional[bool] = None,
        timeout: Optional[float] = None,
        disable_breaks: Optional[bool] = None,
        repl_mode: Optional[bool] = None,
        allow_unsafe_eval_blocked_by_csp: Optional[bool] = None,
        unique_context_id: Optional[str] = None,
        serialization_options: Optional[SerializationOptions] = None,
    ):
        """
        Build the evaluate command for ``script``.

        ``script`` is passed as the ``expression``; every keyword option is
        handed to ``RuntimeCommands.evaluate`` under the same name, unchanged.
        """
        build_evaluate = RuntimeCommands.evaluate
        return build_evaluate(
            expression=script,
            # Result handling
            object_group=object_group,
            return_by_value=return_by_value,
            generate_preview=generate_preview,
            serialization_options=serialization_options,
            # Execution context
            context_id=context_id,
            unique_context_id=unique_context_id,
            # Evaluation behaviour
            include_command_line_api=include_command_line_api,
            silent=silent,
            user_gesture=user_gesture,
            await_promise=await_promise,
            throw_on_side_effect=throw_on_side_effect,
            timeout=timeout,
            disable_breaks=disable_breaks,
            repl_mode=repl_mode,
            allow_unsafe_eval_blocked_by_csp=allow_unsafe_eval_blocked_by_csp,
        )

    async def _refresh_if_url_not_changed(self, url: str) -> bool:
        """
        Refresh the page when it is already at ``url``.

        Returns:
            True if the current URL equals ``url`` and a refresh was issued,
            False otherwise.
        """
        if (await self.current_url) != url:
            return False

        await self.refresh()
        return True

    @staticmethod
    def _validate_argument_error(response: EvaluateResponse) -> None:
        """
        Detect a script that referenced ``argument`` without an element.

        The check only fires when the evaluated value is a ``ReferenceError``
        object whose description mentions ``argument is not defined``; any
        other response shape is accepted silently.

        Raises:
            InvalidScriptWithElement: If script uses 'argument' keyword but no element was provided.
        """
        evaluate_result = response.get('result')
        remote_object = (
            evaluate_result.get('result') if isinstance(evaluate_result, dict) else None
        )
        if not isinstance(remote_object, dict):
            return

        is_reference_error = (
            remote_object.get('type') == 'object'
            and remote_object.get('subtype') == 'error'
            and remote_object.get('className') == 'ReferenceError'
        )
        if is_reference_error and 'argument is not defined' in remote_object.get(
            'description', ''
        ):
            raise InvalidScriptWithElement('Script contains "argument" but no element was provided')

    # Maps each supported page load state to the CDP page event that
    # `_wait_page_load` waits for. A state missing from this mapping makes
    # that lookup raise KeyError.
    _PAGE_LOAD_EVENT_MAP = {
        PageLoadState.INTERACTIVE: PageEvent.DOM_CONTENT_EVENT_FIRED,
        PageLoadState.COMPLETE: PageEvent.LOAD_EVENT_FIRED,
    }

    @asynccontextmanager
    async def _wait_page_load(self, timeout: int = 300):
        """Wait, via a CDP event, until the page reaches the configured load state.

        The listener is registered **before** control is handed to the
        ``async with`` body, so the navigation command can be issued inside the
        block without racing the event. Once the body finishes, the context
        waits for the event.

        Which event is awaited depends on ``browser.options.page_load_state``:

        * ``INTERACTIVE`` — ``Page.domContentEventFired``.
        * ``COMPLETE`` — ``Page.loadEventFired``.

        Page events are enabled for the duration of the wait when they were not
        already, and disabled again afterwards. Errors raised while removing
        the listener or disabling page events are suppressed.

        Args:
            timeout: Maximum seconds to wait for the target load state.

        Raises:
            PageLoadTimeout: If the page doesn't reach the target state in time.
        """
        event_name = self._PAGE_LOAD_EVENT_MAP[self._browser.options.page_load_state]
        page_loaded = asyncio.Event()

        cleanup_page_events = not self._page_events_enabled
        if cleanup_page_events:
            await self.enable_page_events()

        def mark_loaded(_event: dict):
            page_loaded.set()

        callback_id = await self.on(event_name, mark_loaded)
        logger.debug(f'Waiting for page load via {event_name} (timeout={timeout}s)')

        try:
            yield
            await asyncio.wait_for(page_loaded.wait(), timeout=timeout)
            logger.debug(f'Page load event received: {event_name}')
        except asyncio.TimeoutError:
            logger.error(f'Page load timeout after {timeout}s waiting for {event_name}')
            raise PageLoadTimeout()
        finally:
            # Cleanup is best effort and must not mask the outcome of the wait.
            with contextlib.suppress(Exception):
                await self.remove_callback(callback_id)
            if cleanup_page_events:
                with contextlib.suppress(Exception):
                    await self.disable_page_events()

    async def _find_cloudflare_shadow_root(self, timeout: float) -> ShadowRoot:
        """Poll until a shadow root containing the Cloudflare challenge is found.

        Each round calls ``find_shadow_roots(deep=False)`` and inspects every
        root's ``inner_html`` for the Cloudflare challenge domain. Rounds are
        separated by a 0.5 second pause, and the deadline is checked after a
        round, so at least one round always runs.

        Args:
            timeout: Maximum seconds to wait for the shadow root.

        Returns:
            The first ShadowRoot whose inner HTML contains the challenge domain.

        Raises:
            WaitElementTimeout: If no matching shadow root is found within
                *timeout* seconds.
        """
        started_at = asyncio.get_event_loop().time()
        while True:
            for candidate in await self.find_shadow_roots(deep=False):
                if _CLOUDFLARE_CHALLENGE_DOMAIN in await candidate.inner_html:
                    return candidate

            elapsed = asyncio.get_event_loop().time() - started_at
            if elapsed > timeout:
                raise WaitElementTimeout(
                    f'Timed out after {timeout}s waiting for Cloudflare Turnstile shadow root'
                )
            await asyncio.sleep(0.5)

    async def _bypass_cloudflare(
        self,
        event: dict,
        time_to_wait_captcha: float = 5,
    ) -> None:
        """Try to click the Cloudflare Turnstile checkbox through its shadow roots.

        Steps: locate the Cloudflare shadow root, query the iframe inside it,
        find the iframe's ``body``, open the body's shadow root and click the
        checkbox element found there. Any failure along the way is logged as
        an error and not re-raised.

        Args:
            event: The triggering event payload (not used by the routine).
            time_to_wait_captcha: Timeout, in seconds, applied to each lookup.
        """
        try:
            # Some lookups receive the timeout truncated to an integer.
            timeout_int = int(time_to_wait_captcha)
            outer_root = await self._find_cloudflare_shadow_root(
                timeout=time_to_wait_captcha,
            )
            challenge_frame = await outer_root.query(
                _CLOUDFLARE_IFRAME_SELECTOR, timeout=timeout_int
            )
            frame_body = await challenge_frame.find(tag_name='body', timeout=timeout_int)
            inner_root = await frame_body.get_shadow_root(timeout=time_to_wait_captcha)
            target = await inner_root.query(_CLOUDFLARE_CHECKBOX_SELECTOR, timeout=timeout_int)
            await target.click()
        except Exception as exc:
            logger.error(f'Error in cloudflare bypass: {exc}')


class _DownloadHandle:
    """Handle returned by expect_download to access the downloaded file.

    The handle wraps two futures and a state mapping that are supplied by its
    creator. It only awaits the futures and reads ``state['filePath']``; it
    never resolves the futures itself.
    """

    def __init__(
        self,
        state: dict[str, Any],
        will_begin_future: asyncio.Future[bool],
        done_future: asyncio.Future[bool],
        timeout: float,
    ) -> None:
        """Store the shared download state.

        Args:
            state: Mapping from which ``'filePath'`` is read.
            will_begin_future: Future awaited by :meth:`wait_started`.
            done_future: Future awaited by :meth:`wait_finished`.
            timeout: Default number of seconds used by the ``wait_*`` methods
                when no explicit timeout is passed.
        """
        self._state = state
        self._will_begin_future = will_begin_future
        self._done_future = done_future
        self._timeout = timeout

    @property
    def file_path(self) -> Optional[str]:
        """Value stored under ``'filePath'`` in the state, or ``None`` if absent."""
        return self._state.get('filePath')

    def _resolve_timeout(self, timeout: Optional[float]) -> float:
        """Return *timeout* unless it is ``None``, in which case use the default.

        An explicit ``0`` is a valid request ("do not wait") and must not be
        replaced by the default, hence the ``is None`` test instead of ``or``.
        """
        return self._timeout if timeout is None else timeout

    async def wait_started(self, timeout: Optional[float] = None) -> None:
        """Wait until the "will begin" future completes.

        Args:
            timeout: Seconds to wait; ``None`` selects the handle's default.

        Raises:
            asyncio.TimeoutError: If the future is not done in time.
        """
        # shield(): wait_for() cancels what it awaits on timeout. The future is
        # shared, so cancelling it would break every later wait on this handle.
        await asyncio.wait_for(
            asyncio.shield(self._will_begin_future),
            timeout=self._resolve_timeout(timeout),
        )

    async def wait_finished(self, timeout: Optional[float] = None) -> None:
        """Wait until the "done" future completes.

        Args:
            timeout: Seconds to wait; ``None`` selects the handle's default.

        Raises:
            asyncio.TimeoutError: If the future is not done in time.
        """
        # See wait_started() for why the shared future is shielded.
        await asyncio.wait_for(
            asyncio.shield(self._done_future),
            timeout=self._resolve_timeout(timeout),
        )

    async def read_bytes(self) -> bytes:
        """Wait for the download to finish and return the file's raw bytes.

        Raises:
            asyncio.TimeoutError: If the download does not finish within the
                handle's default timeout.
            FileNotFoundError: If no file path is available in the state.
        """
        await self.wait_finished()
        if not self.file_path:
            raise FileNotFoundError('Download file path not available')
        async with aiofiles.open(self.file_path, 'rb') as f:  # type: ignore[arg-type]
            return await f.read()

    async def read_base64(self) -> str:
        """Return the downloaded file's content as a base64-encoded ASCII string."""
        data = await self.read_bytes()
        return _b64.b64encode(data).decode('ascii')


================================================
FILE: pydoll/commands/__init__.py
================================================
# global imports
from pydoll.commands.browser_commands import BrowserCommands
from pydoll.commands.dom_commands import DomCommands
from pydoll.commands.emulation_commands import EmulationCommands
from pydoll.commands.fetch_commands import FetchCommands
from pydoll.commands.input_commands import InputCommands
from pydoll.commands.network_commands import NetworkCommands
from pydoll.commands.page_commands import PageCommands
from pydoll.commands.runtime_commands import RuntimeCommands
from pydoll.commands.storage_commands import StorageCommands
from pydoll.commands.target_commands import TargetCommands

# Names exported by ``from pydoll.commands import *``. Every entry is one of
# the command classes imported at the top of this module.
__all__ = [
    'DomCommands',
    'EmulationCommands',
    'FetchCommands',
    'InputCommands',
    'NetworkCommands',
    'PageCommands',
    'RuntimeCommands',
    'StorageCommands',
    'BrowserCommands',
    'TargetCommands',
]


================================================
FILE: pydoll/commands/browser_commands.py
================================================
from __future__ import annotations

from typing import TYPE_CHECKING, Optional

from pydoll.protocol.base import Command
from pydoll.protocol.browser.methods import (
    AddPrivacySandboxCoordinatorKeyConfigParams,
    AddPrivacySandboxEnrollmentOverrideParams,
    BrowserMethod,
    CancelDownloadParams,
    ExecuteBrowserCommandParams,
    GetHistogramParams,
    GetHistogramsParams,
    GetWindowBoundsParams,
    GetWindowForTargetParams,
    GrantPermissionsParams,
    ResetPermissionsParams,
    SetContentsSizeParams,
    SetDockTileParams,
    SetDownloadBehaviorParams,
    SetPermissionParams,
    SetWindowBoundsParams,
)
from pydoll.protocol.browser.types import (
    Bounds,
    WindowState,
)

if TYPE_CHECKING:
    from pydoll.protocol.browser.methods import (
        AddPrivacySandboxCoordinatorKeyConfigCommand,
        AddPrivacySandboxEnrollmentOverrideCommand,
        CancelDownloadCommand,
        CloseCommand,
        CrashCommand,
        CrashGpuProcessCommand,
        DownloadBehavior,
        ExecuteBrowserCommandCommand,
        GetBrowserCommandLineCommand,
        GetHistogramCommand,
        GetHistogramsCommand,
        GetVersionCommand,
        GetWindowBoundsCommand,
        GetWindowForTargetCommand,
        GrantPermissionsCommand,
        ResetPermissionsCommand,
        SetContentsSizeCommand,
        SetDockTileCommand,
        SetDownloadBehaviorCommand,
        SetPermissionCommand,
        SetWindowBoundsCommand,
    )
    from pydoll.protocol.browser.types import (
        BrowserCommandId,
        BrowserContextID,
        PermissionDescriptor,
        PermissionSetting,
        PermissionType,
        PrivacySandboxAPI,
        WindowID,
    )


class BrowserCommands:
    """
    Builders for Chrome DevTools Protocol (CDP) commands of the Browser domain.

    Every method is a ``@staticmethod`` that assembles a ``Command`` object and
    returns it to the caller.

    The builders cover:
    - Version, command-line and histogram queries.
    - Window lookup, window bounds, contents size and window state.
    - Permissions and download behavior.
    - Privacy sandbox configuration intended for test automation.
    - Closing the browser or crashing the browser / GPU process.
    """

    @staticmethod
    def get_version() -> GetVersionCommand:
        """
        Build the command that requests browser version information.

        Returns:
            GetVersionCommand: CDP command whose response carries the protocol
                version, product name, revision, and user agent.
        """
        return Command(method=BrowserMethod.GET_VERSION)

    @staticmethod
    def get_browser_command_line() -> GetBrowserCommandLineCommand:
        """
        Build the command that requests the browser process' command line switches.

        Returns:
            GetBrowserCommandLineCommand: CDP command that returns the command
                line arguments.

        Note: Only works if --enable-automation is on the command line.
        """
        return Command(method=BrowserMethod.GET_BROWSER_COMMAND_LINE)

    @staticmethod
    def get_histograms(
        query: Optional[str] = None,
        delta: bool = False,
    ) -> GetHistogramsCommand:
        """
        Build the command that fetches Chrome histograms.

        Args:
            query: Substring to look for in histogram names. Only histograms whose
                   name contains it are extracted; an empty or absent query returns
                   all histograms.
            delta: If true, retrieve delta since last delta call.

        Returns:
            GetHistogramsCommand: CDP command that returns histogram data.
        """
        payload = GetHistogramsParams()
        # Optional keys are added only when the caller supplied them.
        if query is not None:
            payload['query'] = query
        if delta:
            payload['delta'] = delta
        return Command(method=BrowserMethod.GET_HISTOGRAMS, params=payload)

    @staticmethod
    def get_histogram(
        name: str,
        delta: bool = False,
    ) -> GetHistogramCommand:
        """
        Build the command that fetches a single Chrome histogram by name.

        Args:
            name: Name of the requested histogram.
            delta: If true, retrieve delta since last delta call.

        Returns:
            GetHistogramCommand: CDP command that returns histogram data.
        """
        payload = GetHistogramParams(name=name)
        if delta:
            payload['delta'] = delta
        return Command(method=BrowserMethod.GET_HISTOGRAM, params=payload)

    @staticmethod
    def get_window_bounds(window_id: WindowID) -> GetWindowBoundsCommand:
        """
        Build the command that reads position and size of a browser window.

        Args:
            window_id: Browser window id.

        Returns:
            GetWindowBoundsCommand: CDP command that returns window bounds information.
        """
        return Command(
            method=BrowserMethod.GET_WINDOW_BOUNDS,
            params=GetWindowBoundsParams(windowId=window_id),
        )

    @staticmethod
    def get_window_for_target(
        target_id: Optional[str] = None,
    ) -> GetWindowForTargetCommand:
        """
        Build the command that finds the browser window containing a devtools target.

        Args:
            target_id: Devtools agent host id. If called as a part of the session,
                      associated targetId is used.

        Returns:
            GetWindowForTargetCommand: CDP command that returns window information
                including windowId and bounds.
        """
        payload = GetWindowForTargetParams()
        if target_id is not None:
            payload['targetId'] = target_id
        return Command(method=BrowserMethod.GET_WINDOW_FOR_TARGET, params=payload)

    @staticmethod
    def set_window_bounds(window_id: WindowID, bounds: Bounds) -> SetWindowBoundsCommand:
        """
        Build the command that sets position and/or size of a browser window.

        Args:
            window_id: Browser window id.
            bounds: New window bounds. The 'minimized', 'maximized' and 'fullscreen'
                   states cannot be combined with 'left', 'top', 'width' or 'height'.
                   Fields that are not specified are left unchanged.

        Returns:
            SetWindowBoundsCommand: CDP command that sets window bounds.
        """
        return Command(
            method=BrowserMethod.SET_WINDOW_BOUNDS,
            params=SetWindowBoundsParams(windowId=window_id, bounds=bounds),
        )

    @staticmethod
    def set_contents_size(
        window_id: WindowID,
        width: Optional[int] = None,
        height: Optional[int] = None,
    ) -> SetContentsSizeCommand:
        """
        Build the command that sets the size of the browser contents, resizing
        the browser window as necessary.

        Args:
            window_id: Browser window id.
            width: Window contents width in DIP. The current width is assumed if
                  omitted. Must be specified if 'height' is omitted.
            height: Window contents height in DIP. The current height is assumed if
                   omitted. Must be specified if 'width' is omitted.

        Returns:
            SetContentsSizeCommand: CDP command that sets window contents size.
        """
        payload = SetContentsSizeParams(windowId=window_id)
        if width is not None:
            payload['width'] = width
        if height is not None:
            payload['height'] = height
        return Command(method=BrowserMethod.SET_CONTENTS_SIZE, params=payload)

    @staticmethod
    def set_dock_tile(
        badge_label: Optional[str] = None,
        image: Optional[str] = None,
    ) -> SetDockTileCommand:
        """
        Build the command that sets dock tile details (platform-specific).

        Args:
            badge_label: Optional badge label.
            image: Png encoded image (base64 string when passed over JSON).

        Returns:
            SetDockTileCommand: CDP command that sets dock tile details.
        """
        payload = SetDockTileParams()
        if badge_label is not None:
            payload['badgeLabel'] = badge_label
        if image is not None:
            payload['image'] = image
        return Command(method=BrowserMethod.SET_DOCK_TILE, params=payload)

    @staticmethod
    def execute_browser_command(command_id: BrowserCommandId) -> ExecuteBrowserCommandCommand:
        """
        Build the command that invokes a custom browser command used by telemetry.

        Args:
            command_id: Browser command identifier.

        Returns:
            ExecuteBrowserCommandCommand: CDP command that executes the browser command.
        """
        return Command(
            method=BrowserMethod.EXECUTE_BROWSER_COMMAND,
            params=ExecuteBrowserCommandParams(commandId=command_id),
        )

    @staticmethod
    def add_privacy_sandbox_enrollment_override(
        url: str,
    ) -> AddPrivacySandboxEnrollmentOverrideCommand:
        """
        Build the command that lets a site use privacy sandbox features requiring
        enrollment without the site actually being enrolled. Only supported on
        page targets.

        Args:
            url: Site URL.

        Returns:
            AddPrivacySandboxEnrollmentOverrideCommand: CDP command that adds the
            enrollment override.
        """
        return Command(
            method=BrowserMethod.ADD_PRIVACY_SANDBOX_ENROLLMENT_OVERRIDE,
            params=AddPrivacySandboxEnrollmentOverrideParams(url=url),
        )

    @staticmethod
    def add_privacy_sandbox_coordinator_key_config(
        api: PrivacySandboxAPI,
        coordinator_origin: str,
        key_config: str,
        browser_context_id: Optional[BrowserContextID] = None,
    ) -> AddPrivacySandboxCoordinatorKeyConfigCommand:
        """
        Build the command that configures the encryption keys a privacy sandbox
        API uses to talk to a trusted coordinator.

        This is intended for test automation only, so coordinatorOrigin must be a
        .test domain. No existing coordinator configuration for the origin may
        exist.

        Args:
            api: Privacy Sandbox API type.
            coordinator_origin: Coordinator origin (must be .test domain).
            key_config: Key configuration string.
            browser_context_id: BrowserContext to perform the action in. When omitted,
                               default browser context is used.

        Returns:
            AddPrivacySandboxCoordinatorKeyConfigCommand: CDP command that adds the
            key config.
        """
        payload = AddPrivacySandboxCoordinatorKeyConfigParams(
            api=api,
            coordinatorOrigin=coordinator_origin,
            keyConfig=key_config,
        )
        if browser_context_id is not None:
            payload['browserContextId'] = browser_context_id
        return Command(
            method=BrowserMethod.ADD_PRIVACY_SANDBOX_COORDINATOR_KEY_CONFIG,
            params=payload,
        )

    @staticmethod
    def set_permission(
        permission: PermissionDescriptor,
        setting: PermissionSetting,
        origin: Optional[str] = None,
        browser_context_id: Optional[BrowserContextID] = None,
    ) -> SetPermissionCommand:
        """
        Build the command that sets a permission setting for a given origin.

        Args:
            permission: Descriptor of permission to override.
            setting: Setting of the permission.
            origin: Origin the permission applies to, all origins if not specified.
            browser_context_id: Context to override. When omitted, default browser
                               context is used.

        Returns:
            SetPermissionCommand: CDP command that sets the permission.
        """
        payload = SetPermissionParams(permission=permission, setting=setting)
        if origin is not None:
            payload['origin'] = origin
        if browser_context_id is not None:
            payload['browserContextId'] = browser_context_id
        return Command(method=BrowserMethod.SET_PERMISSION, params=payload)

    @staticmethod
    def grant_permissions(
        permissions: list['PermissionType'],
        origin: Optional[str] = None,
        browser_context_id: Optional['BrowserContextID'] = None,
    ) -> GrantPermissionsCommand:
        """
        Build the command that grants specific permissions to the given origin
        and rejects all others.

        Args:
            permissions: List of permissions to grant.
            origin: Origin the permission applies to, all origins if not specified.
            browser_context_id: BrowserContext to override permissions. When omitted,
                               default browser context is used.

        Returns:
            GrantPermissionsCommand: CDP command that grants the permissions.
        """
        payload = GrantPermissionsParams(permissions=permissions)
        if origin is not None:
            payload['origin'] = origin
        if browser_context_id is not None:
            payload['browserContextId'] = browser_context_id
        return Command(method=BrowserMethod.GRANT_PERMISSIONS, params=payload)

    @staticmethod
    def reset_permissions(
        browser_context_id: Optional['BrowserContextID'] = None,
    ) -> ResetPermissionsCommand:
        """
        Build the command that resets all permission management for all origins.

        Args:
            browser_context_id: BrowserContext to reset permissions. When omitted,
                               default browser context is used.

        Returns:
            ResetPermissionsCommand: CDP command that resets permissions.
        """
        payload = ResetPermissionsParams()
        if browser_context_id is not None:
            payload['browserContextId'] = browser_context_id
        return Command(method=BrowserMethod.RESET_PERMISSIONS, params=payload)

    @staticmethod
    def set_download_behavior(
        behavior: DownloadBehavior,
        browser_context_id: Optional['BrowserContextID'] = None,
        download_path: Optional[str] = None,
        events_enabled: bool = False,
    ) -> SetDownloadBehaviorCommand:
        """
        Build the command that sets the behavior when downloading a file.

        Args:
            behavior: Whether to allow all or deny all download requests, or use
                     default Chrome behavior if available (otherwise deny).
                     allowAndName allows download and names files according to
                     their download guids.
            browser_context_id: BrowserContext to set download behavior. When omitted,
                               default browser context is used.
            download_path: The default path to save downloaded files to. This is
                          required if behavior is set to 'allow' or 'allowAndName'.
            events_enabled: Whether to emit download events (defaults to false).

        Returns:
            SetDownloadBehaviorCommand: CDP command that sets download behavior.
        """
        payload = SetDownloadBehaviorParams(behavior=behavior)
        if browser_context_id is not None:
            payload['browserContextId'] = browser_context_id
        if download_path is not None:
            payload['downloadPath'] = download_path
        # The default is False (not None), so 'eventsEnabled' is included unless
        # a caller passes None explicitly.
        if events_enabled is not None:
            payload['eventsEnabled'] = events_enabled
        return Command(method=BrowserMethod.SET_DOWNLOAD_BEHAVIOR, params=payload)

    @staticmethod
    def cancel_download(
        guid: str,
        browser_context_id: Optional['BrowserContextID'] = None,
    ) -> CancelDownloadCommand:
        """
        Build the command that cancels a download if it is in progress.

        Args:
            guid: Global unique identifier of the download.
            browser_context_id: BrowserContext to perform the action in. When omitted,
                               default browser context is used.

        Returns:
            CancelDownloadCommand: CDP command that cancels the download.
        """
        payload = CancelDownloadParams(guid=guid)
        if browser_context_id is not None:
            payload['browserContextId'] = browser_context_id
        return Command(method=BrowserMethod.CANCEL_DOWNLOAD, params=payload)

    @staticmethod
    def close() -> CloseCommand:
        """
        Build the command that closes the browser gracefully.

        Returns:
            CloseCommand: CDP command that closes the browser.
        """
        return Command(method=BrowserMethod.CLOSE)

    @staticmethod
    def crash() -> CrashCommand:
        """
        Build the command that crashes the browser on the main thread.

        Returns:
            CrashCommand: CDP command that crashes the browser.
        """
        return Command(method=BrowserMethod.CRASH)

    @staticmethod
    def crash_gpu_process() -> CrashGpuProcessCommand:
        """
        Build the command that crashes the GPU process.

        Returns:
            CrashGpuProcessCommand: CDP command that crashes the GPU process.
        """
        return Command(method=BrowserMethod.CRASH_GPU_PROCESS)

    # Convenience wrappers: each delegates to set_window_bounds() with a Bounds
    # value that carries only the desired window state.
    @staticmethod
    def set_window_maximized(window_id: WindowID) -> SetWindowBoundsCommand:
        """
        Build the command that maximizes a browser window.

        Args:
            window_id: Browser window id.

        Returns:
            SetWindowBoundsCommand: CDP command that maximizes the window.
        """
        return BrowserCommands.set_window_bounds(
            window_id,
            Bounds(windowState=WindowState.MAXIMIZED),
        )

    @staticmethod
    def set_window_minimized(window_id: WindowID) -> SetWindowBoundsCommand:
        """
        Build the command that minimizes a browser window.

        Args:
            window_id: Browser window id.

        Returns:
            SetWindowBoundsCommand: CDP command that minimizes the window.
        """
        return BrowserCommands.set_window_bounds(
            window_id,
            Bounds(windowState=WindowState.MINIMIZED),
        )

    @staticmethod
    def set_window_fullscreen(window_id: WindowID) -> SetWindowBoundsCommand:
        """
        Build the command that switches a browser window to fullscreen.

        Args:
            window_id: Browser window id.

        Returns:
            SetWindowBoundsCommand: CDP command that sets the window to fullscreen.
        """
        return BrowserCommands.set_window_bounds(
            window_id,
            Bounds(windowState=WindowState.FULLSCREEN),
        )

    @staticmethod
    def set_window_normal(window_id: WindowID) -> SetWindowBoundsCommand:
        """
        Build the command that returns a browser window to its normal state.

        Args:
            window_id: Browser window id.

        Returns:
            SetWindowBoundsCommand: CDP command that sets the window to normal state.
        """
        return BrowserCommands.set_window_bounds(
            window_id,
            Bounds(windowState=WindowState.NORMAL),
        )


================================================
FILE: pydoll/commands/dom_commands.py
================================================
from __future__ import annotations

from typing import TYPE_CHECKING, Optional

from pydoll.protocol.base import Command
from pydoll.protocol.dom.methods import (
    CollectClassNamesFromSubtreeParams,
    CopyToParams,
    DescribeNodeParams,
    DiscardSearchResultsParams,
    DomMethod,
    EnableParams,
    FocusParams,
    GetAnchorElementParams,
    GetAttributesParams,
    GetBoxModelParams,
    GetContainerForNodeParams,
    GetContentQuadsParams,
    GetDocumentParams,
    GetElementByRelationParams,
    GetFileInfoParams,
    GetFrameOwnerParams,
    GetNodeForLocationParams,
    GetNodesForSubtreeByStyleParams,
    GetNodeStackTracesParams,
    GetOuterHTMLParams,
    GetQueryingDescendantsForContainerParams,
    GetRelayoutBoundaryParams,
    GetSearchResultsParams,
    MoveToParams,
    PerformSearchParams,
    PushNodeByPathToFrontendParams,
    PushNodesByBackendIdsToFrontendParams,
    QuerySelectorAllParams,
    QuerySelectorParams,
    RemoveAttributeParams,
    RemoveNodeParams,
    RequestChildNodesParams,
    RequestNodeParams,
    ResolveNodeParams,
    ScrollIntoViewIfNeededParams,
    SetAttributesAsTextParams,
    SetAttributeValueParams,
    SetFileInputFilesParams,
    SetInspectedNodeParams,
    SetNodeNameParams,
    SetNodeStackTracesEnabledParams,
    SetNodeValueParams,
    SetOuterHTMLParams,
)

if TYPE_CHECKING:
    from pydoll.protocol.dom.methods import (
        CollectClassNamesFromSubtreeCommand,
        CopyToCommand,
        CSSComputedStyleProperty,
        DescribeNodeCommand,
        DisableCommand,
        DiscardSearchResultsCommand,
        EnableCommand,
        FocusCommand,
        GetAnchorElementCommand,
        GetAttributesCommand,
        GetBoxModelCommand,
        GetContainerForNodeCommand,
        GetContentQuadsCommand,
        GetDetachedDomNodesCommand,
        GetDocumentCommand,
        GetElementByRelationCommand,
        GetFileInfoCommand,
        GetFrameOwnerCommand,
        GetNodeForLocationCommand,
        GetNodesForSubtreeByStyleCommand,
        GetNodeStackTracesCommand,
        GetOuterHTMLCommand,
        GetQueryingDescendantsForContainerCommand,
        GetRelayoutBoundaryCommand,
        GetSearchResultsCommand,
        GetTopLayerElementsCommand,
        HideHighlightCommand,
        HighlightNodeCommand,
        HighlightRectCommand,
        MarkUndoableStateCommand,
        MoveToCommand,
        PerformSearchCommand,
        PushNodeByPathToFrontendCommand,
        PushNodesByBackendIdsToFrontendCommand,
        QuerySelectorAllCommand,
        QuerySelectorCommand,
        Rect,
        RedoCommand,
        RemoveAttributeCommand,
        RemoveNodeCommand,
        RequestChildNodesCommand,
        RequestNodeCommand,
        ResolveNodeCommand,
        ScrollIntoViewIfNeededCommand,
        SetAttributesAsTextCommand,
        SetAttributeValueCommand,
        SetFileInputFilesCommand,
        SetInspectedNodeCommand,
        SetNodeNameCommand,
        SetNodeStackTracesEnabledCommand,
        SetNodeValueCommand,
        SetOuterHTMLCommand,
        UndoCommand,
    )
    from pydoll.protocol.dom.types import (
        IncludeWhitespace,
        LogicalAxes,
        PhysicalAxes,
        RelationType,
    )


class DomCommands:
    """
    Implementation of Chrome DevTools Protocol for the DOM domain.

    This class provides commands for interacting with the Document Object Model (DOM) in the
    browser, enabling access and manipulation of the element structure in a web page.
    The DOM domain in Chrome DevTools Protocol exposes operations for reading and writing to the
    DOM, which is fundamental for browser automation, testing, and debugging.

    Each DOM element is represented by a mirror object with a unique ID. This ID can be used
    to gather additional information about the node, resolve it into JavaScript object wrappers,
    manipulate attributes, and perform various other operations on the DOM structure.
    """

    @staticmethod
    def describe_node(
        node_id: Optional[int] = None,
        backend_node_id: Optional[int] = None,
        object_id: Optional[str] = None,
        depth: Optional[int] = None,
        pierce: Optional[bool] = None,
    ) -> DescribeNodeCommand:
        """
        Describes a DOM node identified by its ID without requiring domain to be enabled.

        The describe_node command is particularly useful in scenarios where you need to quickly
        gather information about a specific element without subscribing to DOM change events,
        making it more lightweight for isolated element inspection operations.

        Only arguments that are explicitly provided (i.e. not None) are added to the
        command parameters; omitted ones are left for the browser to default.

        Args:
            node_id: Identifier of the node known to the client.
            backend_node_id: Identifier of the backend node used internally by the browser.
            object_id: JavaScript object id of the node wrapper.
            depth: Maximum depth at which children should be retrieved (default is 1).
                  Use -1 for the entire subtree or provide an integer greater than 0.
            pierce: Whether iframes and shadow roots should be traversed when returning
                   the subtree (default is false).

        Returns:
            Command: CDP command that returns detailed information about the requested node.
        """
        params = DescribeNodeParams()
        if node_id is not None:
            params['nodeId'] = node_id
        if backend_node_id is not None:
            params['backendNodeId'] = backend_node_id
        if object_id is not None:
            params['objectId'] = object_id
        # Test against None (not truthiness) like every other optional here, so an
        # explicitly supplied depth is always forwarded instead of being silently
        # replaced by the browser default when it happens to be falsy.
        if depth is not None:
            params['depth'] = depth
        if pierce is not None:
            params['pierce'] = pierce
        return Command(method=DomMethod.DESCRIBE_NODE, params=params)

    @staticmethod
    def disable() -> DisableCommand:
        """
        Builds the command that turns off the DOM agent for the current page.

        With the DOM domain disabled, the CDP stops sending DOM-related events and
        further DOM manipulation operations are prevented until the domain is enabled
        again. Issue it once DOM work is finished to minimize background processing.

        Returns:
            Command: CDP command to disable the DOM domain.
        """
        # The command carries no parameters, only the method name.
        command: DisableCommand = Command(method=DomMethod.DISABLE)
        return command

    @staticmethod
    def enable(include_whitespace: Optional['IncludeWhitespace'] = None) -> EnableCommand:
        """
        Builds the command that turns on the DOM agent for the current page.

        The DOM domain has to be enabled before DOM events (tree structure changes,
        attribute modifications, and others) are delivered and before most DOM
        manipulation methods can be used; otherwise many DOM operations would fail
        or provide incomplete information.

        Args:
            include_whitespace: Whether to include whitespace-only text nodes in the
                               children array of returned Nodes. Allowed values: "none", "all".
                               Left out of the command when not provided.

        Returns:
            Command: CDP command to enable the DOM domain.
        """
        options = EnableParams()
        if include_whitespace:
            options['includeWhitespace'] = include_whitespace
        return Command(method=DomMethod.ENABLE, params=options)

    @staticmethod
    def focus(
        node_id: Optional[int] = None,
        backend_node_id: Optional[int] = None,
        object_id: Optional[str] = None,
    ) -> FocusCommand:
        """
        Focuses the given element.

        The focus command is crucial for simulating realistic user interactions, as many
        events (like keyboard input) require that an element has focus first. It's also
        important for testing proper tab order and keyboard accessibility of web pages.

        Only identifiers that are explicitly provided (i.e. not None) are added to the
        command parameters.

        Args:
            node_id: Identifier of the node to focus.
            backend_node_id: Identifier of the backend node to focus.
            object_id: JavaScript object id of the node wrapper.

        Returns:
            Command: CDP command to focus on the specified element.
        """
        params = FocusParams()
        # Use explicit None checks, as the other node-targeting builders in this
        # class do, so a caller-supplied identifier is never silently discarded
        # just because it is falsy (0 or an empty string).
        if node_id is not None:
            params['nodeId'] = node_id
        if backend_node_id is not None:
            params['backendNodeId'] = backend_node_id
        if object_id is not None:
            params['objectId'] = object_id
        return Command(method=DomMethod.FOCUS, params=params)

    @staticmethod
    def get_attributes(node_id: int) -> GetAttributesCommand:
        """
        Builds the command that fetches the attributes of a node.

        Attributes often hold crucial information about element state, behavior, and
        metadata. This command reads all of them for one element without parsing HTML
        or evaluating JavaScript.

        Args:
            node_id: Id of the node to retrieve attributes for.

        Returns:
            Command: CDP command that returns an interleaved array of node attribute
                    names and values [name1, value1, name2, value2, ...].
        """
        return Command(
            method=DomMethod.GET_ATTRIBUTES,
            params=GetAttributesParams(nodeId=node_id),
        )

    @staticmethod
    def get_box_model(
        node_id: Optional[int] = None,
        backend_node_id: Optional[int] = None,
        object_id: Optional[str] = None,
    ) -> GetBoxModelCommand:
        """
        Builds the command that retrieves box model information for a node.

        The box model describes how an element is rendered with content, padding,
        borders, and margins. The resulting dimensions and coordinates are useful for
        spatial analysis and precise interactions with elements on the page.

        Each identifier is included in the command only when it is not None.

        Args:
            node_id: Identifier of the node.
            backend_node_id: Identifier of the backend node.
            object_id: JavaScript object id of the node wrapper.

        Returns:
            Command: CDP command that returns the box model for the node, including
                    coordinates for content, padding, border, and margin boxes.
        """
        target = GetBoxModelParams()
        if node_id is not None:
            target['nodeId'] = node_id
        if backend_node_id is not None:
            target['backendNodeId'] = backend_node_id
        if object_id is not None:
            target['objectId'] = object_id
        return Command(method=DomMethod.GET_BOX_MODEL, params=target)

    @staticmethod
    def get_document(
        depth: Optional[int] = None, pierce: Optional[bool] = None
    ) -> GetDocumentCommand:
        """
        Builds the command that returns the root DOM node (and optionally its subtree).

        Usually the first command issued when working with the DOM: the root node it
        returns is the starting point for reaching any other element on the page. It
        also implicitly enables DOM domain events for the current target.

        Args:
            depth: Maximum depth at which children should be retrieved (default is 1).
                  Use -1 for the entire subtree or provide an integer greater than 0.
            pierce: Whether iframes and shadow roots should be traversed when returning
                  the subtree (default is false).

        Returns:
            Command: CDP command that returns the root DOM node.
        """
        options = GetDocumentParams()
        # Omitted arguments are left out so the browser applies its own defaults.
        if depth is not None:
            options['depth'] = depth
        if pierce is not None:
            options['pierce'] = pierce
        return Command(method=DomMethod.GET_DOCUMENT, params=options)

    @staticmethod
    def get_node_for_location(
        x: int,
        y: int,
        include_user_agent_shadow_dom: Optional[bool] = None,
        ignore_pointer_events_none: Optional[bool] = None,
    ) -> GetNodeForLocationCommand:
        """
        Builds the command that looks up the node located at a point on the page.

        It converts screen coordinates into actual DOM elements, bridging pixel-based
        information and the DOM structure. That is useful for inspection tools and for
        testing spatially-oriented interactions.

        Args:
            x: X coordinate relative to the main frame's viewport.
            y: Y coordinate relative to the main frame's viewport.
            include_user_agent_shadow_dom: Whether to include nodes in user agent shadow roots.
            ignore_pointer_events_none: Whether to ignore pointer-events:none and test elements
                                       underneath them.

        Returns:
            Command: CDP command that returns the node at the given location, including
                   frame information when available.
        """
        query = GetNodeForLocationParams(x=x, y=y)
        # The two flags are optional and only sent when the caller set them.
        if include_user_agent_shadow_dom is not None:
            query['includeUserAgentShadowDOM'] = include_user_agent_shadow_dom
        if ignore_pointer_events_none is not None:
            query['ignorePointerEventsNone'] = ignore_pointer_events_none
        return Command(method=DomMethod.GET_NODE_FOR_LOCATION, params=query)

    @staticmethod
    def get_outer_html(
        node_id: Optional[int] = None,
        backend_node_id: Optional[int] = None,
        object_id: Optional[str] = None,
    ) -> GetOuterHTMLCommand:
        """
        Builds the command that returns a node's HTML markup, children included.

        The markup covers the node itself and all of its children, preserving tags,
        attributes, and child elements. Use it to extract, analyze, or verify HTML
        content when plain text content is not enough.

        Each identifier is included in the command only when it is not None.

        Args:
            node_id: Identifier of the node.
            backend_node_id: Identifier of the backend node.
            object_id: JavaScript object id of the node wrapper.

        Returns:
            Command: CDP command that returns the outer HTML markup of the node.
        """
        target = GetOuterHTMLParams()
        if node_id is not None:
            target['nodeId'] = node_id
        if backend_node_id is not None:
            target['backendNodeId'] = backend_node_id
        if object_id is not None:
            target['objectId'] = object_id
        return Command(method=DomMethod.GET_OUTER_HTML, params=target)

    @staticmethod
    def hide_highlight() -> HideHighlightCommand:
        """
        Builds the command that hides any DOM element highlight.

        Handy in automation workflows that highlight several elements in sequence:
        clearing the previous highlight before moving on avoids visual clutter or
        interference.

        Returns:
            Command: CDP command to hide DOM element highlights.
        """
        # The command carries no parameters, only the method name.
        command: HideHighlightCommand = Command(method=DomMethod.HIDE_HIGHLIGHT)
        return command

    @staticmethod
    def highlight_node() -> HighlightNodeCommand:
        """
        Builds the command that highlights a DOM node.

        Useful during development and debugging sessions to visually confirm which
        elements are being selected by selectors or coordinates.

        Returns:
            Command: CDP command to highlight a DOM node.
        """
        # This builder attaches no parameters; only the method name is sent.
        command: HighlightNodeCommand = Command(method=DomMethod.HIGHLIGHT_NODE)
        return command

    @staticmethod
    def highlight_rect() -> HighlightRectCommand:
        """
        Builds the command that highlights a given rectangle.

        In contrast to node highlighting, a rectangle can cover an arbitrary region
        of the page, which suits computed areas or regions that don't correspond
        directly to DOM elements.

        Returns:
            Command: CDP command to highlight a rectangular area.
        """
        # This builder attaches no parameters; only the method name is sent.
        command: HighlightRectCommand = Command(method=DomMethod.HIGHLIGHT_RECT)
        return command

    @staticmethod
    def move_to(
        node_id: int,
        target_node_id: int,
        insert_before_node_id: Optional[int] = None,
    ) -> MoveToCommand:
        """
        Builds the command that moves a node into a new container before an anchor.

        This enables DOM restructuring beyond simple attribute or content changes and
        is handy when testing interfaces that rearrange elements, such as sortable
        lists, kanban boards, or drag-and-drop interfaces.

        Args:
            node_id: Id of the node to move.
            target_node_id: Id of the element to drop the moved node into.
            insert_before_node_id: Drop node before this one (if absent, the moved node
                                 becomes the last child of target_node_id).

        Returns:
            Command: CDP command to move a node, returning the new id of the moved node.
        """
        if insert_before_node_id is None:
            # No anchor requested: send only the two mandatory ids.
            placement = MoveToParams(nodeId=node_id, targetNodeId=target_node_id)
        else:
            placement = MoveToParams(
                nodeId=node_id,
                targetNodeId=target_node_id,
                insertBeforeNodeId=insert_before_node_id,
            )
        return Command(method=DomMethod.MOVE_TO, params=placement)

    @staticmethod
    def query_selector(
        node_id: int,
        selector: str,
    ) -> QuerySelectorCommand:
        """
        Builds the command that runs querySelector on a given node.

        A fundamental tool for locating elements with standard CSS selectors. The
        query can be executed on any node (not just the document), enabling searches
        scoped to a specific section of the page.

        Args:
            node_id: Id of the node to query upon.
            selector: CSS selector string.

        Returns:
            Command: CDP command that returns the first element matching the selector.
        """
        return Command(
            method=DomMethod.QUERY_SELECTOR,
            params=QuerySelectorParams(nodeId=node_id, selector=selector),
        )

    @staticmethod
    def query_selector_all(
        node_id: int,
        selector: str,
    ) -> QuerySelectorAllCommand:
        """
        Builds the command that runs querySelectorAll on a given node.

        Unlike querySelector, every matching element is returned rather than only
        the first. This suits work that processes multiple elements, such as
        extracting data from tables, lists, or grids, or checking element counts.

        Args:
            node_id: Id of the node to query upon.
            selector: CSS selector string.

        Returns:
            Command: CDP command that returns all elements matching the selector.
        """
        return Command(
            method=DomMethod.QUERY_SELECTOR_ALL,
            params=QuerySelectorAllParams(nodeId=node_id, selector=selector),
        )

    @staticmethod
    def remove_attribute(
        node_id: int,
        name: str,
    ) -> RemoveAttributeCommand:
        """
        Builds the command that removes a named attribute from an element.

        The attribute is manipulated directly, without running JavaScript in the page
        context. Useful for testing how elements behave once a specific attribute is
        gone, or for preparing elements for specific test conditions.

        Args:
            node_id: Id of the element to remove attribute from.
            name: Name of the attribute to remove.

        Returns:
            Command: CDP command to remove the specified attribute.
        """
        return Command(
            method=DomMethod.REMOVE_ATTRIBUTE,
            params=RemoveAttributeParams(nodeId=node_id, name=name),
        )

    @staticmethod
    def remove_node(node_id: int) -> RemoveNodeCommand:
        """
        Builds the command that removes the node with the given id.

        Removing DOM elements directly helps when testing how an application
        responds to missing elements, or when simplifying a page for focused
        testing scenarios.

        Args:
            node_id: Id of the node to remove.

        Returns:
            Command: CDP command to remove the specified node.
        """
        return Command(
            method=DomMethod.REMOVE_NODE,
            params=RemoveNodeParams(nodeId=node_id),
        )

    @staticmethod
    def request_child_nodes(
        node_id: int,
        depth: Optional[int] = None,
        pierce: Optional[bool] = None,
    ) -> RequestChildNodesCommand:
        """
        Builds the command that requests the children of a node.

        Children are loaded on demand instead of fetching the whole tree at once,
        which makes exploring large DOM trees more efficient. The child nodes are
        returned as setChildNodes events.

        Args:
            node_id: Id of the node to get children for.
            depth: The maximum depth at which children should be retrieved,
                  defaults to 1. Use -1 for the entire subtree.
            pierce: Whether or not iframes and shadow roots should be traversed.

        Returns:
            Command: CDP command to request child nodes.
        """
        request = RequestChildNodesParams(nodeId=node_id)
        # Optional settings are only sent when the caller provided them.
        if depth is not None:
            request['depth'] = depth
        if pierce is not None:
            request['pierce'] = pierce
        return Command(method=DomMethod.REQUEST_CHILD_NODES, params=request)

    @staticmethod
    def request_node(
        object_id: str,
    ) -> RequestNodeCommand:
        """
        Builds the command that requests a node from a JavaScript object reference.

        It connects JavaScript objects in the page context with the CDP's node
        representation, so automation can work with elements that are only available
        as JavaScript references (e.g., from event handlers).

        Args:
            object_id: JavaScript object id to convert into a Node.

        Returns:
            Command: CDP command that returns the Node id for the given object.
        """
        return Command(
            method=DomMethod.REQUEST_NODE,
            params=RequestNodeParams(objectId=object_id),
        )

    @staticmethod
    def resolve_node(
        node_id: Optional[int] = None,
        backend_node_id: Optional[int] = None,
        object_group: Optional[str] = None,
        execution_context_id: Optional[int] = None,
    ) -> ResolveNodeCommand:
        """
        Builds the command that resolves a node into its JavaScript object.

        This is the counterpart of requestNode: it starts from a CDP node (NodeId or
        BackendNodeId) and yields a JavaScript object, which makes it possible to run
        JavaScript operations on nodes identified through CDP.

        Each argument is included in the command only when it is not None.

        Args:
            node_id: Id of the node to resolve.
            backend_node_id: Backend id of the node to resolve.
            object_group: Symbolic group name that can be used to release multiple objects.
            execution_context_id: Execution context in which to resolve the node.

        Returns:
            Command: CDP command that returns a JavaScript object wrapper for the node.
        """
        resolution = ResolveNodeParams()
        if node_id is not None:
            resolution['nodeId'] = node_id
        if backend_node_id is not None:
            resolution['backendNodeId'] = backend_node_id
        if object_group is not None:
            resolution['objectGroup'] = object_group
        if execution_context_id is not None:
            resolution['executionContextId'] = execution_context_id
        return Command(method=DomMethod.RESOLVE_NODE, params=resolution)

    @staticmethod
    def scroll_into_view_if_needed(
        node_id: Optional[int] = None,
        backend_node_id: Optional[int] = None,
        object_id: Optional[str] = None,
        rect: Optional[Rect] = None,
    ) -> ScrollIntoViewIfNeededCommand:
        """
        Builds the command that scrolls a node into view if it is not already visible.

        Making sure an element is inside the viewport before interacting with it is
        key to reliable automation, particularly on pages with lazy loading or long
        scrollable areas where elements may not be initially visible.

        Each argument is included in the command only when it is not None.

        Args:
            node_id: Identifier of the node.
            backend_node_id: Identifier of the backend node.
            object_id: JavaScript object id of the node wrapper.
            rect: Optional rect to scroll into view, relative to the node bounds.

        Returns:
            Command: CDP command to scroll the element into view.
        """
        scroll_target = ScrollIntoViewIfNeededParams()
        if node_id is not None:
            scroll_target['nodeId'] = node_id
        if backend_node_id is not None:
            scroll_target['backendNodeId'] = backend_node_id
        if object_id is not None:
            scroll_target['objectId'] = object_id
        if rect is not None:
            scroll_target['rect'] = rect
        return Command(method=DomMethod.SCROLL_INTO_VIEW_IF_NEEDED, params=scroll_target)

    @staticmethod
    def set_attributes_as_text(
        node_id: int,
        text: str,
        name: Optional[str] = None,
    ) -> SetAttributesAsTextCommand:
        """
        Builds the command that sets an element's attribute from its text representation.

        Compared with set_attribute_value, the text form can potentially define
        multiple attributes or include special formatting, which helps when
        replicating exactly how attributes would be written in HTML source code.

        Args:
            node_id: Id of the element to set attribute for.
            text: Text with a new attribute value.
            name: Attribute name to replace with new text value.

        Returns:
            Command: CDP command to set an attribute as text.
        """
        if name is None:
            # No attribute to replace: send only the element id and the text.
            attributes = SetAttributesAsTextParams(nodeId=node_id, text=text)
        else:
            attributes = SetAttributesAsTextParams(nodeId=node_id, text=text, name=name)
        return Command(method=DomMethod.SET_ATTRIBUTES_AS_TEXT, params=attributes)

    @staticmethod
    def set_attribute_value(
        node_id: int,
        name: str,
        value: str,
    ) -> SetAttributeValueCommand:
        """
        Builds the command that sets an attribute on the element with the given id.

        The attribute is controlled directly, without JavaScript. Useful for testing
        how applications respond to attribute changes or for setting up specific
        test conditions.

        Args:
            node_id: Id of the element to set attribute for.
            name: Attribute name.
            value: Attribute value.

        Returns:
            Command: CDP command to set an attribute value.
        """
        return Command(
            method=DomMethod.SET_ATTRIBUTE_VALUE,
            params=SetAttributeValueParams(nodeId=node_id, name=name, value=value),
        )

    @staticmethod
    def set_file_input_files(
        files: list[str],
        node_id: Optional[int] = None,
        backend_node_id: Optional[int] = None,
        object_id: Optional[str] = None,
    ) -> SetFileInputFilesCommand:
        """
        Builds the command that sets the files of a file input element.

        Files are supplied programmatically, bypassing the OS-level file dialog that
        normally appears when a file input is clicked. This lets automated tests work
        with file inputs.

        Each identifier is included in the command only when it is not None.

        Args:
            files: list of file paths to set.
            node_id: Identifier of the node.
            backend_node_id: Identifier of the backend node.
            object_id: JavaScript object id of the node wrapper.

        Returns:
            Command: CDP command to set files for a file input element.
        """
        upload = SetFileInputFilesParams(files=files)
        if node_id is not None:
            upload['nodeId'] = node_id
        if backend_node_id is not None:
            upload['backendNodeId'] = backend_node_id
        if object_id is not None:
            upload['objectId'] = object_id
        return Command(method=DomMethod.SET_FILE_INPUT_FILES, params=upload)

    @staticmethod
    def set_node_name(
        node_id: int,
        name: str,
    ) -> SetNodeNameCommand:
        """
        Builds the command that sets the node name of the node with the given id.

        Changing the actual tag name of an element is useful for testing how
        applications handle different types of elements, or how semantic HTML
        choices affect accessibility and behavior.

        Args:
            node_id: Id of the node to set name for.
            name: New node name.

        Returns:
            Command: CDP command that returns the new node id after the name change.
        """
        return Command(
            method=DomMethod.SET_NODE_NAME,
            params=SetNodeNameParams(nodeId=node_id, name=name),
        )

    @staticmethod
    def set_node_value(
        node_id: int,
        value: str,
    ) -> SetNodeValueCommand:
        """
        Builds the command that sets the node value of the node with the given id.

        Particularly useful for updating the content of text nodes and comments:
        the text changes while the surrounding HTML structure stays untouched.

        Args:
            node_id: Id of the node to set value for.
            value: New node value.

        Returns:
            Command: CDP command to set a node's value.
        """
        return Command(
            method=DomMethod.SET_NODE_VALUE,
            params=SetNodeValueParams(nodeId=node_id, value=value),
        )

    @staticmethod
    def set_outer_html(
        node_id: int,
        outer_html: str,
    ) -> SetOuterHTMLCommand:
        """
        Builds the command that replaces a node's HTML markup.

        The element and all of its children are replaced with the new HTML. This
        allows major structural changes to the page and helps when testing how
        applications handle dynamically inserted content.

        Args:
            node_id: Id of the node to set outer HTML for.
            outer_html: HTML markup to set.

        Returns:
            Command: CDP command to set the outer HTML of a node.
        """
        return Command(
            method=DomMethod.SET_OUTER_HTML,
            params=SetOuterHTMLParams(nodeId=node_id, outerHTML=outer_html),
        )

    @staticmethod
    def collect_class_names_from_subtree(
        node_id: int,
    ) -> CollectClassNamesFromSubtreeCommand:
        """
        Builds the command that collects class names for a node and all of its children.

        Helps in understanding how a page is styled, especially in complex
        applications where several CSS frameworks may be in use or classes are
        applied dynamically.

        Args:
            node_id: Id of the node to collect class names for.

        Returns:
            Command: CDP command that returns a list of all unique class names in the subtree.
        """
        return Command(
            method=DomMethod.COLLECT_CLASS_NAMES_FROM_SUBTREE,
            params=CollectClassNamesFromSubtreeParams(nodeId=node_id),
        )

    @staticmethod
    def copy_to(
        node_id: int,
        target_node_id: int,
        insert_before_node_id: Optional[int] = None,
    ) -> CopyToCommand:
        """
        Builds the command that deep-copies a node into a target container.

        In contrast to move_to, the original node is left intact and a copy is
        created. Use it to duplicate content, for example when testing how multiple
        instances of the same component behave.

        Args:
            node_id: Id of the node to copy.
            target_node_id: Id of the element to drop the copy into.
            insert_before_node_id: Drop the copy before this node (if absent, the copy becomes
                                 the last child of target_node_id).

        Returns:
            Command: CDP command that returns the id of the new copy.
        """
        if insert_before_node_id is None:
            # No anchor requested: send only the two mandatory ids.
            placement = CopyToParams(nodeId=node_id, targetNodeId=target_node_id)
        else:
            placement = CopyToParams(
                nodeId=node_id,
                targetNodeId=target_node_id,
                insertBeforeNodeId=insert_before_node_id,
            )
        return Command(method=DomMethod.COPY_TO, params=placement)

    @staticmethod
    def discard_search_results(
        search_id: str,
    ) -> DiscardSearchResultsCommand:
        """
        Builds the command that discards the search results of a given session.

        Lets a caller running multiple searches in one session explicitly clean up
        search results that are no longer needed.

        Args:
            search_id: Unique search session identifier.

        Returns:
            Command: CDP command to discard search results.
        """
        return Command(
            method=DomMethod.DISCARD_SEARCH_RESULTS,
            params=DiscardSearchResultsParams(searchId=search_id),
        )

    @staticmethod
    def get_anchor_element(
        node_id: int,
        anchor_specifier: Optional[str] = None,
    ) -> GetAnchorElementCommand:
        """
        Returns the target anchor element of the given anchor query.

        "Anchor" here refers to CSS Anchor Positioning (the element a positioned
        element is tethered to), not to an HTML ``<a>`` link. The command resolves
        which element acts as the anchor for the positioned element identified by
        node_id, as described by the CDP DOM.getAnchorElement method.

        Args:
            node_id: Id of the positioned element from which to find the anchor.
            anchor_specifier: Optional anchor specifier, as defined by the CSS Anchor
                             Positioning specification. If not provided, the implicit
                             anchor element of the positioned element is returned.

        Returns:
            Command: CDP command that returns the node id of the anchor element.
        """
        params = GetAnchorElementParams(nodeId=node_id)
        # The specifier is optional; omit it so the browser resolves the implicit anchor.
        if anchor_specifier is not None:
            params['anchorSpecifier'] = anchor_specifier
        return Command(method=DomMethod.GET_ANCHOR_ELEMENT, params=params)

    @staticmethod
    def get_container_for_node(
        node_id: int,
        container_name: Optional[str] = None,
        physical_axes: Optional['PhysicalAxes'] = None,
        logical_axes: Optional['LogicalAxes'] = None,
        queries_scroll_state: Optional[bool] = None,
    ) -> GetContainerForNodeCommand:
        """
        Returns the query container of the given node based on container query conditions.

        This targets CSS container queries: the conditions are the container name,
        the physical and logical axes, and whether scroll-state is queried. Per the
        CDP DOM.getContainerForNode method, if no axes are provided and
        queries_scroll_state is false, the style container is returned, which is the
        direct parent or the closest element with a matching container-name.

        Each optional condition is included in the command only when it is not None.

        Args:
            node_id: Id of the node to find the container for.
            container_name: CSS container-name the query container must match.
            physical_axes: Physical axes to consider (Horizontal, Vertical, Both).
            logical_axes: Logical axes to consider (Inline, Block, Both).
            queries_scroll_state: Whether the container query is a scroll-state query.

        Returns:
            Command: CDP command that returns the container node for the given node,
                    if one is found.
        """
        params = GetContainerForNodeParams(nodeId=node_id)
        if container_name is not None:
            params['containerName'] = container_name
        if physical_axes is not None:
            params['physicalAxes'] = physical_axes
        if logical_axes is not None:
            params['logicalAxes'] = logical_axes
        if queries_scroll_state is not None:
            params['queriesScrollState'] = queries_scroll_state
        return Command(method=DomMethod.GET_CONTAINER_FOR_NODE, params=params)

    @staticmethod
    def get_content_quads(
        node_id: Optional[int] = None,
        backend_node_id: Optional[int] = None,
        object_id: Optional[str] = None,
    ) -> GetContentQuadsCommand:
        """
        Builds the DOM.getContentQuads command.

        The command asks for the quads that describe a node's position on the
        page. The node can be referenced by any of the three identifiers below;
        each one is only included in the params when it is not None, so calling
        this with no arguments produces empty params.

        Args:
            node_id: Identifier of the node.
            backend_node_id: Identifier of the backend node.
            object_id: JavaScript object id of the node wrapper.

        Returns:
            Command: CDP command that returns the quads describing the node position.
        """
        quads_params = GetContentQuadsParams()
        if node_id is not None:
            quads_params['nodeId'] = node_id
        if backend_node_id is not None:
            quads_params['backendNodeId'] = backend_node_id
        if object_id is not None:
            quads_params['objectId'] = object_id
        return Command(
            method=DomMethod.GET_CONTENT_QUADS,
            params=quads_params,
        )

    @staticmethod
    def get_detached_dom_nodes() -> GetDetachedDomNodesCommand:
        """
        Builds the DOM.getDetachedDomNodes command.

        The command takes no parameters and requests information about DOM
        nodes that are detached from the document tree, which is typically of
        interest when investigating DOM-related memory leaks.

        Returns:
            Command: CDP command that returns information about detached DOM nodes.
        """
        return Command(
            method=DomMethod.GET_DETACHED_DOM_NODES,
        )

    @staticmethod
    def get_element_by_relation(
        node_id: int,
        relation: RelationType,
    ) -> GetElementByRelationCommand:
        """
        Builds the DOM.getElementByRelation command.

        Per the CDP documentation, the command returns the node id of the element
        matched by a protocol-defined relation to the given node (for example its
        popover target). It does not perform sibling or child tree navigation.

        Args:
            node_id: Id of the node from which to query the relation.
            relation: Relation to resolve; must be one of the RelationType values.

        Returns:
            Command: CDP command that returns the related element's node id.
        """
        return Command(
            method=DomMethod.GET_ELEMENT_BY_RELATION,
            params=GetElementByRelationParams(nodeId=node_id, relation=relation),
        )

    @staticmethod
    def get_file_info(
        object_id: str,
    ) -> GetFileInfoCommand:
        """
        Builds the DOM.getFileInfo command.

        Per the CDP documentation, the command returns file information for the
        given File wrapper; the response exposes the file's path (it is not a
        source of size or MIME type metadata).

        Args:
            object_id: JavaScript object id of the File object to get info for.

        Returns:
            Command: CDP command that returns the file's path.
        """
        return Command(
            method=DomMethod.GET_FILE_INFO,
            params=GetFileInfoParams(objectId=object_id),
        )

    @staticmethod
    def get_frame_owner(
        frame_id: str,
    ) -> GetFrameOwnerCommand:
        """
        Builds the DOM.getFrameOwner command.

        The command asks for the iframe element that owns the frame with the
        given id, which lets callers go from a CDP frame id to the element
        hosting that frame in the parent document.

        Args:
            frame_id: Id of the frame to get the owner element for.

        Returns:
            Command: CDP command that returns the frame owner element.
        """
        return Command(
            method=DomMethod.GET_FRAME_OWNER,
            params=GetFrameOwnerParams(frameId=frame_id),
        )

    @staticmethod
    def get_nodes_for_subtree_by_style(
        node_id: int,
        computed_styles: list[CSSComputedStyleProperty],
        pierce: Optional[bool] = None,
    ) -> GetNodesForSubtreeByStyleCommand:
        """
        Builds the DOM.getNodesForSubtreeByStyle command.

        The command searches the subtree rooted at the given node for nodes whose
        computed style matches the supplied properties. The `pierce` flag is only
        included in the params when it is not None.

        Args:
            node_id: Node to start the search from.
            computed_styles: list of computed style properties to match against.
            pierce: Whether or not iframes and shadow roots should be traversed.

        Returns:
            Command: CDP command that returns nodes matching the specified styles.
        """
        style_params = GetNodesForSubtreeByStyleParams(
            nodeId=node_id,
            computedStyles=computed_styles,
        )
        if pierce is not None:
            style_params['pierce'] = pierce
        return Command(
            method=DomMethod.GET_NODES_FOR_SUBTREE_BY_STYLE,
            params=style_params,
        )

    @staticmethod
    def get_node_stack_traces(
        node_id: int,
    ) -> GetNodeStackTracesCommand:
        """
        Builds the DOM.getNodeStackTraces command.

        The command requests the stack traces associated with a specific node,
        which helps relate a DOM node back to the JavaScript that produced it.

        Args:
            node_id: Id of the node to get stack traces for.

        Returns:
            Command: CDP command that returns stack traces related to the node.
        """
        return Command(
            method=DomMethod.GET_NODE_STACK_TRACES,
            params=GetNodeStackTracesParams(nodeId=node_id),
        )

    @staticmethod
    def get_querying_descendants_for_container(
        node_id: int,
    ) -> GetQueryingDescendantsForContainerCommand:
        """
        Builds the DOM.getQueryingDescendantsForContainer command.

        The command relates to CSS Container Queries: it asks which descendants
        of the given container node are querying that container.

        Args:
            node_id: Id of the container node to find querying descendants for.

        Returns:
            Command: CDP command that returns querying descendant information.
        """
        return Command(
            method=DomMethod.GET_QUERYING_DESCENDANTS_FOR_CONTAINER,
            params=GetQueryingDescendantsForContainerParams(nodeId=node_id),
        )

    @staticmethod
    def get_relayout_boundary(
        node_id: int,
    ) -> GetRelayoutBoundaryCommand:
        """
        Builds the DOM.getRelayoutBoundary command.

        The command asks for the root of the relayout boundary of the given
        node, i.e. the node that bounds layout recalculation for it.

        Args:
            node_id: Id of the node to find relayout boundary for.

        Returns:
            Command: CDP command that returns the relayout boundary node.
        """
        return Command(
            method=DomMethod.GET_RELAYOUT_BOUNDARY,
            params=GetRelayoutBoundaryParams(nodeId=node_id),
        )

    @staticmethod
    def get_search_results(
        search_id: str,
        from_index: int,
        to_index: int,
    ) -> GetSearchResultsCommand:
        """
        Builds the DOM.getSearchResults command.

        The command fetches a slice of the results of an earlier performSearch
        call, from `fromIndex` to `toIndex`, so large result sets can be read
        in batches.

        Args:
            search_id: Unique search session identifier from performSearch.
            from_index: Start index to retrieve results from.
            to_index: End index to retrieve results to (exclusive).

        Returns:
            Command: CDP command that returns the requested search results.
        """
        return Command(
            method=DomMethod.GET_SEARCH_RESULTS,
            params=GetSearchResultsParams(
                searchId=search_id,
                fromIndex=from_index,
                toIndex=to_index,
            ),
        )

    @staticmethod
    def get_top_layer_elements() -> GetTopLayerElementsCommand:
        """
        Builds the DOM.getTopLayerElements command.

        The command takes no parameters and requests all elements currently in
        the document's top layer (the layer used by overlays such as modals).

        Returns:
            Command: CDP command that returns the top layer element information.
        """
        return Command(
            method=DomMethod.GET_TOP_LAYER_ELEMENTS,
        )

    @staticmethod
    def mark_undoable_state() -> MarkUndoableStateCommand:
        """
        Builds the DOM.markUndoableState command.

        The command takes no parameters and marks the last undoable state, so a
        sequence of DOM changes can later be reverted with the undo command.

        Returns:
            Command: CDP command to mark the current state as undoable.
        """
        return Command(
            method=DomMethod.MARK_UNDOABLE_STATE,
        )

    @staticmethod
    def perform_search(
        query: str,
        include_user_agent_shadow_dom: Optional[bool] = None,
    ) -> PerformSearchCommand:
        """
        Builds the DOM.performSearch command.

        The command searches the DOM tree for the given string, which may be
        plain text, a query selector or an XPath expression. The shadow-DOM flag
        is only included in the params when it is not None.

        Args:
            query: Plain text or query selector or XPath search query.
            include_user_agent_shadow_dom: True to include user agent shadow DOM in the search.

        Returns:
            Command: CDP command that returns search results identifier and count.
        """
        search_params = PerformSearchParams(query=query)
        if include_user_agent_shadow_dom is not None:
            search_params['includeUserAgentShadowDOM'] = include_user_agent_shadow_dom
        return Command(
            method=DomMethod.PERFORM_SEARCH,
            params=search_params,
        )

    @staticmethod
    def push_node_by_path_to_frontend(
        path: str,
    ) -> PushNodeByPathToFrontendCommand:
        """
        Builds the DOM.pushNodeByPathToFrontend command.

        The command requests that the node identified by the given path is sent
        to the caller, as an alternative to referencing it by node id.

        Args:
            path: Path to node in the proprietary format.

        Returns:
            Command: CDP command that returns the node id for the node.
        """
        return Command(
            method=DomMethod.PUSH_NODE_BY_PATH_TO_FRONTEND,
            params=PushNodeByPathToFrontendParams(path=path),
        )

    @staticmethod
    def push_nodes_by_backend_ids_to_frontend(
        backend_node_ids: list[int],
    ) -> PushNodesByBackendIdsToFrontendCommand:
        """
        Builds the DOM.pushNodesByBackendIdsToFrontend command.

        The command requests that a batch of nodes, referenced by their backend
        node ids, is sent to the caller in a single call.

        Args:
            backend_node_ids: The array of backend node ids.

        Returns:
            Command: CDP command that returns an array of node ids.
        """
        return Command(
            method=DomMethod.PUSH_NODES_BY_BACKEND_IDS_TO_FRONTEND,
            params=PushNodesByBackendIdsToFrontendParams(backendNodeIds=backend_node_ids),
        )

    @staticmethod
    def redo() -> RedoCommand:
        """
        Builds the DOM.redo command.

        The command takes no parameters and re-applies the last undone action.
        It is the counterpart of undo and is used together with
        markUndoableState to step through a sequence of DOM changes.

        Returns:
            Command: CDP command to redo the last undone action.
        """
        return Command(
            method=DomMethod.REDO,
        )

    @staticmethod
    def set_inspected_node(
        node_id: int,
    ) -> SetInspectedNodeCommand:
        """
        Builds the DOM.setInspectedNode command.

        The command lets the console refer to the node with the given id via
        the $x command line API, which is handy when mixing scripted and manual
        debugging.

        Args:
            node_id: DOM node id to be accessible by means of $x command line API.

        Returns:
            Command: CDP command to set the inspected node.
        """
        return Command(
            method=DomMethod.SET_INSPECTED_NODE,
            params=SetInspectedNodeParams(nodeId=node_id),
        )

    @staticmethod
    def set_node_stack_traces_enabled(
        enable: bool,
    ) -> SetNodeStackTracesEnabledCommand:
        """
        Builds the DOM.setNodeStackTracesEnabled command.

        The command switches the capture of stack traces for Nodes on or off;
        captured traces can then be used to see where a node came from.

        Args:
            enable: Enable or disable stack trace collection.

        Returns:
            Command: CDP command to enable or disable node stack traces.
        """
        return Command(
            method=DomMethod.SET_NODE_STACK_TRACES_ENABLED,
            params=SetNodeStackTracesEnabledParams(enable=enable),
        )

    @staticmethod
    def undo() -> UndoCommand:
        """
        Builds the DOM.undo command.

        The command takes no parameters and reverts the last performed action.
        It is the counterpart of redo and is used together with
        markUndoableState to control a sequence of DOM changes.

        Returns:
            Command: CDP command to undo the last performed action.
        """
        return Command(
            method=DomMethod.UNDO,
        )


================================================
FILE: pydoll/commands/emulation_commands.py
================================================
from __future__ import annotations

from typing import TYPE_CHECKING, Optional

from pydoll.protocol.base import Command
from pydoll.protocol.emulation.methods import (
    EmulationMethod,
    SetUserAgentOverrideParams,
)

if TYPE_CHECKING:
    from pydoll.protocol.emulation.methods import SetUserAgentOverrideCommand
    from pydoll.protocol.emulation.types import UserAgentMetadata


class EmulationCommands:
    """
    Command builders for the Emulation domain of the Chrome DevTools Protocol.

    The Emulation domain is used to make the browser present itself as a
    different environment. This class currently exposes the User-Agent
    override; each method is a static factory that only assembles a command.

    See https://chromedevtools.github.io/devtools-protocol/tot/Emulation/
    """

    @staticmethod
    def set_user_agent_override(
        user_agent: str,
        accept_language: Optional[str] = None,
        platform: Optional[str] = None,
        user_agent_metadata: Optional[UserAgentMetadata] = None,
    ) -> SetUserAgentOverrideCommand:
        """
        Builds the Emulation.setUserAgentOverride command.

        The override applies to the User-Agent HTTP header as well as to the
        matching navigator JavaScript properties, keeping both layers in sync.
        Supplying userAgentMetadata additionally keeps the Client Hint headers
        (Sec-CH-UA-*) consistent with the overridden User-Agent.

        Only userAgent is always sent; each optional argument left as None is
        omitted from the params.

        Args:
            user_agent: Complete User-Agent string to use.
            accept_language: Browser language preference (e.g., 'en-US,en;q=0.9').
            platform: Value for navigator.platform (e.g., 'Win32', 'MacIntel').
            user_agent_metadata: Client Hints metadata for Sec-CH-UA-* headers
                and navigator.userAgentData.

        Returns:
            SetUserAgentOverrideCommand: CDP command to override user agent.
        """
        override_params = SetUserAgentOverrideParams(userAgent=user_agent)
        if accept_language is not None:
            override_params['acceptLanguage'] = accept_language
        if platform is not None:
            override_params['platform'] = platform
        if user_agent_metadata is not None:
            override_params['userAgentMetadata'] = user_agent_metadata
        return Command(
            method=EmulationMethod.SET_USER_AGENT_OVERRIDE,
            params=override_params,
        )


================================================
FILE: pydoll/commands/fetch_commands.py
================================================
from __future__ import annotations

from typing import TYPE_CHECKING, Optional

from pydoll.protocol.base import Command
from pydoll.protocol.fetch.methods import (
    AuthChallengeResponse,
    ContinueRequestParams,
    ContinueResponseParams,
    ContinueWithAuthParams,
    EnableParams,
    FailRequestParams,
    FetchMethod,
    FulfillRequestParams,
    GetResponseBodyParams,
    TakeResponseBodyAsStreamParams,
)
from pydoll.protocol.fetch.types import RequestPattern

if TYPE_CHECKING:
    from pydoll.protocol.fetch.methods import (
        ContinueRequestCommand,
        ContinueResponseCommand,
        ContinueWithAuthCommand,
        DisableCommand,
        EnableCommand,
        FailRequestCommand,
        FulfillRequestCommand,
        GetResponseBodyCommand,
        TakeResponseBodyAsStreamCommand,
    )
    from pydoll.protocol.fetch.types import (
        AuthChallengeResponseType,
        HeaderEntry,
        RequestStage,
        ResourceType,
    )
    from pydoll.protocol.network.types import ErrorReason, RequestMethod


class FetchCommands:
    """
    Command builders for the Fetch domain of the Chrome DevTools Protocol (CDP).

    CDP's Fetch domain allows interception and modification of network requests
    at the application layer. Every method here is a static factory that only
    assembles a command object; sending it to the browser is the caller's job.

    The builders cover:
    - Enabling and disabling fetch request interception
    - Continuing, fulfilling, or failing intercepted requests
    - Handling authentication challenges
    - Retrieving response bodies, directly or as a stream

    Optional arguments left as None are omitted from the generated params.
    """

    @staticmethod
    def continue_request(
        request_id: str,
        url: Optional[str] = None,
        method: Optional['RequestMethod'] = None,
        post_data: Optional[str] = None,
        headers: Optional[list['HeaderEntry']] = None,
        intercept_response: Optional[bool] = None,
    ) -> ContinueRequestCommand:
        """
        Creates a command to continue a paused fetch request.

        The URL, method, body and headers of the request can be overridden
        before it is resumed; anything left as None is not sent and therefore
        not overridden.

        Args:
            request_id (str): The ID of the fetch request to continue.
            url (Optional[str]): The new URL for the fetch request. Defaults to None.
            method (Optional[RequestMethod]): The HTTP method to use (e.g., 'GET',
                'POST'). Defaults to None.
            post_data (Optional[str]): The body data to send with the fetch
                request, as a string. Per the CDP documentation the value must
                be base64 encoded. Defaults to None.
            headers (Optional[list[HeaderEntry]]): A list of HTTP headers to include
                in the fetch request. Defaults to None.
            intercept_response (Optional[bool]): Indicates if the response
                should be intercepted. Defaults to None.

        Returns:
            Command[Response]: A command for continuing the fetch request.
        """
        request_params = ContinueRequestParams(requestId=request_id)
        if url is not None:
            request_params['url'] = url
        if method is not None:
            request_params['method'] = method
        if post_data is not None:
            request_params['postData'] = post_data
        if headers is not None:
            request_params['headers'] = headers
        if intercept_response is not None:
            request_params['interceptResponse'] = intercept_response
        return Command(method=FetchMethod.CONTINUE_REQUEST, params=request_params)

    @staticmethod
    def continue_request_with_auth(
        request_id: str,
        auth_challenge_response: AuthChallengeResponseType,
        proxy_username: Optional[str] = None,
        proxy_password: Optional[str] = None,
    ) -> ContinueWithAuthCommand:
        """
        Creates a command to continue a paused fetch request with
        authentication.

        The decision and the optional credentials are wrapped into a single
        authChallengeResponse object; username and password are only added to
        it when they are not None.

        Args:
            request_id (str): The ID of the fetch request to continue.
            auth_challenge_response (AuthChallengeResponseType): The authentication
                challenge response type.
            proxy_username (Optional[str]): The username for proxy authentication.
                Defaults to None.
            proxy_password (Optional[str]): The password for proxy authentication.
                Defaults to None.

        Returns:
            Command[Response]: A command for continuing the fetch request with
                authentication.
        """
        challenge_response = AuthChallengeResponse(response=auth_challenge_response)
        if proxy_username is not None:
            challenge_response['username'] = proxy_username
        if proxy_password is not None:
            challenge_response['password'] = proxy_password

        auth_params = ContinueWithAuthParams(
            requestId=request_id,
            authChallengeResponse=challenge_response,
        )
        return Command(method=FetchMethod.CONTINUE_WITH_AUTH, params=auth_params)

    @staticmethod
    def disable() -> DisableCommand:
        """
        Creates a command to disable fetch interception.

        The command takes no parameters and stops the browser from
        intercepting fetch requests.

        Returns:
            Command[Response]: A command for disabling fetch interception.
        """
        return Command(method=FetchMethod.DISABLE)

    @staticmethod
    def enable(
        handle_auth_requests: bool,
        url_pattern: str = '*',
        resource_type: Optional['ResourceType'] = None,
        request_stage: Optional['RequestStage'] = None,
    ) -> EnableCommand:
        """
        Creates a command to enable fetch interception.

        Exactly one request pattern is sent, built from `url_pattern` plus the
        resource type and request stage when those are not None.

        Args:
            handle_auth_requests (bool): Indicates if authentication requests
                should be handled.
            url_pattern (str): Pattern to match URLs for interception. Defaults to '*'.
            resource_type (Optional[ResourceType]): The type of resource to intercept.
                Defaults to None.
            request_stage (Optional[RequestStage]): The stage of the request to intercept.
                Defaults to None.

        Returns:
            Command[Response]: A command for enabling fetch interception.
        """
        pattern = RequestPattern(urlPattern=url_pattern)
        if resource_type is not None:
            pattern['resourceType'] = resource_type
        if request_stage is not None:
            pattern['requestStage'] = request_stage

        enable_params = EnableParams(
            patterns=[pattern],
            handleAuthRequests=handle_auth_requests,
        )
        return Command(method=FetchMethod.ENABLE, params=enable_params)

    @staticmethod
    def fail_request(request_id: str, error_reason: ErrorReason) -> FailRequestCommand:
        """
        Creates a command to simulate a failure in a fetch request.

        The intercepted request is failed with the given network-level reason
        instead of being sent.

        Args:
            request_id (str): The ID of the fetch request to fail.
            error_reason (ErrorReason): The reason for the failure.

        Returns:
            Command[Response]: A command for failing the fetch request.
        """
        fail_params = FailRequestParams(requestId=request_id, errorReason=error_reason)
        return Command(method=FetchMethod.FAIL_REQUEST, params=fail_params)

    @staticmethod
    def fulfill_request(
        request_id: str,
        response_code: int,
        response_headers: Optional[list['HeaderEntry']] = None,
        body: Optional[str] = None,
        response_phrase: Optional[str] = None,
    ) -> FulfillRequestCommand:
        """
        Creates a command to fulfill a fetch request with a custom response.

        The request id and status code are always sent; headers, body and
        phrase are only included when they are not None.

        Args:
            request_id (str): The ID of the fetch request to fulfill.
            response_code (int): The HTTP status code to return.
            response_headers (Optional[list[HeaderEntry]]): A list of response headers.
                Defaults to None.
            body (Optional[str]): The body content of the response, as a string.
                Per the CDP documentation the value must be base64 encoded.
                Defaults to None.
            response_phrase (Optional[str]): The response phrase (e.g., 'OK',
                'Not Found'). Defaults to None.

        Returns:
            Command[Response]: A command for fulfilling the fetch request.
        """
        fulfill_params = FulfillRequestParams(
            requestId=request_id,
            responseCode=response_code,
        )
        if response_headers is not None:
            fulfill_params['responseHeaders'] = response_headers
        if body is not None:
            fulfill_params['body'] = body
        if response_phrase is not None:
            fulfill_params['responsePhrase'] = response_phrase
        return Command(method=FetchMethod.FULFILL_REQUEST, params=fulfill_params)

    @staticmethod
    def get_response_body(request_id: str) -> GetResponseBodyCommand:
        """
        Creates a command to retrieve the response body of a fetch request.

        Args:
            request_id (str): The ID of the fetch request to retrieve the body
                from.

        Returns:
            Command[GetResponseBodyResponse]: A command for getting the response body.
        """
        body_params = GetResponseBodyParams(requestId=request_id)
        return Command(method=FetchMethod.GET_RESPONSE_BODY, params=body_params)

    @staticmethod
    def continue_response(
        request_id: str,
        response_code: Optional[int] = None,
        response_headers: Optional[list['HeaderEntry']] = None,
        response_phrase: Optional[str] = None,
    ) -> ContinueResponseCommand:
        """
        Creates a command to continue a fetch response for an intercepted
        request.

        The status code, headers and phrase of the response can be overridden;
        anything left as None is not sent and therefore not overridden.

        Args:
            request_id (str): The ID of the fetch request to continue the
                response for.
            response_code (Optional[int]): The HTTP status code to send.
                Defaults to None.
            response_headers (Optional[list[HeaderEntry]]): A list of response headers.
                Defaults to None.
            response_phrase (Optional[str]): The response phrase (e.g., 'OK').
                Defaults to None.

        Returns:
            Command[Response]: A command for continuing the fetch response.
        """
        response_params = ContinueResponseParams(requestId=request_id)
        if response_code is not None:
            response_params['responseCode'] = response_code
        if response_headers is not None:
            response_params['responseHeaders'] = response_headers
        if response_phrase is not None:
            response_params['responsePhrase'] = response_phrase
        return Command(method=FetchMethod.CONTINUE_RESPONSE, params=response_params)

    @staticmethod
    def take_response_body_as_stream(
        request_id: str,
    ) -> TakeResponseBodyAsStreamCommand:
        """
        Creates a command to take the response body as a stream.

        Receiving the body as a stream instead of in one piece can be useful
        for handling large responses.

        Args:
            request_id (str): The ID of the fetch request to take the response
                body stream from.

        Returns:
            Command[TakeResponseBodyAsStreamResponse]: A command for taking the response
                body as a stream.
        """
        stream_params = TakeResponseBodyAsStreamParams(requestId=request_id)
        return Command(method=FetchMethod.TAKE_RESPONSE_BODY_AS_STREAM, params=stream_params)


================================================
FILE: pydoll/commands/input_commands.py
================================================
from __future__ import annotations

from typing import TYPE_CHECKING, Optional

from pydoll.protocol.base import Command
from pydoll.protocol.input.methods import (
    DispatchDragEventParams,
    DispatchKeyEventParams,
    DispatchMouseEventParams,
    DispatchTouchEventParams,
    EmulateTouchFromMouseEventParams,
    ImeSetCompositionParams,
    InputMethod,
    InsertTextParams,
    SetIgnoreInputEventsParams,
    SetInterceptDragsParams,
    SynthesizePinchGestureParams,
    SynthesizeScrollGestureParams,
    SynthesizeTapGestureParams,
)

if TYPE_CHECKING:
    from pydoll.protocol.input.methods import (
        CancelDraggingCommand,
        DispatchDragEventCommand,
        DispatchKeyEventCommand,
        DispatchMouseEventCommand,
        DispatchTouchEventCommand,
        DragData,
        EmulateTouchFromMouseEventCommand,
        ImeSetCompositionCommand,
        InsertTextCommand,
        SetIgnoreInputEventsCommand,
        SetInterceptDragsCommand,
        SynthesizePinchGestureCommand,
        SynthesizeScrollGestureCommand,
        SynthesizeTapGestureCommand,
        TouchPoint,
    )
    from pydoll.protocol.input.types import (
        DragEventType,
        GestureSourceType,
        KeyEventType,
        KeyLocation,
        KeyModifier,
        MouseButton,
        MouseEventType,
        PointerType,
        TouchEventType,
    )


class InputCommands:
    """
    A class for simulating user input events using Chrome DevTools Protocol.

    The Input domain provides methods for simulating user input, including:
    - Keyboard events (key presses, releases)
    - Mouse events (clicks, movements, wheel)
    - Touch events (taps, multi-touch gestures)
    - Drag and drop events
    - Synthetic gestures (pinch, scroll, tap)

    These methods allow for programmatic control of input events without requiring
    actual user interaction, making it useful for testing and automation.
    """

    @staticmethod
    def cancel_dragging() -> CancelDraggingCommand:
        """
        Build the CDP command that cancels whatever drag is active in the page.

        Handy for interrupting a drag operation in progress, whether it was
        started through dispatchDragEvent or by some other means.

        Returns:
            Command: The CDP command to cancel dragging. It carries no params.
        """
        return Command(
            method=InputMethod.CANCEL_DRAGGING,
        )

    @staticmethod
    def dispatch_key_event(  # noqa: PLR0912
        type: KeyEventType,
        modifiers: Optional[KeyModifier] = None,
        timestamp: Optional[float] = None,
        text: Optional[str] = None,
        unmodified_text: Optional[str] = None,
        key_identifier: Optional[str] = None,
        code: Optional[str] = None,
        key: Optional[str] = None,
        windows_virtual_key_code: Optional[int] = None,
        native_virtual_key_code: Optional[int] = None,
        auto_repeat: Optional[bool] = None,
        is_keypad: Optional[bool] = None,
        is_system_key: Optional[bool] = None,
        location: Optional[KeyLocation] = None,
        commands: Optional[list[str]] = None,
    ) -> DispatchKeyEventCommand:
        """
        Build the CDP command that delivers a keyboard event to the page.

        Key presses, key releases and character input can all be simulated this
        way. `type` is always sent; any optional argument left as None is simply
        omitted from the payload.

        Args:
            type: Kind of key event. One of keyDown, keyUp, rawKeyDown, char.
                - keyDown: the user pressed a key
                - keyUp: the user released a key
                - rawKeyDown: physical key press, without text processing
                - char: produces a character without explicit key events
            modifiers: Bit field of the modifier keys held down:
                Alt=1, Ctrl=2, Meta/Command=4, Shift=8 (default: 0).
                Ctrl+Shift, for instance, is 10.
            timestamp: When the event occurred, in seconds since epoch.
            text: Text produced by running a virtual key code through a keyboard
                layout. Unnecessary for 'keyUp' and 'rawKeyDown' (default: "").
            unmodified_text: Text the keyboard would have produced with no
                modifiers other than shift; helps with shortcut handling
                (default: "").
            key_identifier: Unique key identifier such as 'U+0041' (default: "").
            code: DOM-defined string unique to each physical key, e.g. 'KeyA'
                (default: "").
            key: DOM-defined string giving the key's meaning under the active
                modifiers, keyboard layout, etc., e.g. 'AltGr' (default: "").
            windows_virtual_key_code: Windows virtual key code (default: 0).
            native_virtual_key_code: Native virtual key code (default: 0).
            auto_repeat: True if the event came from auto repeat (default: false).
            is_keypad: True if the event came from the keypad (default: false).
            is_system_key: True if this was a system key event (default: false).
            location: Keyboard side the event came from:
                0=Default, 1=Left, 2=Right (default: 0).
            commands: Editing commands sent along with the key event, e.g.
                'selectAll' (default: []). They are related to, but not the same
                as, the command names used by `document.execCommand` and
                NSStandardKeyBindingResponding.

        Returns:
            Command: The CDP command to dispatch the key event.
        """
        # Start from the single mandatory field, then attach only the optional
        # fields the caller actually supplied (insertion order is kept stable).
        payload = DispatchKeyEventParams(type=type)
        if modifiers is not None:
            payload['modifiers'] = modifiers
        if timestamp is not None:
            payload['timestamp'] = timestamp
        if text is not None:
            payload['text'] = text
        if unmodified_text is not None:
            payload['unmodifiedText'] = unmodified_text
        if key_identifier is not None:
            payload['keyIdentifier'] = key_identifier
        if code is not None:
            payload['code'] = code
        if key is not None:
            payload['key'] = key
        if windows_virtual_key_code is not None:
            payload['windowsVirtualKeyCode'] = windows_virtual_key_code
        if native_virtual_key_code is not None:
            payload['nativeVirtualKeyCode'] = native_virtual_key_code
        if auto_repeat is not None:
            payload['autoRepeat'] = auto_repeat
        if is_keypad is not None:
            payload['isKeypad'] = is_keypad
        if is_system_key is not None:
            payload['isSystemKey'] = is_system_key
        if location is not None:
            payload['location'] = location
        if commands is not None:
            payload['commands'] = commands
        return Command(
            method=InputMethod.DISPATCH_KEY_EVENT,
            params=payload,
        )

    @staticmethod
    def dispatch_mouse_event(
        type: MouseEventType,
        x: int,
        y: int,
        modifiers: Optional[KeyModifier] = None,
        timestamp: Optional[float] = None,
        button: Optional[MouseButton] = None,
        click_count: Optional[int] = None,
        force: Optional[float] = None,
        tangential_pressure: Optional[float] = None,
        tilt_x: Optional[float] = None,
        tilt_y: Optional[float] = None,
        twist: Optional[int] = None,
        delta_x: Optional[float] = None,
        delta_y: Optional[float] = None,
        pointer_type: Optional[PointerType] = None,
    ) -> DispatchMouseEventCommand:
        """
        Build the CDP command that delivers a mouse event to the page.

        Clicks, pointer movement and wheel scrolling can all be simulated this
        way. `type`, `x` and `y` are always sent; any optional argument left as
        None is omitted from the payload.

        Args:
            type: Kind of mouse event, one of:
                - mousePressed: a mouse button went down
                - mouseReleased: a mouse button went up
                - mouseMoved: the pointer moved
                - mouseWheel: the wheel was rotated
            x: Event X coordinate in CSS pixels, relative to the main frame's
                viewport.
            y: Event Y coordinate in CSS pixels, relative to the main frame's
                viewport. 0 is the top of the viewport and Y grows downwards.
            modifiers: Bit field of the modifier keys held down:
                Alt=1, Ctrl=2, Meta/Command=4, Shift=8 (default: 0).
            timestamp: When the event occurred, in seconds since epoch.
            button: Button being pressed or released (default: "none").
                One of "none", "left", "middle", "right", "back", "forward".
            click_count: How many times the button was clicked (default: 0);
                2 means a double-click.
            force: Normalized pressure in the range [0,1] (default: 0). Mostly
                relevant for pressure-sensitive input.
            tangential_pressure: Normalized tangential pressure in the range
                [-1,1] (default: 0). Used for stylus input.
            tilt_x: Angle in degrees, within [-90,90], between the Y-Z plane and
                the plane holding both the stylus axis and the Y axis. Positive
                tiltX leans to the right (default: 0).
            tilt_y: Angle in degrees, within [-90,90], between the X-Z plane and
                the plane holding both the stylus axis and the X axis. Positive
                tiltY leans towards the user (default: 0).
            twist: Clockwise rotation of a pen stylus about its own major axis,
                in degrees within [0,359] (default: 0).
            delta_x: Horizontal delta in CSS pixels for a mouse wheel event
                (default: 0).
            delta_y: Vertical delta in CSS pixels for a mouse wheel event
                (default: 0).
            pointer_type: Pointer type, "mouse" or "pen" (default: "mouse").

        Returns:
            Command: The CDP command to dispatch the mouse event.
        """
        # Mandatory fields first; optional ones are attached only when given.
        payload = DispatchMouseEventParams(type=type, x=x, y=y)
        if modifiers is not None:
            payload['modifiers'] = modifiers
        if timestamp is not None:
            payload['timestamp'] = timestamp
        if button is not None:
            payload['button'] = button
        if click_count is not None:
            payload['clickCount'] = click_count
        if force is not None:
            payload['force'] = force
        if tangential_pressure is not None:
            payload['tangentialPressure'] = tangential_pressure
        if tilt_x is not None:
            payload['tiltX'] = tilt_x
        if tilt_y is not None:
            payload['tiltY'] = tilt_y
        if twist is not None:
            payload['twist'] = twist
        if delta_x is not None:
            payload['deltaX'] = delta_x
        if delta_y is not None:
            payload['deltaY'] = delta_y
        if pointer_type is not None:
            payload['pointerType'] = pointer_type
        return Command(
            method=InputMethod.DISPATCH_MOUSE_EVENT,
            params=payload,
        )

    @staticmethod
    def dispatch_touch_event(
        type: TouchEventType,
        touch_points: list[TouchPoint],
        modifiers: Optional[KeyModifier] = None,
        timestamp: Optional[float] = None,
    ) -> DispatchTouchEventCommand:
        """
        Build the CDP command that delivers a touch event to the page.

        Lets touch interaction be simulated on touch-enabled devices or in an
        emulated touch environment.

        Args:
            type: Kind of touch event, one of:
                - touchStart: a touch began; at least one point is required
                - touchEnd: a touch ended; points no longer pressed should be
                  removed
                - touchMove: a touch moved; active points should be updated
                - touchCancel: the touch was canceled; clears all touch points
                touchEnd and touchCancel must carry no touch points, whereas
                touchStart and touchMove must carry at least one.
            touch_points: Active touch points, each with coordinates and other
                properties. One event is generated per point that changed since
                the previous event, emulating points being pressed, moved or
                released one at a time.
            modifiers: Bit field of the modifier keys held down:
                Alt=1, Ctrl=2, Meta/Command=4, Shift=8 (default: 0).
            timestamp: When the event occurred, in seconds since epoch.

        Returns:
            Command: The CDP command to dispatch the touch event.
        """
        payload = DispatchTouchEventParams(type=type, touchPoints=touch_points)
        # Optional fields are sent only when the caller supplied them.
        if modifiers is not None:
            payload['modifiers'] = modifiers
        if timestamp is not None:
            payload['timestamp'] = timestamp
        return Command(
            method=InputMethod.DISPATCH_TOUCH_EVENT,
            params=payload,
        )

    @staticmethod
    def set_ignore_input_events(ignore: bool) -> SetIgnoreInputEventsCommand:
        """
        Build the CDP command that toggles ignoring of input events.

        With `ignore` set to true every input event is ignored. That is useful
        while auditing a page, during automated tests, or whenever user
        interaction must be blocked while some operation runs.

        Args:
            ignore: When true, processing of input events is ignored.

        Returns:
            Command: The CDP command to set ignore input events.
        """
        return Command(
            method=InputMethod.SET_IGNORE_INPUT_EVENTS,
            params=SetIgnoreInputEventsParams(ignore=ignore),
        )

    @staticmethod
    def dispatch_drag_event(
        type: DragEventType,
        x: int,
        y: int,
        data: DragData,
        modifiers: Optional[KeyModifier] = None,
    ) -> DispatchDragEventCommand:
        """
        Build the CDP command that delivers a drag event into the page.

        This experimental method simulates drag and drop by dispatching drag
        events at the given coordinates.

        Args:
            type: Kind of drag event, one of:
                - dragEnter: a dragged item enters a valid drop target
                - dragOver: a dragged item is moving over a valid drop target
                - drop: an item is dropped on a valid drop target
                - dragCancel: a drag operation is being canceled
            x: Event X coordinate in CSS pixels, relative to the main frame's
                viewport.
            y: Event Y coordinate in CSS pixels, relative to the main frame's
                viewport. 0 is the top of the viewport and Y grows downwards.
            data: Drag data: the items being dragged, their MIME types and
                other information.
            modifiers: Bit field of the modifier keys held down:
                Alt=1, Ctrl=2, Meta/Command=4, Shift=8 (default: 0).

        Returns:
            Command: The CDP command to dispatch the drag event.
        """
        payload = DispatchDragEventParams(type=type, data=data, x=x, y=y)
        # `modifiers` is the only optional field; leave it out when not given.
        if modifiers is not None:
            payload['modifiers'] = modifiers
        return Command(
            method=InputMethod.DISPATCH_DRAG_EVENT,
            params=payload,
        )

    @staticmethod
    def emulate_touch_from_mouse_event(  # noqa: PLR0913, PLR0917
        type: MouseEventType,
        x: int,
        y: int,
        button: MouseButton,
        timestamp: Optional[float] = None,
        delta_x: Optional[float] = None,
        delta_y: Optional[float] = None,
        modifiers: Optional[KeyModifier] = None,
        click_count: Optional[int] = None,
    ) -> EmulateTouchFromMouseEventCommand:
        """
        Build the CDP command that emulates a touch event from mouse event data.

        This experimental method turns mouse events into touch events, which
        helps when testing touch interaction where no touch input is available.

        Args:
            type: Kind of mouse event to convert, one of:
                - mousePressed: converted to touchStart
                - mouseReleased: converted to touchEnd
                - mouseMoved: converted to touchMove
                - mouseWheel: may trigger scrolling
            x: Mouse pointer X coordinate in device-independent pixels (DIP).
            y: Mouse pointer Y coordinate in DIP.
            button: Mouse button. Only "none", "left", "right" are supported.
            timestamp: When the event occurred, in seconds since epoch
                (default: current time).
            delta_x: X delta in DIP for a mouse wheel event (default: 0).
                Used for scrolling.
            delta_y: Y delta in DIP for a mouse wheel event (default: 0).
                Used for scrolling.
            modifiers: Bit field of the modifier keys held down:
                Alt=1, Ctrl=2, Meta/Command=4, Shift=8 (default: 0).
            click_count: How many times the button was clicked (default: 0);
                2 means a double-click.

        Returns:
            Command: The CDP command to emulate touch from mouse event.
        """
        payload = EmulateTouchFromMouseEventParams(type=type, x=x, y=y, button=button)
        # Optional fields are sent only when the caller supplied them.
        if timestamp is not None:
            payload['timestamp'] = timestamp
        if delta_x is not None:
            payload['deltaX'] = delta_x
        if delta_y is not None:
            payload['deltaY'] = delta_y
        if modifiers is not None:
            payload['modifiers'] = modifiers
        if click_count is not None:
            payload['clickCount'] = click_count
        return Command(
            method=InputMethod.EMULATE_TOUCH_FROM_MOUSE_EVENT,
            params=payload,
        )

    @staticmethod
    def ime_set_composition(
        text: str,
        selection_start: int,
        selection_end: int,
        replacement_start: Optional[int] = None,
        replacement_end: Optional[int] = None,
    ) -> ImeSetCompositionCommand:
        """
        Build the CDP command that sets the current IME candidate text.

        This experimental method supplies text for Input Method Editors (IME),
        used for languages whose characters take more keystrokes than there are
        characters (such as Chinese, Japanese, Korean).

        Commit the final text with imeCommitComposition. To cancel a
        composition, call imeSetComposition with an empty string as text.

        Args:
            text: Text to insert as the IME composition.
            selection_start: Where the selection starts inside the composition
                text.
            selection_end: Where the selection ends inside the composition text.
            replacement_start: Where the text to be replaced starts
                (default: same as selection_start).
            replacement_end: Where the text to be replaced ends
                (default: same as selection_end).

        Returns:
            Command: The CDP command to set IME composition.
        """
        payload = ImeSetCompositionParams(
            text=text,
            selectionStart=selection_start,
            selectionEnd=selection_end,
        )
        # The replacement range is optional; omit whichever bound is not given.
        if replacement_start is not None:
            payload['replacementStart'] = replacement_start
        if replacement_end is not None:
            payload['replacementEnd'] = replacement_end
        return Command(
            method=InputMethod.IME_SET_COMPOSITION,
            params=payload,
        )

    @staticmethod
    def insert_text(
        text: str,
    ) -> InsertTextCommand:
        """
        Build the CDP command that inserts text not produced by a key press.

        This experimental method suits text that normally arrives from
        somewhere other than the keyboard, for example an emoji picker, an IME
        or a clipboard paste.

        Args:
            text: Text to insert.

        Returns:
            Command: The CDP command to insert text.
        """
        return Command(
            method=InputMethod.INSERT_TEXT,
            params=InsertTextParams(text=text),
        )

    @staticmethod
    def set_intercept_drags(enabled: bool) -> SetInterceptDragsCommand:
        """
        Build the CDP command that turns drag-and-drop interception on or off.

        This experimental method suppresses the default drag and drop behavior
        and emits Input.dragIntercepted events instead. Drag and drop can then
        be driven directly through Input.dispatchDragEvent.

        Useful for implementing custom drag and drop logic, or for exercising
        drag and drop behavior in automated tests.

        Args:
            enabled: When true, drag events are intercepted and reported as
                dragIntercepted events, and the default behavior is prevented.

        Returns:
            Command: The CDP command to set drag interception.
        """
        return Command(
            method=InputMethod.SET_INTERCEPT_DRAGS,
            params=SetInterceptDragsParams(enabled=enabled),
        )

    @staticmethod
    def synthesize_pinch_gesture(
        x: int,
        y: int,
        scale_factor: float,
        relative_speed: Optional[int] = None,
        gesture_source_type: Optional[GestureSourceType] = None,
    ) -> SynthesizePinchGestureCommand:
        """
        Build the CDP command that synthesizes a pinch gesture over time.

        This experimental method produces a synthetic pinch (zoom in/out) by
        issuing the appropriate touch events over a period of time, which is
        useful for testing pinch-to-zoom in web applications.

        Args:
            x: X coordinate, in CSS pixels, where the gesture starts.
            y: Y coordinate, in CSS pixels, where the gesture starts.
            scale_factor: Relative scale factor after zooming:
                - >1.0 zooms in (fingers moving apart)
                - <1.0 zooms out (fingers moving together)
            relative_speed: Relative pointer speed in pixels per second
                (default: 800). Governs how fast the gesture runs.
            gesture_source_type: Type of input events to generate:
                - 'default': Platform's preferred input type
                - 'touch': Touch input
                - 'mouse': Mouse input

        Returns:
            Command: The CDP command to synthesize a pinch gesture.
        """
        payload = SynthesizePinchGestureParams(x=x, y=y, scaleFactor=scale_factor)
        # Optional fields are sent only when the caller supplied them.
        if relative_speed is not None:
            payload['relativeSpeed'] = relative_speed
        if gesture_source_type is not None:
            payload['gestureSourceType'] = gesture_source_type
        return Command(
            method=InputMethod.SYNTHESIZE_PINCH_GESTURE,
            params=payload,
        )

    @staticmethod
    def synthesize_scroll_gesture(
        x: int,
        y: int,
        x_distance: Optional[float] = None,
        y_distance: Optional[float] = None,
        x_overscroll: Optional[float] = None,
        y_overscroll: Optional[float] = None,
        prevent_fling: Optional[bool] = None,
        speed: Optional[int] = None,
        gesture_source_type: Optional[GestureSourceType] = None,
        repeat_count: Optional[int] = None,
        repeat_delay_ms: Optional[int] = None,
        interaction_marker_name: Optional[str] = None,
    ) -> SynthesizeScrollGestureCommand:
        """
        Build the CDP command that synthesizes a scroll gesture over time.

        This experimental method produces a synthetic scroll by issuing the
        appropriate touch events over a period of time, which is useful for
        testing scrolling behavior in web applications. `x` and `y` are always
        sent; any optional argument left as None is omitted from the payload.

        Args:
            x: X coordinate, in CSS pixels, where the gesture starts.
            y: Y coordinate, in CSS pixels, where the gesture starts.
            x_distance: Distance to scroll along the X axis
                (positive to scroll left).
            y_distance: Distance to scroll along the Y axis
                (positive to scroll up).
            x_overscroll: Extra pixels to scroll back along the X axis, on top
                of the given distance. Produces an overscroll (rubber-banding)
                effect.
            y_overscroll: Extra pixels to scroll back along the Y axis, on top
                of the given distance. Produces an overscroll (rubber-banding)
                effect.
            prevent_fling: Prevent fling (default: true). When false, a fling
                animation might carry on after the gesture.
            speed: Swipe speed in pixels per second (default: 800).
            gesture_source_type: Type of input events to generate:
                - 'default': Platform's preferred input type
                - 'touch': Touch input
                - 'mouse': Mouse input
            repeat_count: How many times to repeat the gesture (default: 0).
            repeat_delay_ms: Delay in milliseconds between repeats
                (default: 250).
            interaction_marker_name: Name of the interaction markers to
                generate, if not empty. Used to track gesture timing in
                performance measurements.

        Returns:
            Command: The CDP command to synthesize a scroll gesture.
        """
        # Mandatory start point first; optional fields only when given.
        payload = SynthesizeScrollGestureParams(x=x, y=y)
        if x_distance is not None:
            payload['xDistance'] = x_distance
        if y_distance is not None:
            payload['yDistance'] = y_distance
        if x_overscroll is not None:
            payload['xOverscroll'] = x_overscroll
        if y_overscroll is not None:
            payload['yOverscroll'] = y_overscroll
        if prevent_fling is not None:
            payload['preventFling'] = prevent_fling
        if speed is not None:
            payload['speed'] = speed
        if gesture_source_type is not None:
            payload['gestureSourceType'] = gesture_source_type
        if repeat_count is not None:
            payload['repeatCount'] = repeat_count
        if repeat_delay_ms is not None:
            payload['repeatDelayMs'] = repeat_delay_ms
        if interaction_marker_name is not None:
            payload['interactionMarkerName'] = interaction_marker_name
        return Command(
            method=InputMethod.SYNTHESIZE_SCROLL_GESTURE,
            params=payload,
        )

    @staticmethod
    def synthesize_tap_gesture(
        x: int,
        y: int,
        duration: Optional[int] = None,
        tap_count: Optional[int] = None,
        gesture_source_type: Optional[GestureSourceType] = None,
    ) -> SynthesizeTapGestureCommand:
        """
        Build the CDP command that synthesizes a tap gesture over time.

        This experimental method produces a synthetic tap by issuing the
        appropriate touch events over a period of time, which is useful for
        testing touch interaction in web applications.

        Args:
            x: X coordinate, in CSS pixels, where the gesture starts.
            y: Y coordinate, in CSS pixels, where the gesture starts.
            duration: Milliseconds between the touchdown and touchup events
                (default: 50). Governs how long the tap takes.
            tap_count: How many times to tap (default: 1); 2 is a double tap.
            gesture_source_type: Type of input events to generate:
                - 'default': Platform's preferred input type
                - 'touch': Touch input
                - 'mouse': Mouse input

        Returns:
            Command: The CDP command to synthesize a tap gesture.
        """
        payload = SynthesizeTapGestureParams(x=x, y=y)
        # Optional fields are sent only when the caller supplied them.
        if duration is not None:
            payload['duration'] = duration
        if tap_count is not None:
            payload['tapCount'] = tap_count
        if gesture_source_type is not None:
            payload['gestureSourceType'] = gesture_source_type
        return Command(
            method=InputMethod.SYNTHESIZE_TAP_GESTURE,
            params=payload,
        )


================================================
FILE: pydoll/commands/network_commands.py
================================================
from __future__ import annotations

from typing import TYPE_CHECKING, Optional

from pydoll.protocol.base import Command
from pydoll.protocol.network.methods import (
    DeleteCookiesParams,
    EmulateNetworkConditionsParams,
    EnableReportingApiParams,
    GetCertificateParams,
    GetCookiesParams,
    GetRequestPostDataParams,
    GetResponseBodyForInterceptionParams,
    GetResponseBodyParams,
    GetSecurityIsolationStatusParams,
    LoadNetworkResourceParams,
    NetworkEnableParams,
    NetworkMethod,
    ReplayXHRParams,
    SearchInResponseBodyParams,
    SetAcceptedEncodingsParams,
    SetAttachDebugStackParams,
    SetBlockedURLsParams,
    SetBypassServiceWorkerParams,
    SetCacheDisabledParams,
    SetCookieControlsParams,
    SetCookieParams,
    SetCookiesParams,
    SetExtraHTTPHeadersParams,
    SetUserAgentOverrideParams,
    StreamResourceContentParams,
    TakeResponseBodyForInterceptionAsStreamParams,
)

if TYPE_CHECKING:
    from pydoll.protocol.emulation.types import UserAgentMetadata
    from pydoll.protocol.network.methods import (
        ClearAcceptedEncodingsOverrideCommand,
        ClearBrowserCacheCommand,
        ClearBrowserCookiesCommand,
        ClearCookiesCommand,
        DisableCommand,
        EmulateNetworkConditionsCommand,
        EnableCommand,
        EnableReportingApiCommand,
        GetCertificateCommand,
        GetCookiesCommand,
        GetRequestPostDataCommand,
        GetResponseBodyCommand,
        GetResponseBodyForInterceptionCommand,
        GetSecurityIsolationStatusCommand,
        HeaderEntry,
        LoadNetworkResourceCommand,
        ReplayXHRCommand,
        SearchInResponseBodyCommand,
        SetAcceptedEncodingsCommand,
        SetAttachDebugStackCommand,
        SetBlockedURLsCommand,
        SetBypassServiceWorkerCommand,
        SetCacheDisabledCommand,
        SetCookieCommand,
        SetCookieControlsCommand,
        SetCookiesCommand,
        SetExtraHTTPHeadersCommand,
        SetUserAgentOverrideCommand,
        StreamResourceContentCommand,
        TakeResponseBodyForInterceptionAsStreamCommand,
    )
    from pydoll.protocol.network.types import (
        ConnectionType,
        ContentEncoding,
        CookiePartitionKey,
        CookiePriority,
        CookieSameSite,
        CookieSourceScheme,
        LoadNetworkResourceOptions,
    )


class NetworkCommands:
    """
    Builders for Chrome DevTools Protocol commands of the Network domain.

    Every method on this class is a static factory: it assembles the
    parameter payload for one Network method and returns it wrapped in a
    ``Command``. Nothing is sent to the browser from here; dispatching the
    returned command is the caller's responsibility.

    The commands cover, among other things:
    - Request/response headers and bodies
    - Resource timing and caching behavior
    - Cookie management and security details
    - Network conditions emulation
    - Traffic interception and modification

    Optional arguments left as ``None`` are omitted from the payload
    instead of being included with a null value.
    """

    @staticmethod
    def clear_browser_cache() -> ClearBrowserCacheCommand:
        """
        Build the parameterless command that clears the browser cache.

        Typical reasons to issue it:
        - Force stylesheets, scripts, images and cached API responses to be
          fetched again
        - Reproduce or rule out stale-content problems
        - Benchmark page loads without cache influence

        Returns:
            Command: command carrying only the
                NetworkMethod.CLEAR_BROWSER_CACHE method; no params attached.
        """
        return Command(method=NetworkMethod.CLEAR_BROWSER_CACHE)

    @staticmethod
    def clear_browser_cookies() -> ClearBrowserCookiesCommand:
        """
        Build the parameterless command that removes all browser cookies.

        Useful to start from a clean session when previously stored cookies
        could influence the behavior under test.

        Returns:
            Command: command carrying only the
                NetworkMethod.CLEAR_BROWSER_COOKIES method; no params attached.
        """
        return Command(method=NetworkMethod.CLEAR_BROWSER_COOKIES)

    @staticmethod
    def delete_cookies(
        name: str,
        url: Optional[str] = None,
        domain: Optional[str] = None,
        path: Optional[str] = None,
        partition_key: Optional[CookiePartitionKey] = None,
    ) -> ClearCookiesCommand:
        """
        Build the command that deletes cookies matching the given criteria.

        Only ``name`` is mandatory. Each additional filter narrows the
        deletion and is included in the payload only when it is not None.

        Args:
            name: Name of the cookies to remove.
            url: Restrict deletion to cookies matching this URL.
            domain: Restrict deletion to this domain.
            path: Restrict deletion to this path.
            partition_key: Partition key of the cookies to remove.

        Returns:
            Command: command for NetworkMethod.DELETE_COOKIES with the
                assembled filters.
        """
        payload = DeleteCookiesParams(name=name)

        # Unset filters are left out entirely rather than sent as null.
        if url is not None:
            payload['url'] = url
        if domain is not None:
            payload['domain'] = domain
        if path is not None:
            payload['path'] = path
        if partition_key is not None:
            payload['partitionKey'] = partition_key

        return Command(method=NetworkMethod.DELETE_COOKIES, params=payload)

    @staticmethod
    def disable() -> DisableCommand:
        """
        Build the parameterless command that turns network monitoring off.

        Intended for moments when network events are not needed, e.g. to
        cut overhead during non-network work, to pause monitoring for a
        while, or to wrap up a network-related test.

        Returns:
            Command: command carrying only the NetworkMethod.DISABLE
                method; no params attached.
        """
        return Command(method=NetworkMethod.DISABLE)

    @staticmethod
    def enable(
        max_total_buffer_size: Optional[int] = None,
        max_resource_buffer_size: Optional[int] = None,
        max_post_data_size: Optional[int] = None,
    ) -> EnableCommand:
        """
        Build the command that turns network monitoring on.

        All three limits are optional; a limit left as None is not put
        into the payload at all.

        Args:
            max_total_buffer_size: Total buffer for network data, in bytes.
            max_resource_buffer_size: Per-resource buffer limit, in bytes.
            max_post_data_size: Largest POST payload to capture, in bytes.

        Returns:
            Command: command for NetworkMethod.ENABLE with whichever
                limits were supplied.
        """
        buffer_limits = NetworkEnableParams()

        if max_total_buffer_size is not None:
            buffer_limits['maxTotalBufferSize'] = max_total_buffer_size
        if max_resource_buffer_size is not None:
            buffer_limits['maxResourceBufferSize'] = max_resource_buffer_size
        if max_post_data_size is not None:
            buffer_limits['maxPostDataSize'] = max_post_data_size

        return Command(method=NetworkMethod.ENABLE, params=buffer_limits)

    @staticmethod
    def get_cookies(
        urls: Optional[list[str]] = None,
    ) -> GetCookiesCommand:
        """
        Build the command that retrieves cookies.

        Args:
            urls: URLs used to scope the retrieval. When None, the ``urls``
                field is omitted from the payload and the browser applies
                its own default scope. A list that is passed explicitly,
                even an empty one, is forwarded as given.

        Returns:
            Command: command for NetworkMethod.GET_COOKIES.
        """
        query = GetCookiesParams()
        if urls is not None:
            query['urls'] = urls
        return Command(method=NetworkMethod.GET_COOKIES, params=query)

    @staticmethod
    def get_request_post_data(
        request_id: str,
    ) -> GetRequestPostDataCommand:
        """
        Build the command that fetches the POST data of one request.

        Helpful when inspecting form submissions, debugging API calls or
        monitoring uploads.

        Args:
            request_id: Identifier of the network request whose POST data
                is wanted.

        Returns:
            Command: command for NetworkMethod.GET_REQUEST_POST_DATA with
                ``requestId`` set.
        """
        return Command(
            method=NetworkMethod.GET_REQUEST_POST_DATA,
            params=GetRequestPostDataParams(requestId=request_id),
        )

    @staticmethod
    def get_response_body(
        request_id: str,
    ) -> GetResponseBodyCommand:
        """
        Build the command that fetches the body of a network response.

        Args:
            request_id: Identifier of the network request whose response
                body is wanted.

        Returns:
            Command: command for NetworkMethod.GET_RESPONSE_BODY with
                ``requestId`` set.
        """
        return Command(
            method=NetworkMethod.GET_RESPONSE_BODY,
            params=GetResponseBodyParams(requestId=request_id),
        )

    @staticmethod
    def set_cache_disabled(cache_disabled: bool) -> SetCacheDisabledCommand:
        """
        Build the command that switches the browser cache on or off.

        Commonly used to force fresh content, to test how resources
        update, or to measure the performance impact of caching.

        Args:
            cache_disabled: True to disable caching, False to enable it.

        Returns:
            Command: command for NetworkMethod.SET_CACHE_DISABLED with
                ``cacheDisabled`` set.
        """
        return Command(
            method=NetworkMethod.SET_CACHE_DISABLED,
            params=SetCacheDisabledParams(cacheDisabled=cache_disabled),
        )

    @staticmethod
    def set_cookie(
        name: str,
        value: str,
        url: Optional[str] = None,
        domain: Optional[str] = None,
        path: Optional[str] = None,
        secure: Optional[bool] = None,
        http_only: Optional[bool] = None,
        same_site: Optional[CookieSameSite] = None,
        expires: Optional[float] = None,
        priority: Optional[CookiePriority] = None,
        same_party: Optional[bool] = None,
        source_scheme: Optional[CookieSourceScheme] = None,
        source_port: Optional[int] = None,
        partition_key: Optional[CookiePartitionKey] = None,
    ) -> SetCookieCommand:
        """
        Build the command that creates or updates a single cookie.

        ``name`` and ``value`` always go into the payload. Every other
        attribute is added under its camelCase protocol key only when the
        argument is not None.

        Args:
            name: Cookie name.
            value: Cookie value.
            url: Target URL for the cookie.
            domain: Cookie domain scope.
            path: Cookie path scope.
            secure: Whether the cookie requires HTTPS.
            http_only: Whether the cookie is hidden from JavaScript.
            same_site: Cross-site access policy.
            expires: Expiration timestamp.
            priority: Cookie priority level.
            same_party: First-Party Sets flag.
            source_scheme: Cookie source scheme.
            source_port: Cookie source port.
            partition_key: Storage partition key.

        Returns:
            Command: command for NetworkMethod.SET_COOKIE with the
                assembled cookie attributes.
        """
        cookie = SetCookieParams(name=name, value=value)

        # Scope attributes.
        if url is not None:
            cookie['url'] = url
        if domain is not None:
            cookie['domain'] = domain
        if path is not None:
            cookie['path'] = path

        # Security and lifetime attributes.
        if secure is not None:
            cookie['secure'] = secure
        if http_only is not None:
            cookie['httpOnly'] = http_only
        if same_site is not None:
            cookie['sameSite'] = same_site
        if expires is not None:
            cookie['expires'] = expires
        if priority is not None:
            cookie['priority'] = priority
        if same_party is not None:
            cookie['sameParty'] = same_party

        # Origin and partitioning attributes.
        if source_scheme is not None:
            cookie['sourceScheme'] = source_scheme
        if source_port is not None:
            cookie['sourcePort'] = source_port
        if partition_key is not None:
            cookie['partitionKey'] = partition_key

        return Command(method=NetworkMethod.SET_COOKIE, params=cookie)

    @staticmethod
    def set_cookies(cookies: list[SetCookieParams]) -> SetCookiesCommand:
        """
        Build the command that sets several cookies in one call.

        Convenient for restoring session state or preparing multiple
        authentication states without issuing one command per cookie.

        Args:
            cookies: Cookie parameter dictionaries (name, value and any
                further attributes). The list is forwarded as given.

        Returns:
            Command: command for NetworkMethod.SET_COOKIES with ``cookies``
                set.
        """
        return Command(
            method=NetworkMethod.SET_COOKIES,
            params=SetCookiesParams(cookies=cookies),
        )

    @staticmethod
    def set_extra_http_headers(
        headers: list[HeaderEntry],
    ) -> SetExtraHTTPHeadersCommand:
        """
        Build the command that adds custom HTTP headers to requests.

        Remember that sensitive headers (e.g. Authorization) stay in
        effect until they are replaced or cleared.

        Args:
            headers: Header entries to send; forwarded unchanged under the
                ``headers`` key.

        Returns:
            Command: command for NetworkMethod.SET_EXTRA_HTTP_HEADERS.

        NOTE(review): the CDP reference describes ``headers`` for
        Network.setExtraHTTPHeaders as a name-to-value map, while this
        builder forwards a list of entries -- confirm the browser accepts
        this shape.
        """
        return Command(
            method=NetworkMethod.SET_EXTRA_HTTP_HEADERS,
            params=SetExtraHTTPHeadersParams(headers=headers),
        )

    @staticmethod
    def set_useragent_override(
        user_agent: str,
        accept_language: Optional[str] = None,
        platform: Optional[str] = None,
        user_agent_metadata: Optional[UserAgentMetadata] = None,
    ) -> SetUserAgentOverrideCommand:
        """
        Build the command that overrides the browser's User-Agent.

        ``user_agent`` is always sent; the remaining fields are attached
        only when they are not None.

        Args:
            user_agent: Complete User-Agent string.
            accept_language: Language preference to report.
            platform: Platform identifier to report.
            user_agent_metadata: Detailed User-Agent metadata.

        Returns:
            Command: command for NetworkMethod.SET_USER_AGENT_OVERRIDE.
        """
        override = SetUserAgentOverrideParams(userAgent=user_agent)

        if accept_language is not None:
            override['acceptLanguage'] = accept_language
        if platform is not None:
            override['platform'] = platform
        if user_agent_metadata is not None:
            override['userAgentMetadata'] = user_agent_metadata

        return Command(method=NetworkMethod.SET_USER_AGENT_OVERRIDE, params=override)

    @staticmethod
    def clear_accepted_encodings_override() -> ClearAcceptedEncodingsOverrideCommand:
        """
        Build the parameterless command that drops any accepted-encodings
        override.

        Use it to return to the default content-encoding behavior, for
        instance after encoding tests or while debugging compression.

        Returns:
            Command: command carrying only the
                NetworkMethod.CLEAR_ACCEPTED_ENCODINGS_OVERRIDE method; no
                params attached.
        """
        return Command(method=NetworkMethod.CLEAR_ACCEPTED_ENCODINGS_OVERRIDE)

    @staticmethod
    def enable_reporting_api(
        enabled: bool,
    ) -> EnableReportingApiCommand:
        """
        Build the command that toggles Reporting API tracking.

        Args:
            enabled: True to enable, False to disable.

        Returns:
            Command: command for NetworkMethod.ENABLE_REPORTING_API with
                the flag stored under the ``enabled`` key.

        NOTE(review): the CDP reference names this parameter ``enable``
        for Network.enableReportingApi -- confirm the ``enabled`` key used
        here is what the browser expects.
        """
        return Command(
            method=NetworkMethod.ENABLE_REPORTING_API,
            params=EnableReportingApiParams(enabled=enabled),
        )

    @staticmethod
    def search_in_response_body(
        request_id: str,
        query: str,
        case_sensitive: bool = False,
        is_regex: bool = False,
    ) -> SearchInResponseBodyCommand:
        """
        Build the command that searches inside a response body.

        Args:
            request_id: Identifier of the request whose response is searched.
            query: Search string or pattern.
            case_sensitive: Whether matching is case sensitive.
            is_regex: Whether ``query`` is treated as a regular expression.

        Returns:
            Command: command for NetworkMethod.SEARCH_IN_RESPONSE_BODY.

        Note: with the default arguments both flags are sent as False. A
        flag is left out of the payload only if None is passed explicitly.
        """
        search = SearchInResponseBodyParams(requestId=request_id, query=query)

        if case_sensitive is not None:
            search['caseSensitive'] = case_sensitive
        if is_regex is not None:
            search['isRegex'] = is_regex

        return Command(method=NetworkMethod.SEARCH_IN_RESPONSE_BODY, params=search)

    @staticmethod
    def set_blocked_urls(urls: list[str]) -> SetBlockedURLsCommand:
        """
        Build the command that blocks the given URLs from loading.

        Typical uses are simulating ad/tracker blocking, controlling which
        resources load, and exercising error handling.

        Args:
            urls: URL patterns to block; forwarded unchanged under the
                ``urls`` key.

        Returns:
            Command: command for NetworkMethod.SET_BLOCKED_URLS.
        """
        return Command(
            method=NetworkMethod.SET_BLOCKED_URLS,
            params=SetBlockedURLsParams(urls=urls),
        )

    @staticmethod
    def set_bypass_service_worker(
        bypass: bool,
    ) -> SetBypassServiceWorkerCommand:
        """
        Build the command that toggles Service Worker bypassing.

        Handy for observing direct network behavior or debugging caching
        problems without a Service Worker in the path.

        Args:
            bypass: True to skip the Service Worker, False to allow it.

        Returns:
            Command: command for NetworkMethod.SET_BYPASS_SERVICE_WORKER
                with ``bypass`` set.
        """
        return Command(
            method=NetworkMethod.SET_BYPASS_SERVICE_WORKER,
            params=SetBypassServiceWorkerParams(bypass=bypass),
        )

    @staticmethod
    def get_certificate(origin: str) -> GetCertificateCommand:
        """
        Build the command that requests certificate data for an origin.

        Args:
            origin: Origin whose certificate should be inspected.

        Returns:
            Command: command for NetworkMethod.GET_CERTIFICATE with
                ``origin`` set.
        """
        return Command(
            method=NetworkMethod.GET_CERTIFICATE,
            params=GetCertificateParams(origin=origin),
        )

    @staticmethod
    def get_response_body_for_interception(
        interception_id: str,
    ) -> GetResponseBodyForInterceptionCommand:
        """
        Build the command that fetches the body of an intercepted response.

        Args:
            interception_id: Identifier of the intercepted request.

        Returns:
            Command: command for
                NetworkMethod.GET_RESPONSE_BODY_FOR_INTERCEPTION with
                ``interceptionId`` set.

        Note: meant to be used while request interception is enabled.
        """
        return Command(
            method=NetworkMethod.GET_RESPONSE_BODY_FOR_INTERCEPTION,
            params=GetResponseBodyForInterceptionParams(interceptionId=interception_id),
        )

    @staticmethod
    def set_accepted_encodings(
        encodings: list[ContentEncoding],
    ) -> SetAcceptedEncodingsCommand:
        """
        Build the command that sets the accepted content encodings.

        Args:
            encodings: Accepted encoding methods (gzip, deflate, br, etc.);
                forwarded unchanged under the ``encodings`` key.

        Returns:
            Command: command for NetworkMethod.SET_ACCEPTED_ENCODINGS.
        """
        return Command(
            method=NetworkMethod.SET_ACCEPTED_ENCODINGS,
            params=SetAcceptedEncodingsParams(encodings=encodings),
        )

    @staticmethod
    def set_attach_debug_stack(enabled: bool) -> SetAttachDebugStackCommand:
        """
        Build the command that toggles debug-stack attachment on requests.

        Mainly a development/debugging aid for tracing where a request
        originated.

        Args:
            enabled: True to attach debug info, False to stop attaching it.

        Returns:
            Command: command for NetworkMethod.SET_ATTACH_DEBUG_STACK with
                ``enabled`` set.
        """
        return Command(
            method=NetworkMethod.SET_ATTACH_DEBUG_STACK,
            params=SetAttachDebugStackParams(enabled=enabled),
        )

    @staticmethod
    def set_cookie_controls(
        enable_third_party_cookie_restriction: bool,
        disable_third_party_cookie_metadata: Optional[bool] = None,
        disable_third_party_cookie_heuristics: Optional[bool] = None,
    ) -> SetCookieControlsCommand:
        """
        Build the command that configures third-party cookie handling.

        The restriction flag is always sent; the two ``disable_*`` flags
        are attached only when they are not None.

        Args:
            enable_third_party_cookie_restriction: Whether third-party
                cookie restriction is enabled.
            disable_third_party_cookie_metadata: Whether third-party cookie
                metadata is disabled.
            disable_third_party_cookie_heuristics: Whether third-party
                cookie heuristics are disabled.

        Returns:
            Command: command for NetworkMethod.SET_COOKIE_CONTROLS.
        """
        controls = SetCookieControlsParams(
            enableThirdPartyCookieRestriction=enable_third_party_cookie_restriction
        )

        if disable_third_party_cookie_metadata is not None:
            controls['disableThirdPartyCookieMetadata'] = disable_third_party_cookie_metadata
        if disable_third_party_cookie_heuristics is not None:
            controls['disableThirdPartyCookieHeuristics'] = disable_third_party_cookie_heuristics

        return Command(method=NetworkMethod.SET_COOKIE_CONTROLS, params=controls)

    @staticmethod
    def stream_resource_content(
        request_id: str,
    ) -> StreamResourceContentCommand:
        """
        Build the command that starts streaming a request's content.

        Args:
            request_id: Identifier of the request whose content is streamed.

        Returns:
            Command: command for NetworkMethod.STREAM_RESOURCE_CONTENT with
                ``requestId`` set.
        """
        return Command(
            method=NetworkMethod.STREAM_RESOURCE_CONTENT,
            params=StreamResourceContentParams(requestId=request_id),
        )

    @staticmethod
    def take_response_body_for_interception_as_stream(
        interception_id: str,
    ) -> TakeResponseBodyForInterceptionAsStreamCommand:
        """
        Build the command that exposes an intercepted response body as a
        stream.

        Args:
            interception_id: Identifier of the intercepted response.

        Returns:
            Command: command for
                NetworkMethod.TAKE_RESPONSE_BODY_FOR_INTERCEPTION_AS_STREAM
                with ``interceptionId`` set.
        """
        stream_request = TakeResponseBodyForInterceptionAsStreamParams(
            interceptionId=interception_id
        )
        return Command(
            method=NetworkMethod.TAKE_RESPONSE_BODY_FOR_INTERCEPTION_AS_STREAM,
            params=stream_request,
        )

    @staticmethod
    def emulate_network_conditions(
        offline: bool,
        latency: float,
        download_throughput: float,
        upload_throughput: float,
        connection_type: Optional[ConnectionType] = None,
        packet_loss: Optional[float] = None,
        packet_queue_length: Optional[int] = None,
        packet_reordering: Optional[bool] = None,
    ) -> EmulateNetworkConditionsCommand:
        """
        Build the command that emulates custom network conditions.

        The first four arguments are always sent. The remaining ones are
        attached only when they are not None.

        Args:
            offline: Simulate complete network disconnection.
            latency: Minimum latency in milliseconds (round-trip time).
            download_throughput: Max download speed (bytes/sec, -1 to disable).
            upload_throughput: Max upload speed (bytes/sec, -1 to disable).
            connection_type: Network connection type (cellular, wifi, etc.).
            packet_loss: Simulated packet loss percentage (0-100).
            packet_queue_length: Simulated packet queue length.
            packet_reordering: Whether packet reordering is enabled.

        Returns:
            Command: command for NetworkMethod.EMULATE_NETWORK_CONDITIONS.
        """
        conditions = EmulateNetworkConditionsParams(
            offline=offline,
            latency=latency,
            downloadThroughput=download_throughput,
            uploadThroughput=upload_throughput,
        )

        # Fine-grained link characteristics are opt-in.
        if connection_type is not None:
            conditions['connectionType'] = connection_type
        if packet_loss is not None:
            conditions['packetLoss'] = packet_loss
        if packet_queue_length is not None:
            conditions['packetQueueLength'] = packet_queue_length
        if packet_reordering is not None:
            conditions['packetReordering'] = packet_reordering

        return Command(method=NetworkMethod.EMULATE_NETWORK_CONDITIONS, params=conditions)

    @staticmethod
    def get_security_isolation_status(
        frame_id: Optional[str] = None,
    ) -> GetSecurityIsolationStatusCommand:
        """
        Build the command that queries security isolation status.

        Args:
            frame_id: Frame to check. When None, ``frameId`` is omitted
                from the payload.

        Returns:
            Command: command for NetworkMethod.GET_SECURITY_ISOLATION_STATUS.
        """
        status_query = GetSecurityIsolationStatusParams()
        if frame_id is not None:
            status_query['frameId'] = frame_id
        return Command(
            method=NetworkMethod.GET_SECURITY_ISOLATION_STATUS,
            params=status_query,
        )

    @staticmethod
    def load_network_resource(
        url: str,
        options: LoadNetworkResourceOptions,
        frame_id: Optional[str] = None,
    ) -> LoadNetworkResourceCommand:
        """
        Build the command that loads a network resource.

        Args:
            url: URL of the resource to load.
            options: Loading configuration; forwarded unchanged.
            frame_id: Frame context for the load. When None, ``frameId``
                is omitted from the payload.

        Returns:
            Command: command for NetworkMethod.LOAD_NETWORK_RESOURCE.
        """
        resource_request = LoadNetworkResourceParams(url=url, options=options)
        if frame_id is not None:
            resource_request['frameId'] = frame_id
        return Command(method=NetworkMethod.LOAD_NETWORK_RESOURCE, params=resource_request)

    @staticmethod
    def replay_xhr(
        request_id: str,
    ) -> ReplayXHRCommand:
        """
        Build the command that replays an XHR request.

        Useful for request debugging and for re-checking an API response
        without reproducing the page interaction that triggered it.

        Args:
            request_id: Identifier of the XHR request to replay.

        Returns:
            Command: command for NetworkMethod.REPLAY_XHR with
                ``requestId`` set.
        """
        return Command(
            method=NetworkMethod.REPLAY_XHR,
            params=ReplayXHRParams(requestId=request_id),
        )


================================================
FILE: pydoll/commands/page_commands.py
================================================
from __future__ import annotations

from typing import TYPE_CHECKING, Literal, Optional

from pydoll.protocol.base import Command
from pydoll.protocol.page.methods import (
    AddCompilationCacheParams,
    AddScriptToEvaluateOnNewDocumentParams,
    CaptureScreenshotParams,
    CaptureSnapshotParams,
    CreateIsolatedWorldParams,
    EnableParams,
    GenerateTestReportParams,
    GetAdScriptAncestryIdsParams,
    GetAppIdParams,
    GetAppManifestParams,
    GetOriginTrialsParams,
    GetPermissionsPolicyStateParams,
    GetResourceContentParams,
    HandleJavaScriptDialogParams,
    NavigateParams,
    NavigateToHistoryEntryParams,
    PageMethod,
    PrintToPDFParams,
    ProduceCompilationCacheParams,
    ReloadParams,
    RemoveScriptToEvaluateOnNewDocumentParams,
    ScreencastFrameAckParams,
    SearchInResourceParams,
    SetAdBlockingEnabledParams,
    SetBypassCSPParams,
    SetDocumentContentParams,
    SetFontFamiliesParams,
    SetFontSizesParams,
    SetInterceptFileChooserDialogParams,
    SetLifecycleEventsEnabledParams,
    SetPrerenderingAllowedParams,
    SetRPHRegistrationModeParams,
    SetSPCTransactionModeParams,
    SetWebLifecycleStateParams,
    StartScreencastParams,
)
from pydoll.protocol.page.types import (
    CompilationCacheParams,
    FontFamilies,
    FontSizes,
    ScriptFontFamilies,
)

if TYPE_CHECKING:
    from pydoll.protocol.page.methods import (
        AddCompilationCacheCommand,
        AddScriptToEvaluateOnNewDocumentCommand,
        BringToFrontCommand,
        CaptureScreenshotCommand,
        CaptureSnapshotCommand,
        ClearCompilationCacheCommand,
        CloseCommand,
        CrashCommand,
        CreateIsolatedWorldCommand,
        DisableCommand,
        EnableCommand,
        GenerateTestReportCommand,
        GetAdScriptAncestryIdsCommand,
        GetAppIdCommand,
        GetAppManifestCommand,
        GetFrameTreeCommand,
        GetInstallabilityErrorsCommand,
        GetLayoutMetricsCommand,
        GetNavigationHistoryCommand,
        GetOriginTrialsCommand,
        GetPermissionsPolicyStateCommand,
        GetResourceContentCommand,
        GetResourceTreeCommand,
        HandleJavaScriptDialogCommand,
        NavigateCommand,
        NavigateToHistoryEntryCommand,
        PrintToPDFCommand,
        ProduceCompilationCacheCommand,
        ReloadCommand,
        RemoveScriptToEvaluateOnNewDocumentCommand,
        ResetNavigationHistoryCommand,
        ScreencastFrameAckCommand,
        SearchInResourceCommand,
        SetAdBlockingEnabledCommand,
        SetBypassCSPCommand,
        SetDocumentContentCommand,
        SetFontFamiliesCommand,
        SetFontSizesCommand,
        SetInterceptFileChooserDialogCommand,
        SetLifecycleEventsEnabledCommand,
        SetPrerenderingAllowedCommand,
        SetRPHRegistrationModeCommand,
        SetSPCTransactionModeCommand,
        SetWebLifecycleStateCommand,
        StartScreencastCommand,
        StopLoadingCommand,
        StopScreencastCommand,
        WaitForDebuggerCommand,
    )
    from pydoll.protocol.page.types import (
        AutoResponseMode,
        ReferrerPolicy,
        ScreencastFormat,
        ScreenshotFormat,
        TransferMode,
        TransitionType,
        Viewport,
        WebLifecycleState,
    )


class PageCommands:
    """
    This class encapsulates the page commands of the Chrome DevTools Protocol (CDP).

    CDP's Page domain allows for interacting with browser pages, including navigation,
    content manipulation, and page state monitoring. These commands provide powerful
    capabilities for web automation, testing, and debugging.

    The commands defined in this class provide functionality for:
    - Navigating to URLs and managing page history
    - Capturing screenshots and generating PDFs
    - Handling JavaScript dialogs
    - Enabling and controlling page events
    - Managing download behavior
    - Manipulating page content and state
    """

    @staticmethod
    def add_script_to_evaluate_on_new_document(
        source: str,
        world_name: Optional[str] = None,
        include_command_line_api: Optional[bool] = None,
        run_immediately: Optional[bool] = None,
    ) -> AddScriptToEvaluateOnNewDocumentCommand:
        """
        Builds the command that registers a script to run on every new document.

        Optional arguments left as None are omitted from the command parameters.

        Args:
            source (str): Source of the script evaluated when a new document is created.
            world_name (Optional[str]): When given, the script runs in an isolated world
                with this name (sent as ``worldName``).
            include_command_line_api (Optional[bool]): Whether the command line API is
                included (sent as ``includeCommandLineAPI``).
            run_immediately (Optional[bool]): Whether the script also runs immediately on
                existing contexts (sent as ``runImmediately``).

        Returns:
            AddScriptToEvaluateOnNewDocumentCommand: Command whose response carries the
                identifier of the added script.
        """
        script_params = AddScriptToEvaluateOnNewDocumentParams(source=source)
        if world_name is not None:
            script_params['worldName'] = world_name
        if include_command_line_api is not None:
            script_params['includeCommandLineAPI'] = include_command_line_api
        if run_immediately is not None:
            script_params['runImmediately'] = run_immediately

        return Command(
            method=PageMethod.ADD_SCRIPT_TO_EVALUATE_ON_NEW_DOCUMENT,
            params=script_params,
        )

    @staticmethod
    def bring_to_front() -> BringToFrontCommand:
        """
        Creates a command to bring the page to the front.

        Returns:
            BringToFrontCommand: Parameterless command for ``PageMethod.BRING_TO_FRONT``.
        """
        command: BringToFrontCommand = Command(method=PageMethod.BRING_TO_FRONT)
        return command

    @staticmethod
    def capture_screenshot(
        format: Optional[ScreenshotFormat] = None,
        quality: Optional[int] = None,
        clip: Optional[Viewport] = None,
        from_surface: Optional[bool] = None,
        capture_beyond_viewport: Optional[bool] = None,
        optimize_for_speed: Optional[bool] = None,
    ) -> CaptureScreenshotCommand:
        """
        Builds the command that captures a screenshot of the current page.

        Every argument is optional; only the ones that are not None are added to the
        command parameters.

        Args:
            format (Optional[ScreenshotFormat]): Image compression format (jpeg, png or webp).
            quality (Optional[int]): Compression quality in the range 0-100 (jpeg only).
            clip (Optional[Viewport]): Region of the page to capture.
            from_surface (Optional[bool]): Capture from the surface rather than the view.
            capture_beyond_viewport (Optional[bool]): Capture content beyond the viewport.
            optimize_for_speed (Optional[bool]): Favor speed over resulting size.

        Returns:
            CaptureScreenshotCommand: Command whose response carries base64-encoded
                image data.
        """
        shot_params = CaptureScreenshotParams()
        if format is not None:
            shot_params['format'] = format
        if quality is not None:
            shot_params['quality'] = quality
        if clip is not None:
            shot_params['clip'] = clip
        if from_surface is not None:
            shot_params['fromSurface'] = from_surface
        if capture_beyond_viewport is not None:
            shot_params['captureBeyondViewport'] = capture_beyond_viewport
        if optimize_for_speed is not None:
            shot_params['optimizeForSpeed'] = optimize_for_speed

        return Command(
            method=PageMethod.CAPTURE_SCREENSHOT,
            params=shot_params,
        )

    @staticmethod
    def close() -> CloseCommand:
        """
        Builds the command that closes the current page.

        Returns:
            CloseCommand: Parameterless command for ``PageMethod.CLOSE``.
        """
        command: CloseCommand = Command(method=PageMethod.CLOSE)
        return command

    @staticmethod
    def create_isolated_world(
        frame_id: str,
        world_name: Optional[str] = None,
        grant_universal_access: Optional[bool] = None,
    ) -> CreateIsolatedWorldCommand:
        """
        Builds the command that creates an isolated world inside a frame.

        Args:
            frame_id (str): ID of the frame that will host the isolated world.
            world_name (Optional[str]): Name reported for the world in the Execution Context.
            grant_universal_access (Optional[bool]): Whether universal access is granted
                to the isolated world.

        Returns:
            CreateIsolatedWorldCommand: Command whose response carries the execution
                context ID.
        """
        world_params = CreateIsolatedWorldParams(frameId=frame_id)
        if world_name is not None:
            world_params['worldName'] = world_name
        if grant_universal_access is not None:
            # 'grantUniveralAccess' (sic) is how the protocol itself spells this
            # parameter, so the key must not be "corrected".
            world_params['grantUniveralAccess'] = grant_universal_access

        return Command(
            method=PageMethod.CREATE_ISOLATED_WORLD,
            params=world_params,
        )

    @staticmethod
    def disable() -> DisableCommand:
        """
        Builds the command that turns off Page domain notifications.

        Returns:
            DisableCommand: Parameterless command for ``PageMethod.DISABLE``.
        """
        command: DisableCommand = Command(method=PageMethod.DISABLE)
        return command

    @staticmethod
    def enable(enable_file_chooser_opened_event: Optional[bool] = None) -> EnableCommand:
        """
        Builds the command that turns on Page domain notifications.

        The params mapping is always attached to the command, even when it is empty.

        Args:
            enable_file_chooser_opened_event (Optional[bool]): Whether the
                Page.fileChooserOpened event should be emitted. Omitted when None.

        Returns:
            EnableCommand: Command object to enable the Page domain.
        """
        enable_params = EnableParams()
        if enable_file_chooser_opened_event is not None:
            enable_params['enableFileChooserOpenedEvent'] = enable_file_chooser_opened_event

        return Command(
            method=PageMethod.ENABLE,
            params=enable_params,
        )

    @staticmethod
    def get_app_manifest(manifest_id: Optional[str] = None) -> GetAppManifestCommand:
        """
        Builds the command that fetches the manifest for the current document.

        Args:
            manifest_id (Optional[str]): Sent as ``manifestId`` when not None;
                otherwise the parameter is left out.

        Returns:
            GetAppManifestCommand: Command object with manifest information.
        """
        manifest_params = GetAppManifestParams()
        if manifest_id is not None:
            manifest_params['manifestId'] = manifest_id
        return Command(
            method=PageMethod.GET_APP_MANIFEST,
            params=manifest_params,
        )

    @staticmethod
    def get_frame_tree() -> GetFrameTreeCommand:
        """
        Builds the command that retrieves the frame tree of the current page.

        Returns:
            GetFrameTreeCommand: Parameterless command for ``PageMethod.GET_FRAME_TREE``.
        """
        command: GetFrameTreeCommand = Command(method=PageMethod.GET_FRAME_TREE)
        return command

    @staticmethod
    def get_layout_metrics() -> GetLayoutMetricsCommand:
        """
        Builds the command that retrieves layout metrics for the page.

        Returns:
            GetLayoutMetricsCommand: Parameterless command for
                ``PageMethod.GET_LAYOUT_METRICS``.
        """
        command: GetLayoutMetricsCommand = Command(method=PageMethod.GET_LAYOUT_METRICS)
        return command

    @staticmethod
    def get_navigation_history() -> GetNavigationHistoryCommand:
        """
        Builds the command that retrieves the navigation history of the current page.

        Returns:
            GetNavigationHistoryCommand: Parameterless command for
                ``PageMethod.GET_NAVIGATION_HISTORY``.
        """
        command: GetNavigationHistoryCommand = Command(method=PageMethod.GET_NAVIGATION_HISTORY)
        return command

    @staticmethod
    def handle_javascript_dialog(
        accept: bool,
        prompt_text: Optional[str] = None,
    ) -> HandleJavaScriptDialogCommand:
        """
        Builds the command that accepts or dismisses a JavaScript dialog.

        Args:
            accept (bool): True to accept the dialog, False to dismiss it.
            prompt_text (Optional[str]): Text to enter in prompt dialogs. Omitted
                from the parameters when None.

        Returns:
            HandleJavaScriptDialogCommand: Command object to handle a JavaScript dialog.
        """
        dialog_params = HandleJavaScriptDialogParams(accept=accept)
        if prompt_text is not None:
            dialog_params['promptText'] = prompt_text

        return Command(
            method=PageMethod.HANDLE_JAVASCRIPT_DIALOG,
            params=dialog_params,
        )

    @staticmethod
    def navigate(
        url: str,
        referrer: Optional[str] = None,
        transition_type: Optional[TransitionType] = None,
        frame_id: Optional[str] = None,
        referrer_policy: Optional[ReferrerPolicy] = None,
    ) -> NavigateCommand:
        """
        Builds the command that navigates to the given URL.

        Only ``url`` is always sent; each optional argument is added to the parameters
        solely when it is not None.

        Args:
            url (str): Destination URL.
            referrer (Optional[str]): Referrer URL.
            transition_type (Optional[TransitionType]): Intended transition type.
            frame_id (Optional[str]): ID of the frame to navigate.
            referrer_policy (Optional[ReferrerPolicy]): Referrer policy.

        Returns:
            NavigateCommand: Command object to navigate to a URL.
        """
        nav_params = NavigateParams(url=url)
        if referrer is not None:
            nav_params['referrer'] = referrer
        if transition_type is not None:
            nav_params['transitionType'] = transition_type
        if frame_id is not None:
            nav_params['frameId'] = frame_id
        if referrer_policy is not None:
            nav_params['referrerPolicy'] = referrer_policy

        return Command(
            method=PageMethod.NAVIGATE,
            params=nav_params,
        )

    @staticmethod
    def navigate_to_history_entry(entry_id: int) -> NavigateToHistoryEntryCommand:
        """
        Builds the command that navigates to a given history entry.

        Args:
            entry_id (int): ID of the target history entry (sent as ``entryId``).

        Returns:
            NavigateToHistoryEntryCommand: Command object to navigate to a history entry.
        """
        return Command(
            method=PageMethod.NAVIGATE_TO_HISTORY_ENTRY,
            params=NavigateToHistoryEntryParams(entryId=entry_id),
        )

    @staticmethod
    def print_to_pdf(  # noqa: PLR0912
        landscape: Optional[bool] = None,
        display_header_footer: Optional[bool] = None,
        print_background: Optional[bool] = None,
        scale: Optional[float] = None,
        paper_width: Optional[float] = None,
        paper_height: Optional[float] = None,
        margin_top: Optional[float] = None,
        margin_bottom: Optional[float] = None,
        margin_left: Optional[float] = None,
        margin_right: Optional[float] = None,
        page_ranges: Optional[str] = None,
        header_template: Optional[str] = None,
        footer_template: Optional[str] = None,
        prefer_css_page_size: Optional[bool] = None,
        transfer_mode: Optional[TransferMode] = None,
        generate_tagged_pdf: Optional[bool] = None,
        generate_document_outline: Optional[bool] = None,
    ) -> PrintToPDFCommand:
        """
        Builds the command that prints the current page to PDF.

        Every argument is optional; only the ones that are not None are added to the
        command parameters, in the order they appear in the signature.

        Args:
            landscape (Optional[bool]): Paper orientation.
            display_header_footer (Optional[bool]): Display header and footer.
            print_background (Optional[bool]): Print background graphics.
            scale (Optional[float]): Scale of the webpage rendering.
            paper_width (Optional[float]): Paper width in inches.
            paper_height (Optional[float]): Paper height in inches.
            margin_top (Optional[float]): Top margin in inches.
            margin_bottom (Optional[float]): Bottom margin in inches.
            margin_left (Optional[float]): Left margin in inches.
            margin_right (Optional[float]): Right margin in inches.
            page_ranges (Optional[str]): Paper ranges to print, e.g., '1-5, 8, 11-13'.
            header_template (Optional[str]): HTML template for the print header.
            footer_template (Optional[str]): HTML template for the print footer.
            prefer_css_page_size (Optional[bool]): Whether to prefer the page size
                defined by CSS.
            transfer_mode (Optional[TransferMode]): Transfer mode.
            generate_tagged_pdf (Optional[bool]): Sent as ``generateTaggedPDF``;
                whether to generate a tagged PDF.
            generate_document_outline (Optional[bool]): Sent as
                ``generateDocumentOutline``; whether to embed the document outline.

        Returns:
            PrintToPDFCommand: Command object to print the page to PDF.
        """
        pdf_params = PrintToPDFParams()
        if landscape is not None:
            pdf_params['landscape'] = landscape
        if display_header_footer is not None:
            pdf_params['displayHeaderFooter'] = display_header_footer
        if print_background is not None:
            pdf_params['printBackground'] = print_background
        if scale is not None:
            pdf_params['scale'] = scale
        if paper_width is not None:
            pdf_params['paperWidth'] = paper_width
        if paper_height is not None:
            pdf_params['paperHeight'] = paper_height
        if margin_top is not None:
            pdf_params['marginTop'] = margin_top
        if margin_bottom is not None:
            pdf_params['marginBottom'] = margin_bottom
        if margin_left is not None:
            pdf_params['marginLeft'] = margin_left
        if margin_right is not None:
            pdf_params['marginRight'] = margin_right
        if page_ranges is not None:
            pdf_params['pageRanges'] = page_ranges
        if header_template is not None:
            pdf_params['headerTemplate'] = header_template
        if footer_template is not None:
            pdf_params['footerTemplate'] = footer_template
        if prefer_css_page_size is not None:
            pdf_params['preferCSSPageSize'] = prefer_css_page_size
        if transfer_mode is not None:
            pdf_params['transferMode'] = transfer_mode
        if generate_tagged_pdf is not None:
            pdf_params['generateTaggedPDF'] = generate_tagged_pdf
        if generate_document_outline is not None:
            pdf_params['generateDocumentOutline'] = generate_document_outline

        return Command(
            method=PageMethod.PRINT_TO_PDF,
            params=pdf_params,
        )

    @staticmethod
    def reload(
        ignore_cache: Optional[bool] = None,
        script_to_evaluate_on_load: Optional[str] = None,
        loader_id: Optional[str] = None,
    ) -> ReloadCommand:
        """
        Builds the command that reloads the current page.

        Args:
            ignore_cache (Optional[bool]): If true, the browser cache is ignored.
            script_to_evaluate_on_load (Optional[str]): Script injected into the page
                on load.
            loader_id (Optional[str]): Sent as ``loaderId`` when not None.

        Returns:
            ReloadCommand: Command object to reload the page.
        """
        reload_params = ReloadParams()
        if ignore_cache is not None:
            reload_params['ignoreCache'] = ignore_cache
        if script_to_evaluate_on_load is not None:
            reload_params['scriptToEvaluateOnLoad'] = script_to_evaluate_on_load
        if loader_id is not None:
            reload_params['loaderId'] = loader_id

        return Command(
            method=PageMethod.RELOAD,
            params=reload_params,
        )

    @staticmethod
    def reset_navigation_history() -> ResetNavigationHistoryCommand:
        """
        Builds the command that resets the navigation history.

        Returns:
            ResetNavigationHistoryCommand: Parameterless command for
                ``PageMethod.RESET_NAVIGATION_HISTORY``.
        """
        return Command(
            method=PageMethod.RESET_NAVIGATION_HISTORY,
        )

    @staticmethod
    def remove_script_to_evaluate_on_new_document(
        identifier: str,
    ) -> RemoveScriptToEvaluateOnNewDocumentCommand:
        """
        Builds the command that removes a script previously added for new documents.

        Args:
            identifier (str): Identifier of the script to remove.

        Returns:
            RemoveScriptToEvaluateOnNewDocumentCommand: Command object to remove a script.
        """
        return Command(
            method=PageMethod.REMOVE_SCRIPT_TO_EVALUATE_ON_NEW_DOCUMENT,
            params=RemoveScriptToEvaluateOnNewDocumentParams(identifier=identifier),
        )

    @staticmethod
    def set_bypass_csp(enabled: bool) -> SetBypassCSPCommand:
        """
        Builds the command that switches page CSP bypassing on or off.

        Args:
            enabled (bool): Whether to bypass page CSP.

        Returns:
            SetBypassCSPCommand: Command object to toggle bypassing page CSP.
        """
        return Command(
            method=PageMethod.SET_BYPASS_CSP,
            params=SetBypassCSPParams(enabled=enabled),
        )

    @staticmethod
    def set_document_content(frame_id: str, html: str) -> SetDocumentContentCommand:
        """
        Builds the command that replaces the document content of a frame.

        Args:
            frame_id (str): ID of the frame whose document content is set.
            html (str): HTML content to set.

        Returns:
            SetDocumentContentCommand: Command object to set the document content.
        """
        content_params = SetDocumentContentParams(frameId=frame_id, html=html)
        return Command(
            method=PageMethod.SET_DOCUMENT_CONTENT,
            params=content_params,
        )

    @staticmethod
    def set_intercept_file_chooser_dialog(enabled: bool) -> SetInterceptFileChooserDialogCommand:
        """
        Builds the command that controls interception of file chooser dialogs.

        Args:
            enabled (bool): Whether file chooser dialogs are intercepted.

        Returns:
            SetInterceptFileChooserDialogCommand: Command object to set file chooser
                dialog interception.
        """
        return Command(
            method=PageMethod.SET_INTERCEPT_FILE_CHOOSER_DIALOG,
            params=SetInterceptFileChooserDialogParams(enabled=enabled),
        )

    @staticmethod
    def set_lifecycle_events_enabled(enabled: bool) -> SetLifecycleEventsEnabledCommand:
        """
        Builds the command that switches lifecycle events on or off.

        Args:
            enabled (bool): Whether lifecycle events are enabled.

        Returns:
            SetLifecycleEventsEnabledCommand: Command object to enable/disable
                lifecycle events.
        """
        return Command(
            method=PageMethod.SET_LIFECYCLE_EVENTS_ENABLED,
            params=SetLifecycleEventsEnabledParams(enabled=enabled),
        )

    @staticmethod
    def stop_loading() -> StopLoadingCommand:
        """
        Builds the command that stops the page from loading.

        Returns:
            StopLoadingCommand: Parameterless command for ``PageMethod.STOP_LOADING``.
        """
        command: StopLoadingCommand = Command(method=PageMethod.STOP_LOADING)
        return command

    @staticmethod
    def add_compilation_cache(url: str, data: str) -> AddCompilationCacheCommand:
        """
        Builds the command that adds a compilation cache entry.

        Experimental: This method is experimental and may be subject to change.

        Args:
            url (str): URL the compilation cache entry is added for.
            data (str): Base64-encoded data.

        Returns:
            AddCompilationCacheCommand: Command object to add a compilation cache entry.
        """
        cache_params = AddCompilationCacheParams(url=url, data=data)
        return Command(
            method=PageMethod.ADD_COMPILATION_CACHE,
            params=cache_params,
        )

    @staticmethod
    def capture_snapshot(format: Literal['mhtml'] = 'mhtml') -> CaptureSnapshotCommand:
        """
        Builds the command that captures a snapshot of the page.

        Experimental: This method is experimental and may be subject to change.

        Args:
            format (Literal['mhtml']): Snapshot format; 'mhtml' is the only accepted
                value and also the default.

        Returns:
            CaptureSnapshotCommand: Command object to capture a snapshot.
        """
        return Command(
            method=PageMethod.CAPTURE_SNAPSHOT,
            params=CaptureSnapshotParams(format=format),
        )

    @staticmethod
    def clear_compilation_cache() -> ClearCompilationCacheCommand:
        """
        Builds the command that clears the compilation cache.

        Returns:
            ClearCompilationCacheCommand: Parameterless command for
                ``PageMethod.CLEAR_COMPILATION_CACHE``.
        """
        command: ClearCompilationCacheCommand = Command(method=PageMethod.CLEAR_COMPILATION_CACHE)
        return command

    @staticmethod
    def crash() -> CrashCommand:
        """
        Builds the command that crashes the page.

        Returns:
            CrashCommand: Parameterless command for ``PageMethod.CRASH``.
        """
        command: CrashCommand = Command(method=PageMethod.CRASH)
        return command

    @staticmethod
    def generate_test_report(
        message: str,
        group: Optional[str] = None,
    ) -> GenerateTestReportCommand:
        """
        Builds the command that generates a test report.

        Experimental: This method is experimental and may be subject to change.

        Args:
            message (str): Message to be displayed in the report.
            group (Optional[str]): Group label for the report. Omitted when None.

        Returns:
            GenerateTestReportCommand: Command object to generate a test report.
        """
        report_params = GenerateTestReportParams(message=message)
        if group is not None:
            report_params['group'] = group
        return Command(
            method=PageMethod.GENERATE_TEST_REPORT,
            params=report_params,
        )

    @staticmethod
    def get_ad_script_ancestry_ids(frame_id: str) -> GetAdScriptAncestryIdsCommand:
        """
        Builds the command that retrieves the ad script ancestry IDs of a frame.

        Experimental: This method is experimental and may be subject to change.

        Args:
            frame_id (str): ID of the frame to query (sent as ``frameId``).

        Returns:
            GetAdScriptAncestryIdsCommand: Command object to get ad script ancestry IDs.
        """
        return Command(
            method=PageMethod.GET_AD_SCRIPT_ANCESTRY_IDS,
            params=GetAdScriptAncestryIdsParams(frameId=frame_id),
        )

    @staticmethod
    def get_app_id(
        app_id: Optional[str] = None,
        recommended_id: Optional[str] = None,
    ) -> GetAppIdCommand:
        """
        Builds the command that retrieves the app ID.

        Experimental: This method is experimental and may be subject to change.

        Args:
            app_id (Optional[str]): App ID for verification (sent as ``appId``).
            recommended_id (Optional[str]): Recommended app ID (sent as
                ``recommendedId``).

        Returns:
            GetAppIdCommand: Command object to get the app ID.
        """
        app_params = GetAppIdParams()
        if app_id is not None:
            app_params['appId'] = app_id
        if recommended_id is not None:
            app_params['recommendedId'] = recommended_id
        return Command(
            method=PageMethod.GET_APP_ID,
            params=app_params,
        )

    @staticmethod
    def get_installability_errors() -> GetInstallabilityErrorsCommand:
        """
        Builds the command that retrieves the installability errors.

        Returns:
            GetInstallabilityErrorsCommand: Parameterless command for
                ``PageMethod.GET_INSTALLABILITY_ERRORS``.
        """
        return Command(
            method=PageMethod.GET_INSTALLABILITY_ERRORS,
        )

    @staticmethod
    def get_origin_trials(frame_id: str) -> GetOriginTrialsCommand:
        """
        Builds the command that retrieves origin trials for a frame.

        Experimental: This method is experimental and may be subject to change.

        Args:
            frame_id (str): ID of the frame to get trials for (sent as ``frameId``).

        Returns:
            GetOriginTrialsCommand: Command object to get origin trials.
        """
        return Command(
            method=PageMethod.GET_ORIGIN_TRIALS,
            params=GetOriginTrialsParams(frameId=frame_id),
        )

    @staticmethod
    def get_permissions_policy_state(frame_id: str) -> GetPermissionsPolicyStateCommand:
        """
        Builds the command that retrieves the permissions policy state.

        Args:
            frame_id (str): Frame ID sent as the ``frameId`` parameter.

        Returns:
            GetPermissionsPolicyStateCommand: Command for
                ``PageMethod.GET_PERMISSIONS_POLICY_STATE``.
        """
        return Command(
            method=PageMethod.GET_PERMISSIONS_POLICY_STATE,
            params=GetPermissionsPolicyStateParams(frameId=frame_id),
        )

    @staticmethod
    def get_resource_content(frame_id: str, url: str) -> GetResourceContentCommand:
        """
        Builds the command that retrieves the content of a resource.

        Args:
            frame_id (str): Frame ID sent as the ``frameId`` parameter.
            url (str): Resource URL sent as the ``url`` parameter.

        Returns:
            GetResourceContentCommand: Command for ``PageMethod.GET_RESOURCE_CONTENT``.
        """
        resource_params = GetResourceContentParams(frameId=frame_id, url=url)
        return Command(
            method=PageMethod.GET_RESOURCE_CONTENT,
            params=resource_params,
        )

    @staticmethod
    def get_resource_tree() -> GetResourceTreeCommand:
        """
        Builds the command that retrieves the resource tree.

        Returns:
            GetResourceTreeCommand: Parameterless command for
                ``PageMethod.GET_RESOURCE_TREE``.
        """
        command: GetResourceTreeCommand = Command(method=PageMethod.GET_RESOURCE_TREE)
        return command

    @staticmethod
    def produce_compilation_cache(
        scripts: list[CompilationCacheParams],
    ) -> ProduceCompilationCacheCommand:
        """
        Builds the command that produces compilation cache entries.

        Args:
            scripts (list[CompilationCacheParams]): Entries sent as the ``scripts``
                parameter.

        Returns:
            ProduceCompilationCacheCommand: Command for
                ``PageMethod.PRODUCE_COMPILATION_CACHE``.
        """
        return Command(
            method=PageMethod.PRODUCE_COMPILATION_CACHE,
            params=ProduceCompilationCacheParams(scripts=scripts),
        )

    @staticmethod
    def screencast_frame_ack(session_id: int) -> ScreencastFrameAckCommand:
        """
        Builds the command that acknowledges a screencast frame.

        Args:
            session_id (int): Value sent as the ``sessionId`` parameter.

        Returns:
            ScreencastFrameAckCommand: Command for ``PageMethod.SCREENCAST_FRAME_ACK``.
        """
        return Command(
            method=PageMethod.SCREENCAST_FRAME_ACK,
            params=ScreencastFrameAckParams(sessionId=session_id),
        )

    @staticmethod
    def search_in_resource(
        frame_id: str,
        url: str,
        query: str,
        case_sensitive: Optional[bool] = None,
        is_regex: Optional[bool] = None,
    ) -> SearchInResourceCommand:
        """
        Builds the command that searches for a string in a resource.

        Args:
            frame_id (str): Frame ID sent as the ``frameId`` parameter.
            url (str): Resource URL sent as the ``url`` parameter.
            query (str): Search string sent as the ``query`` parameter.
            case_sensitive (Optional[bool]): Sent as ``caseSensitive`` when not None.
            is_regex (Optional[bool]): Sent as ``isRegex`` when not None.

        Returns:
            SearchInResourceCommand: Command for ``PageMethod.SEARCH_IN_RESOURCE``.
        """
        search_params = SearchInResourceParams(frameId=frame_id, url=url, query=query)
        if case_sensitive is not None:
            search_params['caseSensitive'] = case_sensitive
        if is_regex is not None:
            search_params['isRegex'] = is_regex
        return Command(
            method=PageMethod.SEARCH_IN_RESOURCE,
            params=search_params,
        )

    @staticmethod
    def set_ad_blocking_enabled(enabled: bool) -> SetAdBlockingEnabledCommand:
        """
        Builds the command that switches ad blocking on or off.

        Args:
            enabled (bool): Value sent as the ``enabled`` parameter.

        Returns:
            SetAdBlockingEnabledCommand: Command for ``PageMethod.SET_AD_BLOCKING_ENABLED``.
        """
        return Command(
            method=PageMethod.SET_AD_BLOCKING_ENABLED,
            params=SetAdBlockingEnabledParams(enabled=enabled),
        )

    @staticmethod
    def set_font_families(
        font_families: FontFamilies,
        for_scripts: list[ScriptFontFamilies],
    ) -> SetFontFamiliesCommand:
        """
        Builds the command that sets font families.

        Args:
            font_families (FontFamilies): Value sent as the ``fontFamilies`` parameter.
            for_scripts (list[ScriptFontFamilies]): Value sent as the ``forScripts``
                parameter.

        Returns:
            SetFontFamiliesCommand: Command for ``PageMethod.SET_FONT_FAMILIES``.
        """
        families_params = SetFontFamiliesParams(
            fontFamilies=font_families,
            forScripts=for_scripts,
        )
        return Command(
            method=PageMethod.SET_FONT_FAMILIES,
            params=families_params,
        )

    @staticmethod
    def set_font_sizes(font_sizes: FontSizes) -> SetFontSizesCommand:
        """
        Builds the command that sets font sizes.

        Args:
            font_sizes (FontSizes): Value sent as the ``fontSizes`` parameter.

        Returns:
            SetFontSizesCommand: Command for ``PageMethod.SET_FONT_SIZES``.
        """
        return Command(
            method=PageMethod.SET_FONT_SIZES,
            params=SetFontSizesParams(fontSizes=font_sizes),
        )

    @staticmethod
    def set_prerendering_allowed(is_allowed: bool) -> SetPrerenderingAllowedCommand:
        """
        Builds the command that sets whether prerendering is allowed.

        Args:
            is_allowed (bool): Value sent as the ``isAllowed`` parameter.

        Returns:
            SetPrerenderingAllowedCommand: Command for
                ``PageMethod.SET_PRERENDERING_ALLOWED``.
        """
        return Command(
            method=PageMethod.SET_PRERENDERING_ALLOWED,
            params=SetPrerenderingAllowedParams(isAllowed=is_allowed),
        )

    @staticmethod
    def set_rph_registration_mode(mode: AutoResponseMode) -> SetRPHRegistrationModeCommand:
        """
        Builds the command that sets the RPH registration mode.

        Args:
            mode (AutoResponseMode): Value sent as the ``mode`` parameter.

        Returns:
            SetRPHRegistrationModeCommand: Command for
                ``PageMethod.SET_RPH_REGISTRATION_MODE``.
        """
        return Command(
            method=PageMethod.SET_RPH_REGISTRATION_MODE,
            params=SetRPHRegistrationModeParams(mode=mode),
        )

    @staticmethod
    def set_spc_transaction_mode(mode: AutoResponseMode) -> SetSPCTransactionModeCommand:
        """
        Builds the command that sets the SPC transaction mode.

        Args:
            mode (AutoResponseMode): Value sent as the ``mode`` parameter.

        Returns:
            SetSPCTransactionModeCommand: Command for
                ``PageMethod.SET_SPC_TRANSACTION_MODE``.
        """
        return Command(
            method=PageMethod.SET_SPC_TRANSACTION_MODE,
            params=SetSPCTransactionModeParams(mode=mode),
        )

    @staticmethod
    def set_web_lifecycle_state(state: WebLifecycleState) -> SetWebLifecycleStateCommand:
        """
        Builds the command that sets the web lifecycle state.

        Args:
            state (WebLifecycleState): Value sent as the ``state`` parameter.

        Returns:
            SetWebLifecycleStateCommand: Command for
                ``PageMethod.SET_WEB_LIFECYCLE_STATE``.
        """
        return Command(
            method=PageMethod.SET_WEB_LIFECYCLE_STATE,
            params=SetWebLifecycleStateParams(state=state),
        )

    @staticmethod
    def start_screencast(
        format: ScreencastFormat,
        quality: Optional[int] = None,
        max_width: Optional[int] = None,
        max_height: Optional[int] = None,
        every_nth_frame: Optional[int] = None,
    ) -> StartScreencastCommand:
        """
        Builds the command that starts a screencast.

        ``format`` is always sent; each optional argument is added to the parameters
        only when it is not None.

        Args:
            format (ScreencastFormat): Value sent as the ``format`` parameter.
            quality (Optional[int]): Sent as ``quality`` when not None.
            max_width (Optional[int]): Sent as ``maxWidth`` when not None.
            max_height (Optional[int]): Sent as ``maxHeight`` when not None.
            every_nth_frame (Optional[int]): Sent as ``everyNthFrame`` when not None.

        Returns:
            StartScreencastCommand: Command for ``PageMethod.START_SCREENCAST``.
        """
        cast_params = StartScreencastParams(format=format)
        if quality is not None:
            cast_params['quality'] = quality
        if max_width is not None:
            cast_params['maxWidth'] = max_width
        if max_height is not None:
            cast_params['maxHeight'] = max_height
        if every_nth_frame is not None:
            cast_params['everyNthFrame'] = every_nth_frame
        return Command(
            method=PageMethod.START_SCREENCAST,
            params=cast_params,
        )

    @staticmethod
    def stop_screencast() -> StopScreencastCommand:
        """
        Builds the command that stops a screencast.

        Returns:
            StopScreencastCommand: Parameterless command for
                ``PageMethod.STOP_SCREENCAST``.
        """
        command: StopScreencastCommand = Command(method=PageMethod.STOP_SCREENCAST)
        return command

    @staticmethod
    def wait_for_debugger() -> WaitForDebuggerCommand:
        """
        Builds the command that waits for a debugger.

        Returns:
            WaitForDebuggerCommand: Parameterless command for
                ``PageMethod.WAIT_FOR_DEBUGGER``.
        """
        command: WaitForDebuggerCommand = Command(method=PageMethod.WAIT_FOR_DEBUGGER)
        return command


================================================
FILE: pydoll/commands/runtime_commands.py
================================================
from __future__ import annotations

from typing import TYPE_CHECKING, Optional

from pydoll.protocol.base import Command
from pydoll.protocol.runtime.methods import (
    AddBindingParams,
    AwaitPromiseParams,
    CallFunctionOnParams,
    CompileScriptParams,
    EvaluateParams,
    GetPropertiesParams,
    GlobalLexicalScopeNamesParams,
    QueryObjectsParams,
    ReleaseObjectGroupParams,
    ReleaseObjectParams,
    RemoveBindingParams,
    RunScriptParams,
    RuntimeMethod,
    SetAsyncCallStackDepthParams,
    SetCustomObjectFormatterEnabledParams,
    SetMaxCallStackSizeToCaptureParams,
)

if TYPE_CHECKING:
    from pydoll.protocol.runtime.methods import (
        AddBindingCommand,
        AwaitPromiseCommand,
        CallArgument,
        CallFunctionOnCommand,
        CompileScriptCommand,
        DisableCommand,
        EnableCommand,
        EvaluateCommand,
        GetPropertiesCommand,
        GlobalLexicalScopeNamesCommand,
        QueryObjectsCommand,
        ReleaseObjectCommand,
        ReleaseObjectGroupCommand,
        RemoveBindingCommand,
        RunScriptCommand,
        SerializationOptions,
        SetAsyncCallStackDepthCommand,
        SetCustomObjectFormatterEnabledCommand,
        SetMaxCallStackSizeToCaptureCommand,
    )


class RuntimeCommands:
    """
    Factory for Chrome DevTools Protocol (CDP) commands of the Runtime domain.

    Each static method assembles the parameters for a single Runtime method
    and wraps them in a ``Command``. The methods only build command objects;
    optional arguments that are left as ``None`` are not added to the
    parameters.
    """

    @staticmethod
    def add_binding(name: str, execution_context_name: Optional[str] = None) -> AddBindingCommand:
        """
        Builds the command that adds a JavaScript binding.

        Args:
            name (str): Name of the binding to add.
            execution_context_name (Optional[str]): Name of the execution context to bind
                to. Omitted from the command when None.

        Returns:
            AddBindingCommand: Command for ``RuntimeMethod.ADD_BINDING``.
        """
        payload = AddBindingParams(name=name)
        if execution_context_name is not None:
            payload['executionContextName'] = execution_context_name
        return Command(method=RuntimeMethod.ADD_BINDING, params=payload)

    @staticmethod
    def await_promise(
        promise_object_id: str,
        return_by_value: Optional[bool] = None,
        generate_preview: Optional[bool] = None,
    ) -> AwaitPromiseCommand:
        """
        Builds the command that awaits a JavaScript promise and returns its result.

        Optional arguments left as None are omitted from the command.

        Args:
            promise_object_id (str): ID of the promise to await.
            return_by_value (Optional[bool]): Whether the result is returned by value
                rather than by reference.
            generate_preview (Optional[bool]): Whether a preview is generated for the
                result.

        Returns:
            AwaitPromiseCommand: Command for ``RuntimeMethod.AWAIT_PROMISE``.
        """
        payload = AwaitPromiseParams(promiseObjectId=promise_object_id)
        if return_by_value is not None:
            payload['returnByValue'] = return_by_value
        if generate_preview is not None:
            payload['generatePreview'] = generate_preview
        return Command(method=RuntimeMethod.AWAIT_PROMISE, params=payload)

    @staticmethod
    def call_function_on(
        function_declaration: str,
        object_id: Optional[str] = None,
        arguments: Optional[list[CallArgument]] = None,
        silent: Optional[bool] = None,
        return_by_value: Optional[bool] = None,
        generate_preview: Optional[bool] = None,
        user_gesture: Optional[bool] = None,
        await_promise: Optional[bool] = None,
        execution_context_id: Optional[int] = None,
        object_group: Optional[str] = None,
        throw_on_side_effect: Optional[bool] = None,
        unique_context_id: Optional[str] = None,
        serialization_options: Optional[SerializationOptions] = None,
    ) -> CallFunctionOnCommand:
        """
        Builds the command that calls a function, given by its declaration, on an object.

        Only ``function_declaration`` is always sent; every other argument is added to
        the command solely when it is not None.

        Args:
            function_declaration (str): Declaration of the function to call.
            object_id (Optional[str]): ID of the object the function is called on.
            arguments (Optional[list[CallArgument]]): Arguments passed to the function.
            silent (Optional[bool]): Whether exceptions are silenced.
            return_by_value (Optional[bool]): Whether the result is returned by value
                rather than by reference.
            generate_preview (Optional[bool]): Whether a preview is generated for the
                result.
            user_gesture (Optional[bool]): Whether the call is treated as initiated by a
                user gesture.
            await_promise (Optional[bool]): Whether a promise result is awaited.
            execution_context_id (Optional[int]): ID of the execution context the function
                is called in.
            object_group (Optional[str]): Symbolic group name for the result.
            throw_on_side_effect (Optional[bool]): Whether to throw if a side effect cannot
                be ruled out.
            unique_context_id (Optional[str]): Unique context ID for the function call.
            serialization_options (Optional[SerializationOptions]): Serialization options
                for the result.

        Returns:
            CallFunctionOnCommand: Command for ``RuntimeMethod.CALL_FUNCTION_ON``.
        """
        payload = CallFunctionOnParams(functionDeclaration=function_declaration)

        # Call target and inputs.
        if object_id is not None:
            payload['objectId'] = object_id
        if arguments is not None:
            payload['arguments'] = arguments

        # Execution and result-shaping flags.
        if silent is not None:
            payload['silent'] = silent
        if return_by_value is not None:
            payload['returnByValue'] = return_by_value
        if generate_preview is not None:
            payload['generatePreview'] = generate_preview
        if user_gesture is not None:
            payload['userGesture'] = user_gesture
        if await_promise is not None:
            payload['awaitPromise'] = await_promise

        # Context selection and remaining options.
        if execution_context_id is not None:
            payload['executionContextId'] = execution_context_id
        if object_group is not None:
            payload['objectGroup'] = object_group
        if throw_on_side_effect is not None:
            payload['throwOnSideEffect'] = throw_on_side_effect
        if unique_context_id is not None:
            payload['uniqueContextId'] = unique_context_id
        if serialization_options is not None:
            payload['serializationOptions'] = serialization_options

        return Command(method=RuntimeMethod.CALL_FUNCTION_ON, params=payload)

    @staticmethod
    def compile_script(
        expression: str,
        source_url: str,
        persist_script: bool = False,
        execution_context_id: Optional[int] = None,
    ) -> CompileScriptCommand:
        """
        Builds the command that compiles a JavaScript expression.

        Args:
            expression (str): JavaScript expression to compile.
            source_url (str): URL of the source file for the script.
            persist_script (bool): Whether the compiled script is persisted. Always sent
                with the command (defaults to False).
            execution_context_id (Optional[int]): ID of the execution context the script is
                compiled in. Omitted from the command when None.

        Returns:
            CompileScriptCommand: Command for ``RuntimeMethod.COMPILE_SCRIPT``.
        """
        payload = CompileScriptParams(
            expression=expression,
            sourceURL=source_url,
            persistScript=persist_script,
        )
        if execution_context_id is not None:
            payload['executionContextId'] = execution_context_id
        return Command(method=RuntimeMethod.COMPILE_SCRIPT, params=payload)

    @staticmethod
    def disable() -> DisableCommand:
        """
        Builds the command that disables the runtime domain.

        Returns:
            DisableCommand: Command for ``RuntimeMethod.DISABLE``, created without
                parameters.
        """
        return Command(
            method=RuntimeMethod.DISABLE,
        )

    @staticmethod
    def enable() -> EnableCommand:
        """
        Builds the command that enables the runtime domain.

        Returns:
            EnableCommand: Command for ``RuntimeMethod.ENABLE``, created without
                parameters.
        """
        return Command(
            method=RuntimeMethod.ENABLE,
        )

    @staticmethod
    def evaluate(  # noqa: PLR0912
        expression: str,
        object_group: Optional[str] = None,
        include_command_line_api: Optional[bool] = None,
        silent: Optional[bool] = None,
        context_id: Optional[int] = None,
        return_by_value: Optional[bool] = None,
        generate_preview: Optional[bool] = None,
        user_gesture: Optional[bool] = None,
        await_promise: Optional[bool] = None,
        throw_on_side_effect: Optional[bool] = None,
        timeout: Optional[float] = None,
        disable_breaks: Optional[bool] = None,
        repl_mode: Optional[bool] = None,
        allow_unsafe_eval_blocked_by_csp: Optional[bool] = None,
        unique_context_id: Optional[str] = None,
        serialization_options: Optional[SerializationOptions] = None,
    ) -> EvaluateCommand:
        """
        Builds the command that evaluates a JavaScript expression in the global context.

        Only ``expression`` is always sent; every other argument is added to the command
        solely when it is not None.

        Args:
            expression (str): JavaScript expression to evaluate.
            object_group (Optional[str]): Symbolic group name for the result.
            include_command_line_api (Optional[bool]): Whether the command line API is
                included.
            silent (Optional[bool]): Whether exceptions are silenced.
            context_id (Optional[int]): ID of the execution context to evaluate in.
            return_by_value (Optional[bool]): Whether the result is returned by value
                rather than by reference.
            generate_preview (Optional[bool]): Whether a preview is generated for the
                result.
            user_gesture (Optional[bool]): Whether the evaluation is treated as initiated
                by a user gesture.
            await_promise (Optional[bool]): Whether a promise result is awaited.
            throw_on_side_effect (Optional[bool]): Whether to throw if a side effect cannot
                be ruled out.
            timeout (Optional[float]): Timeout in milliseconds.
            disable_breaks (Optional[bool]): Whether breakpoints are disabled during the
                evaluation.
            repl_mode (Optional[bool]): Whether to execute in REPL mode.
            allow_unsafe_eval_blocked_by_csp (Optional[bool]): Allow unsafe evaluation.
            unique_context_id (Optional[str]): Unique context ID for the evaluation.
            serialization_options (Optional[SerializationOptions]): Serialization options
                for the result.

        Returns:
            EvaluateCommand: Command for ``RuntimeMethod.EVALUATE``.
        """
        payload = EvaluateParams(expression=expression)

        # Evaluation target and environment.
        if object_group is not None:
            payload['objectGroup'] = object_group
        if include_command_line_api is not None:
            payload['includeCommandLineAPI'] = include_command_line_api
        if silent is not None:
            payload['silent'] = silent
        if context_id is not None:
            payload['contextId'] = context_id

        # Result shaping and execution behaviour.
        if return_by_value is not None:
            payload['returnByValue'] = return_by_value
        if generate_preview is not None:
            payload['generatePreview'] = generate_preview
        if user_gesture is not None:
            payload['userGesture'] = user_gesture
        if await_promise is not None:
            payload['awaitPromise'] = await_promise
        if throw_on_side_effect is not None:
            payload['throwOnSideEffect'] = throw_on_side_effect
        if timeout is not None:
            payload['timeout'] = timeout

        # Remaining switches.
        if disable_breaks is not None:
            payload['disableBreaks'] = disable_breaks
        if repl_mode is not None:
            payload['replMode'] = repl_mode
        if allow_unsafe_eval_blocked_by_csp is not None:
            payload['allowUnsafeEvalBlockedByCSP'] = allow_unsafe_eval_blocked_by_csp
        if unique_context_id is not None:
            payload['uniqueContextId'] = unique_context_id
        if serialization_options is not None:
            payload['serializationOptions'] = serialization_options

        return Command(method=RuntimeMethod.EVALUATE, params=payload)

    @staticmethod
    def get_properties(
        object_id: str,
        own_properties: Optional[bool] = None,
        accessor_properties_only: Optional[bool] = None,
        generate_preview: Optional[bool] = None,
        non_indexed_properties_only: Optional[bool] = None,
    ) -> GetPropertiesCommand:
        """
        Builds the command that gets the properties of a JavaScript object.

        Optional arguments left as None are omitted from the command.

        Args:
            object_id (str): ID of the object whose properties are requested.
            own_properties (Optional[bool]): Whether only own properties are returned.
            accessor_properties_only (Optional[bool]): Whether only accessor properties are
                returned.
            generate_preview (Optional[bool]): Whether previews are generated for property
                values.
            non_indexed_properties_only (Optional[bool]): Whether only non-indexed
                properties are returned.

        Returns:
            GetPropertiesCommand: Command for ``RuntimeMethod.GET_PROPERTIES``.
        """
        payload = GetPropertiesParams(objectId=object_id)
        if own_properties is not None:
            payload['ownProperties'] = own_properties
        if accessor_properties_only is not None:
            payload['accessorPropertiesOnly'] = accessor_properties_only
        if generate_preview is not None:
            payload['generatePreview'] = generate_preview
        if non_indexed_properties_only is not None:
            payload['nonIndexedPropertiesOnly'] = non_indexed_properties_only
        return Command(method=RuntimeMethod.GET_PROPERTIES, params=payload)

    @staticmethod
    def global_lexical_scope_names(
        execution_context_id: Optional[int] = None,
    ) -> GlobalLexicalScopeNamesCommand:
        """
        Builds the command that retrieves variable names from the global lexical scope.

        Args:
            execution_context_id (Optional[int]): ID of the execution context to read the
                scope names from. Omitted from the command when None.

        Returns:
            GlobalLexicalScopeNamesCommand: Command for
                ``RuntimeMethod.GLOBAL_LEXICAL_SCOPE_NAMES``.
        """
        payload = GlobalLexicalScopeNamesParams()
        if execution_context_id is not None:
            payload['executionContextId'] = execution_context_id
        return Command(method=RuntimeMethod.GLOBAL_LEXICAL_SCOPE_NAMES, params=payload)

    @staticmethod
    def query_objects(
        prototype_object_id: str,
        object_group: Optional[str] = None,
    ) -> QueryObjectsCommand:
        """
        Builds the command that queries objects with a given prototype.

        Args:
            prototype_object_id (str): ID of the prototype object.
            object_group (Optional[str]): Symbolic group name for the results. Omitted
                from the command when None.

        Returns:
            QueryObjectsCommand: Command for ``RuntimeMethod.QUERY_OBJECTS``.
        """
        payload = QueryObjectsParams(prototypeObjectId=prototype_object_id)
        if object_group is not None:
            payload['objectGroup'] = object_group
        return Command(method=RuntimeMethod.QUERY_OBJECTS, params=payload)

    @staticmethod
    def release_object(object_id: str) -> ReleaseObjectCommand:
        """
        Builds the command that releases a JavaScript object.

        Args:
            object_id (str): ID of the object to release.

        Returns:
            ReleaseObjectCommand: Command for ``RuntimeMethod.RELEASE_OBJECT``.
        """
        return Command(
            method=RuntimeMethod.RELEASE_OBJECT,
            params=ReleaseObjectParams(objectId=object_id),
        )

    @staticmethod
    def release_object_group(object_group: str) -> ReleaseObjectGroupCommand:
        """
        Builds the command that releases all objects in a group.

        Args:
            object_group (str): Name of the object group to release.

        Returns:
            ReleaseObjectGroupCommand: Command for ``RuntimeMethod.RELEASE_OBJECT_GROUP``.
        """
        return Command(
            method=RuntimeMethod.RELEASE_OBJECT_GROUP,
            params=ReleaseObjectGroupParams(objectGroup=object_group),
        )

    @staticmethod
    def remove_binding(name: str) -> RemoveBindingCommand:
        """
        Builds the command that removes a JavaScript binding.

        Args:
            name (str): Name of the binding to remove.

        Returns:
            RemoveBindingCommand: Command for ``RuntimeMethod.REMOVE_BINDING``.
        """
        return Command(
            method=RuntimeMethod.REMOVE_BINDING,
            params=RemoveBindingParams(name=name),
        )

    @staticmethod
    def run_script(
        script_id: str,
        execution_context_id: Optional[int] = None,
        object_group: Optional[str] = None,
        silent: Optional[bool] = None,
        include_command_line_api: Optional[bool] = None,
        return_by_value: Optional[bool] = None,
        generate_preview: Optional[bool] = None,
        await_promise: Optional[bool] = None,
    ) -> RunScriptCommand:
        """
        Builds the command that runs a compiled script.

        Only ``script_id`` is always sent; every other argument is added to the command
        solely when it is not None.

        Args:
            script_id (str): ID of the compiled script to run.
            execution_context_id (Optional[int]): ID of the execution context the script
                runs in.
            object_group (Optional[str]): Symbolic group name for the result.
            silent (Optional[bool]): Whether exceptions are silenced.
            include_command_line_api (Optional[bool]): Whether the command line API is
                included.
            return_by_value (Optional[bool]): Whether the result is returned by value
                rather than by reference.
            generate_preview (Optional[bool]): Whether a preview is generated for the
                result.
            await_promise (Optional[bool]): Whether a promise result is awaited.

        Returns:
            RunScriptCommand: Command for ``RuntimeMethod.RUN_SCRIPT``.
        """
        payload = RunScriptParams(scriptId=script_id)
        if execution_context_id is not None:
            payload['executionContextId'] = execution_context_id
        if object_group is not None:
            payload['objectGroup'] = object_group
        if silent is not None:
            payload['silent'] = silent
        if include_command_line_api is not None:
            payload['includeCommandLineAPI'] = include_command_line_api
        if return_by_value is not None:
            payload['returnByValue'] = return_by_value
        if generate_preview is not None:
            payload['generatePreview'] = generate_preview
        if await_promise is not None:
            payload['awaitPromise'] = await_promise
        return Command(method=RuntimeMethod.RUN_SCRIPT, params=payload)

    @staticmethod
    def set_async_call_stack_depth(max_depth: int) -> SetAsyncCallStackDepthCommand:
        """
        Builds the command that sets the async call stack depth.

        Args:
            max_depth (int): Maximum depth of async call stacks.

        Returns:
            SetAsyncCallStackDepthCommand: Command for
                ``RuntimeMethod.SET_ASYNC_CALL_STACK_DEPTH``.
        """
        return Command(
            method=RuntimeMethod.SET_ASYNC_CALL_STACK_DEPTH,
            params=SetAsyncCallStackDepthParams(maxDepth=max_depth),
        )

    @staticmethod
    def set_custom_object_formatter_enabled(
        enabled: bool,
    ) -> SetCustomObjectFormatterEnabledCommand:
        """
        Builds the command that enables or disables custom object formatters.

        Args:
            enabled (bool): Whether custom object formatters are enabled.

        Returns:
            SetCustomObjectFormatterEnabledCommand: Command for
                ``RuntimeMethod.SET_CUSTOM_OBJECT_FORMATTER_ENABLED``.
        """
        return Command(
            method=RuntimeMethod.SET_CUSTOM_OBJECT_FORMATTER_ENABLED,
            params=SetCustomObjectFormatterEnabledParams(enabled=enabled),
        )

    @staticmethod
    def set_max_call_stack_size_to_capture(size: int) -> SetMaxCallStackSizeToCaptureCommand:
        """
        Builds the command that sets the maximum call stack size to capture.

        Args:
            size (int): Maximum call stack size to capture.

        Returns:
            SetMaxCallStackSizeToCaptureCommand: Command for
                ``RuntimeMethod.SET_MAX_CALL_STACK_SIZE_TO_CAPTURE``.
        """
        return Command(
            method=RuntimeMethod.SET_MAX_CALL_STACK_SIZE_TO_CAPTURE,
            params=SetMaxCallStackSizeToCaptureParams(size=size),
        )


================================================
FILE: pydoll/commands/storage_commands.py
================================================
from __future__ import annotations

from typing import TYPE_CHECKING, Optional

from pydoll.protocol.base import Command
from pydoll.protocol.storage.methods import (
    ClearCookiesParams,
    ClearDataForOriginParams,
    ClearDataForStorageKeyParams,
    ClearSharedStorageEntriesParams,
    ClearTrustTokensParams,
    DeleteSharedStorageEntryParams,
    DeleteStorageBucketParams,
    GetAffectedUrlsForThirdPartyCookieMetadataParams,
    GetCookiesParams,
    GetInterestGroupDetailsParams,
    GetSharedStorageEntriesParams,
    GetSharedStorageMetadataParams,
    GetStorageKeyForFrameParams,
    GetUsageAndQuotaParams,
    OverrideQuotaForOriginParams,
    ResetSharedStorageBudgetParams,
    SetAttributionReportingLocalTestingModeParams,
    SetAttributionReportingTrackingParams,
    SetCookiesParams,
    SetInterestGroupAuctionTrackingParams,
    SetInterestGroupTrackingParams,
    SetProtectedAudienceKAnonymityParams,
    SetSharedStorageEntryParams,
    SetSharedStorageTrackingParams,
    SetStorageBucketTrackingParams,
    StorageMethod,
    TrackCacheStorageForOriginParams,
    TrackCacheStorageForStorageKeyParams,
    TrackIndexedDBForOriginParams,
    TrackIndexedDBForStorageKeyParams,
    UntrackCacheStorageForOriginParams,
    UntrackCacheStorageForStorageKeyParams,
    UntrackIndexedDBForOriginParams,
    UntrackIndexedDBForStorageKeyParams,
)

if TYPE_CHECKING:
    from pydoll.protocol.network.types import CookieParam
    from pydoll.protocol.storage.methods import (
        ClearCookiesCommand,
        ClearDataForOriginCommand,
        ClearDataForStorageKeyCommand,
        ClearSharedStorageEntriesCommand,
        ClearTrustTokensCommand,
        DeleteSharedStorageEntryCommand,
        DeleteStorageBucketCommand,
        GetAffectedUrlsForThirdPartyCookieMetadataCommand,
        GetCookiesCommand,
        GetInterestGroupDetailsCommand,
        GetRelatedWebsiteSetsCommand,
        GetSharedStorageEntriesCommand,
        GetSharedStorageMetadataCommand,
        GetStorageKeyForFrameCommand,
        GetTrustTokensCommand,
        GetUsageAndQuotaCommand,
        OverrideQuotaForOriginCommand,
        ResetSharedStorageBudgetCommand,
        RunBounceTrackingMitigationsCommand,
        SendPendingAttributionReportsCommand,
        SetAttributionReportingLocalTestingModeCommand,
        SetAttributionReportingTrackingCommand,
        SetCookiesCommand,
        SetInterestGroupAuctionTrackingCommand,
        SetInterestGroupTrackingCommand,
        SetProtectedAudienceKAnonymityCommand,
        SetSharedStorageEntryCommand,
        SetSharedStorageTrackingCommand,
        SetStorageBucketTrackingCommand,
        TrackCacheStorageForOriginCommand,
        TrackCacheStorageForStorageKeyCommand,
        TrackIndexedDBForOriginCommand,
        TrackIndexedDBForStorageKeyCommand,
        UntrackCacheStorageForOriginCommand,
        UntrackCacheStorageForStorageKeyCommand,
        UntrackIndexedDBForOriginCommand,
        UntrackIndexedDBForStorageKeyCommand,
    )
    from pydoll.protocol.storage.types import StorageBucket


class StorageCommands:  # noqa: PLR0904
    """
    A class for interacting with browser storage using Chrome DevTools Protocol (CDP).

    The Storage domain of CDP allows managing various types of browser storage, including:
    - Cookies
    - Cache Storage
    - IndexedDB
    - Web Storage (localStorage/sessionStorage)
    - Shared Storage
    - Storage Buckets
    - Trust Tokens
    - Interest Groups
    - Attribution Reporting

    This class provides static methods that generate CDP commands to manage these types
    of storage without the need for traditional webdrivers.
    """

    @staticmethod
    def clear_cookies(browser_context_id: Optional[str] = None) -> ClearCookiesCommand:
        """
        Builds the command that clears all browser cookies.

        Args:
            browser_context_id: Optional browser context ID, useful when several
                contexts are in play (e.g., multiple windows or tabs). It is left
                out of the command when None.

        Returns:
            ClearCookiesCommand: Command for ``StorageMethod.CLEAR_COOKIES``.
        """
        payload = ClearCookiesParams()
        if browser_context_id is not None:
            payload['browserContextId'] = browser_context_id
        return Command(method=StorageMethod.CLEAR_COOKIES, params=payload)

    @staticmethod
    def clear_data_for_origin(origin: str, storage_types: str) -> ClearDataForOriginCommand:
        """
        Builds the command that clears storage data for one origin.

        Args:
            origin: Security origin (e.g., "https://example.com").
            storage_types: Comma-separated list of the storage types to clear, such as
                "cookies", "local_storage", "indexeddb" or "cache_storage"; "all"
                clears every type.

        Returns:
            ClearDataForOriginCommand: Command for ``StorageMethod.CLEAR_DATA_FOR_ORIGIN``.
        """
        return Command(
            method=StorageMethod.CLEAR_DATA_FOR_ORIGIN,
            params=ClearDataForOriginParams(origin=origin, storageTypes=storage_types),
        )

    @staticmethod
    def clear_data_for_storage_key(
        storage_key: str, storage_types: str
    ) -> ClearDataForStorageKeyCommand:
        """
        Builds the command that clears data for one storage key.

        Args:
            storage_key: Storage key whose data is cleared. A storage key is a more
                specific identifier than an origin and may include partition
                isolation.
            storage_types: Comma-separated list of the storage types to clear, such as
                "cookies", "local_storage", "indexeddb" or "cache_storage"; "all"
                clears every type.

        Returns:
            ClearDataForStorageKeyCommand: Command for
                ``StorageMethod.CLEAR_DATA_FOR_STORAGE_KEY``.
        """
        return Command(
            method=StorageMethod.CLEAR_DATA_FOR_STORAGE_KEY,
            params=ClearDataForStorageKeyParams(
                storageKey=storage_key, storageTypes=storage_types
            ),
        )

    @staticmethod
    def get_cookies(browser_context_id: Optional[str] = None) -> GetCookiesCommand:
        """
        Builds the command that gets all browser cookies.

        Args:
            browser_context_id: Optional browser context ID, useful when several
                contexts are in play (e.g., multiple windows or tabs). It is left
                out of the command when None.

        Returns:
            GetCookiesCommand: Command for ``StorageMethod.GET_COOKIES``, whose response
                is an array of Cookie objects.
        """
        payload = GetCookiesParams()
        if browser_context_id is not None:
            payload['browserContextId'] = browser_context_id
        return Command(method=StorageMethod.GET_COOKIES, params=payload)

    @staticmethod
    def get_storage_key_for_frame(frame_id: str) -> GetStorageKeyForFrameCommand:
        """
        Builds the command that gets the storage key of a frame.

        Storage keys isolate data between different origins or partitions in the
        browser.

        Args:
            frame_id: ID of the frame whose storage key is requested.

        Returns:
            GetStorageKeyForFrameCommand: Command for
                ``StorageMethod.GET_STORAGE_KEY_FOR_FRAME``.
        """
        return Command(
            method=StorageMethod.GET_STORAGE_KEY_FOR_FRAME,
            params=GetStorageKeyForFrameParams(frameId=frame_id),
        )

    @staticmethod
    def get_usage_and_quota(origin: str) -> GetUsageAndQuotaCommand:
        """
        Builds the command that gets storage usage and quota information for an origin.

        Handy for monitoring or debugging how much storage a site consumes.

        Args:
            origin: Security origin (e.g., "https://example.com") to get information for.

        Returns:
            GetUsageAndQuotaCommand: Command for ``StorageMethod.GET_USAGE_AND_QUOTA``.
                Its response reports:
                - usage: Storage usage in bytes
                - quota: Storage quota in bytes
                - usageBreakdown: Breakdown of usage by storage type
                - overrideActive: Whether there is an active quota override
        """
        return Command(
            method=StorageMethod.GET_USAGE_AND_QUOTA,
            params=GetUsageAndQuotaParams(origin=origin),
        )

    @staticmethod
    def set_cookies(
        cookies: list[CookieParam], browser_context_id: Optional[str] = None
    ) -> SetCookiesCommand:
        """
        Builds the command that sets browser cookies.

        Args:
            cookies: List of the cookie objects to set.
            browser_context_id: Optional browser context ID, useful when several
                contexts are in play (e.g., multiple windows or tabs). It is left
                out of the command when None.

        Returns:
            SetCookiesCommand: Command for ``StorageMethod.SET_COOKIES``.
        """
        payload = SetCookiesParams(cookies=cookies)
        if browser_context_id is not None:
            payload['browserContextId'] = browser_context_id
        return Command(method=StorageMethod.SET_COOKIES, params=payload)

    @staticmethod
    def set_protected_audience_k_anonymity(
        owner: str, name: str, hashes: list[str]
    ) -> SetProtectedAudienceKAnonymityCommand:
        """
        Builds the command that sets K-anonymity for protected audience.

        The command configures anonymity in privacy-preserving advertising systems
        (part of Google's Privacy Sandbox).

        Args:
            owner: Owner of the K-anonymity configuration.
            name: Name of the K-anonymity configuration.
            hashes: List of hashes for the configuration.

        Returns:
            SetProtectedAudienceKAnonymityCommand: Command for
                ``StorageMethod.SET_PROTECTED_AUDIENCE_K_ANONYMITY``.
        """
        return Command(
            method=StorageMethod.SET_PROTECTED_AUDIENCE_K_ANONYMITY,
            params=SetProtectedAudienceKAnonymityParams(owner=owner, name=name, hashes=hashes),
        )

    @staticmethod
    def track_cache_storage_for_origin(origin: str) -> TrackCacheStorageForOriginCommand:
        """
        Builds the command that registers an origin for notifications about changes
        to its Cache Storage.

        Cache Storage is primarily used by Service Workers to keep resources for
        offline use.

        Args:
            origin: Security origin (e.g., "https://example.com") to monitor.

        Returns:
            TrackCacheStorageForOriginCommand: Command for
                ``StorageMethod.TRACK_CACHE_STORAGE_FOR_ORIGIN``.
        """
        return Command(
            method=StorageMethod.TRACK_CACHE_STORAGE_FOR_ORIGIN,
            params=TrackCacheStorageForOriginParams(origin=origin),
        )

    @staticmethod
    def track_cache_storage_for_storage_key(
        storage_key: str,
    ) -> TrackCacheStorageForStorageKeyCommand:
        """
        Builds the command that registers a storage key for notifications about
        changes to its Cache Storage.

        Counterpart of track_cache_storage_for_origin that takes a storage key, which
        gives more precise isolation.

        Args:
            storage_key: Storage key to monitor.

        Returns:
            TrackCacheStorageForStorageKeyCommand: Command for
                ``StorageMethod.TRACK_CACHE_STORAGE_FOR_STORAGE_KEY``.
        """
        return Command(
            method=StorageMethod.TRACK_CACHE_STORAGE_FOR_STORAGE_KEY,
            params=TrackCacheStorageForStorageKeyParams(storageKey=storage_key),
        )

    @staticmethod
    def track_indexed_db_for_origin(origin: str) -> TrackIndexedDBForOriginCommand:
        """
        Builds the command that registers an origin for notifications about changes
        to its IndexedDB.

        IndexedDB is a NoSQL database system in the browser for storing large amounts
        of structured data.

        Args:
            origin: Security origin (e.g., "https://example.com") to monitor.

        Returns:
            TrackIndexedDBForOriginCommand: Command for
                ``StorageMethod.TRACK_INDEXED_DB_FOR_ORIGIN``.
        """
        return Command(
            method=StorageMethod.TRACK_INDEXED_DB_FOR_ORIGIN,
            params=TrackIndexedDBForOriginParams(origin=origin),
        )

    @staticmethod
    def track_indexed_db_for_storage_key(storage_key: str) -> TrackIndexedDBForStorageKeyCommand:
        """
        Builds the command that starts IndexedDB change notifications for a storage key.

        This is the storage-key counterpart of track_indexed_db_for_origin.

        Args:
            storage_key: The storage key whose IndexedDB should be monitored.

        Returns:
            TrackIndexedDBForStorageKeyCommand: A CDP command whose params carry the
                key as ``storageKey``.
        """
        return Command(
            method=StorageMethod.TRACK_INDEXED_DB_FOR_STORAGE_KEY,
            params=TrackIndexedDBForStorageKeyParams(storageKey=storage_key),
        )

    @staticmethod
    def untrack_cache_storage_for_origin(origin: str) -> UntrackCacheStorageForOriginCommand:
        """
        Builds the command that stops Cache Storage change notifications for an origin.

        This is the inverse of track_cache_storage_for_origin.

        Args:
            origin: The security origin (e.g., "https://example.com") to stop monitoring.

        Returns:
            UntrackCacheStorageForOriginCommand: A CDP command whose params carry the
                given origin.
        """
        return Command(
            method=StorageMethod.UNTRACK_CACHE_STORAGE_FOR_ORIGIN,
            params=UntrackCacheStorageForOriginParams(origin=origin),
        )

    @staticmethod
    def untrack_cache_storage_for_storage_key(
        storage_key: str,
    ) -> UntrackCacheStorageForStorageKeyCommand:
        """
        Builds the command that stops Cache Storage change notifications for a storage key.

        This is the inverse of track_cache_storage_for_storage_key.

        Args:
            storage_key: The storage key to stop monitoring.

        Returns:
            UntrackCacheStorageForStorageKeyCommand: A CDP command whose params carry the
                key as ``storageKey``.
        """
        return Command(
            method=StorageMethod.UNTRACK_CACHE_STORAGE_FOR_STORAGE_KEY,
            params=UntrackCacheStorageForStorageKeyParams(storageKey=storage_key),
        )

    @staticmethod
    def untrack_indexed_db_for_origin(origin: str) -> UntrackIndexedDBForOriginCommand:
        """
        Builds the command that stops IndexedDB change notifications for an origin.

        This is the inverse of track_indexed_db_for_origin.

        Args:
            origin: The security origin (e.g., "https://example.com") to stop monitoring.

        Returns:
            UntrackIndexedDBForOriginCommand: A CDP command whose params carry the
                given origin.
        """
        return Command(
            method=StorageMethod.UNTRACK_INDEXED_DB_FOR_ORIGIN,
            params=UntrackIndexedDBForOriginParams(origin=origin),
        )

    @staticmethod
    def untrack_indexed_db_for_storage_key(
        storage_key: str,
    ) -> UntrackIndexedDBForStorageKeyCommand:
        """
        Builds the command that stops IndexedDB change notifications for a storage key.

        This is the inverse of track_indexed_db_for_storage_key.

        Args:
            storage_key: The storage key to stop monitoring.

        Returns:
            UntrackIndexedDBForStorageKeyCommand: A CDP command whose params carry the
                key as ``storageKey``.
        """
        return Command(
            method=StorageMethod.UNTRACK_INDEXED_DB_FOR_STORAGE_KEY,
            params=UntrackIndexedDBForStorageKeyParams(storageKey=storage_key),
        )

    @staticmethod
    def clear_shared_storage_entries(owner_origin: str) -> ClearSharedStorageEntriesCommand:
        """
        Builds the command that clears every Shared Storage entry of one origin.

        Args:
            owner_origin: The owner origin of the Shared Storage to clear.

        Returns:
            ClearSharedStorageEntriesCommand: A CDP command whose params carry the
                origin as ``ownerOrigin``.
        """
        return Command(
            method=StorageMethod.CLEAR_SHARED_STORAGE_ENTRIES,
            params=ClearSharedStorageEntriesParams(ownerOrigin=owner_origin),
        )

    @staticmethod
    def clear_trust_tokens(issuer_origin: str) -> ClearTrustTokensCommand:
        """
        Builds the command that removes all Trust Tokens issued by the given origin.

        Other stored data, including the issuer's redemption records, is meant to be
        left intact by this command.

        Args:
            issuer_origin: The issuer origin of the tokens to remove.

        Returns:
            ClearTrustTokensCommand: A CDP command whose params carry the origin as
                ``issuerOrigin``. Its response is expected to include:
                - didDeleteTokens: True if any tokens were deleted, False otherwise.
        """
        return Command(
            method=StorageMethod.CLEAR_TRUST_TOKENS,
            params=ClearTrustTokensParams(issuerOrigin=issuer_origin),
        )

    @staticmethod
    def delete_shared_storage_entry(owner_origin: str, key: str) -> DeleteSharedStorageEntryCommand:
        """
        Builds the command that deletes a single Shared Storage entry.

        Args:
            owner_origin: The owner origin of the Shared Storage.
            key: The key of the entry to delete.

        Returns:
            DeleteSharedStorageEntryCommand: A CDP command whose params carry
                ``ownerOrigin`` and ``key``.
        """
        return Command(
            method=StorageMethod.DELETE_SHARED_STORAGE_ENTRY,
            params=DeleteSharedStorageEntryParams(ownerOrigin=owner_origin, key=key),
        )

    @staticmethod
    def delete_storage_bucket(bucket: StorageBucket) -> DeleteStorageBucketCommand:
        """
        Builds the command that deletes a Storage Bucket.

        Args:
            bucket: A StorageBucket object identifying the bucket to delete (per the
                original documentation it holds the storageKey and name). It is passed
                through unchanged as the ``bucket`` param.

        Returns:
            DeleteStorageBucketCommand: The CDP command to delete the Storage Bucket.
        """
        return Command(
            method=StorageMethod.DELETE_STORAGE_BUCKET,
            params=DeleteStorageBucketParams(bucket=bucket),
        )

    @staticmethod
    def get_affected_urls_for_third_party_cookie_metadata(
        first_party_url: str, third_party_urls: list[str]
    ) -> GetAffectedUrlsForThirdPartyCookieMetadataCommand:
        """
        Builds the command that lists URLs of a page and its embedded resources which
        match existing grace period URL pattern rules.

        Args:
            first_party_url: The URL of the page being visited (first-party).
            third_party_urls: List of embedded third-party resource URLs. The parameter
                has no default, so a list must always be supplied.

        Returns:
            GetAffectedUrlsForThirdPartyCookieMetadataCommand: A CDP command whose params
                carry ``firstPartyUrl`` and ``thirdPartyUrls``.
        """
        return Command(
            method=StorageMethod.GET_AFFECTED_URLS_FOR_THIRD_PARTY_COOKIE_METADATA,
            params=GetAffectedUrlsForThirdPartyCookieMetadataParams(
                firstPartyUrl=first_party_url,
                thirdPartyUrls=third_party_urls,
            ),
        )

    @staticmethod
    def get_interest_group_details(owner_origin: str, name: str) -> GetInterestGroupDetailsCommand:
        """
        Builds the command that fetches the details of one interest group.

        Args:
            owner_origin: The owner origin of the interest group.
            name: The name of the interest group.

        Returns:
            GetInterestGroupDetailsCommand: A CDP command whose params carry
                ``ownerOrigin`` and ``name``.
        """
        return Command(
            method=StorageMethod.GET_INTEREST_GROUP_DETAILS,
            params=GetInterestGroupDetailsParams(ownerOrigin=owner_origin, name=name),
        )

    @staticmethod
    def get_related_website_sets() -> GetRelatedWebsiteSetsCommand:
        """
        Builds the command that retrieves the related website sets.

        The command is created with a method only; no ``params`` entry is supplied.

        Returns:
            GetRelatedWebsiteSetsCommand: The CDP command to get related website sets.
        """
        return Command(
            method=StorageMethod.GET_RELATED_WEBSITE_SETS,
        )

    @staticmethod
    def get_shared_storage_entries(owner_origin: str) -> GetSharedStorageEntriesCommand:
        """
        Builds the command that fetches all Shared Storage entries of an origin.

        Args:
            owner_origin: The owner origin of the Shared Storage.

        Returns:
            GetSharedStorageEntriesCommand: A CDP command whose params carry the
                origin as ``ownerOrigin``.
        """
        return Command(
            method=StorageMethod.GET_SHARED_STORAGE_ENTRIES,
            params=GetSharedStorageEntriesParams(ownerOrigin=owner_origin),
        )

    @staticmethod
    def get_shared_storage_metadata(owner_origin: str) -> GetSharedStorageMetadataCommand:
        """
        Builds the command that fetches the Shared Storage metadata of an origin.

        Args:
            owner_origin: The owner origin of the Shared Storage.

        Returns:
            GetSharedStorageMetadataCommand: A CDP command whose params carry the
                origin as ``ownerOrigin``.
        """
        return Command(
            method=StorageMethod.GET_SHARED_STORAGE_METADATA,
            params=GetSharedStorageMetadataParams(ownerOrigin=owner_origin),
        )

    @staticmethod
    def get_trust_tokens() -> GetTrustTokensCommand:
        """
        Builds the command that retrieves all available Trust Tokens.

        The command is sent with an empty params mapping.

        Returns:
            GetTrustTokensCommand: The CDP command to get Trust Tokens; its response is
                expected to list pairs of issuer origin and available token count.
        """
        return Command(
            method=StorageMethod.GET_TRUST_TOKENS,
            params={},
        )

    @staticmethod
    def override_quota_for_origin(
        origin: str, quota_size: Optional[float] = None
    ) -> OverrideQuotaForOriginCommand:
        """
        Builds the command that overrides the storage quota of a specific origin.

        Args:
            origin: The origin for which to override the quota.
            quota_size: The size of the new quota in bytes. When None, ``quotaSize`` is
                left out of the params; per the original documentation this removes
                any existing override.

        Returns:
            OverrideQuotaForOriginCommand: The CDP command to override the origin's quota.
        """
        quota_params = OverrideQuotaForOriginParams(origin=origin)
        # Only send quotaSize when the caller supplied a value.
        if quota_size is not None:
            quota_params['quotaSize'] = quota_size
        return Command(
            method=StorageMethod.OVERRIDE_QUOTA_FOR_ORIGIN,
            params=quota_params,
        )

    @staticmethod
    def reset_shared_storage_budget(owner_origin: str) -> ResetSharedStorageBudgetCommand:
        """
        Builds the command that resets the Shared Storage budget of an origin.

        Args:
            owner_origin: The owner origin of the Shared Storage.

        Returns:
            ResetSharedStorageBudgetCommand: A CDP command whose params carry the
                origin as ``ownerOrigin``.
        """
        return Command(
            method=StorageMethod.RESET_SHARED_STORAGE_BUDGET,
            params=ResetSharedStorageBudgetParams(ownerOrigin=owner_origin),
        )

    @staticmethod
    def run_bounce_tracking_mitigations() -> RunBounceTrackingMitigationsCommand:
        """
        Builds the command that runs the bounce tracking mitigations.

        The command is sent with an empty params mapping.

        Returns:
            RunBounceTrackingMitigationsCommand: The CDP command to run bounce tracking
                mitigations.
        """
        return Command(
            method=StorageMethod.RUN_BOUNCE_TRACKING_MITIGATIONS,
            params={},
        )

    @staticmethod
    def send_pending_attribution_reports() -> SendPendingAttributionReportsCommand:
        """
        Builds the command that sends the pending Attribution Reporting reports.

        The command is sent with an empty params mapping.

        Returns:
            SendPendingAttributionReportsCommand: The CDP command to send pending
                attribution reports.
        """
        return Command(
            method=StorageMethod.SEND_PENDING_ATTRIBUTION_REPORTS,
            params={},
        )

    @staticmethod
    def set_attribution_reporting_local_testing_mode(
        enabled: bool,
    ) -> SetAttributionReportingLocalTestingModeCommand:
        """
        Builds the command that toggles local testing mode for Attribution Reporting.

        Args:
            enabled: True to enable local testing mode, False to disable it.

        Returns:
            SetAttributionReportingLocalTestingModeCommand: A CDP command whose params
                carry the flag as ``enabled``.
        """
        return Command(
            method=StorageMethod.SET_ATTRIBUTION_REPORTING_LOCAL_TESTING_MODE,
            params=SetAttributionReportingLocalTestingModeParams(enabled=enabled),
        )

    @staticmethod
    def set_attribution_reporting_tracking(enable: bool) -> SetAttributionReportingTrackingCommand:
        """
        Builds the command that toggles Attribution Reporting tracking.

        Args:
            enable: True to enable tracking, False to disable it.

        Returns:
            SetAttributionReportingTrackingCommand: A CDP command whose params carry
                the flag as ``enable``.
        """
        return Command(
            method=StorageMethod.SET_ATTRIBUTION_REPORTING_TRACKING,
            params=SetAttributionReportingTrackingParams(enable=enable),
        )

    @staticmethod
    def set_interest_group_auction_tracking(enable: bool) -> SetInterestGroupAuctionTrackingCommand:
        """
        Builds the command that toggles interest group auction tracking.

        Args:
            enable: True to enable tracking, False to disable it.

        Returns:
            SetInterestGroupAuctionTrackingCommand: A CDP command whose params carry
                the flag as ``enable``.
        """
        return Command(
            method=StorageMethod.SET_INTEREST_GROUP_AUCTION_TRACKING,
            params=SetInterestGroupAuctionTrackingParams(enable=enable),
        )

    @staticmethod
    def set_interest_group_tracking(enable: bool) -> SetInterestGroupTrackingCommand:
        """
        Builds the command that toggles interest group tracking.

        Args:
            enable: True to enable tracking, False to disable it.

        Returns:
            SetInterestGroupTrackingCommand: A CDP command whose params carry the flag
                as ``enable``.
        """
        return Command(
            method=StorageMethod.SET_INTEREST_GROUP_TRACKING,
            params=SetInterestGroupTrackingParams(enable=enable),
        )

    @staticmethod
    def set_shared_storage_entry(
        owner_origin: str, key: str, value: str, ignore_if_present: Optional[bool] = None
    ) -> SetSharedStorageEntryCommand:
        """
        Builds the command that writes one entry into Shared Storage.

        Args:
            owner_origin: The owner origin of the Shared Storage.
            key: The key of the entry to set.
            value: The value of the entry to set.
            ignore_if_present: If True, an existing entry with the same key is not
                replaced. When None, ``ignoreIfPresent`` is left out of the params.

        Returns:
            SetSharedStorageEntryCommand: The CDP command to set a Shared Storage entry.
        """
        entry_params = SetSharedStorageEntryParams(
            ownerOrigin=owner_origin,
            key=key,
            value=value,
        )
        # The flag is optional on the wire; send it only when explicitly given.
        if ignore_if_present is not None:
            entry_params['ignoreIfPresent'] = ignore_if_present
        return Command(
            method=StorageMethod.SET_SHARED_STORAGE_ENTRY,
            params=entry_params,
        )

    @staticmethod
    def set_shared_storage_tracking(enable: bool) -> SetSharedStorageTrackingCommand:
        """
        Builds the command that toggles Shared Storage tracking.

        Args:
            enable: True to enable tracking, False to disable it.

        Returns:
            SetSharedStorageTrackingCommand: A CDP command whose params carry the flag
                as ``enable``.
        """
        return Command(
            method=StorageMethod.SET_SHARED_STORAGE_TRACKING,
            params=SetSharedStorageTrackingParams(enable=enable),
        )

    @staticmethod
    def set_storage_bucket_tracking(
        storage_key: str, enable: bool
    ) -> SetStorageBucketTrackingCommand:
        """
        Builds the command that toggles Storage Bucket tracking for a storage key.

        Args:
            storage_key: The storage key for which to set tracking.
            enable: True to enable tracking, False to disable it.

        Returns:
            SetStorageBucketTrackingCommand: A CDP command whose params carry
                ``storageKey`` and ``enable``.
        """
        return Command(
            method=StorageMethod.SET_STORAGE_BUCKET_TRACKING,
            params=SetStorageBucketTrackingParams(storageKey=storage_key, enable=enable),
        )


================================================
FILE: pydoll/commands/target_commands.py
================================================
from __future__ import annotations

from typing import TYPE_CHECKING, Optional

from pydoll.protocol.base import Command
from pydoll.protocol.target.methods import (
    ActivateTargetParams,
    AttachToBrowserTargetParams,
    AttachToTargetParams,
    CloseTargetParams,
    CreateBrowserContextParams,
    CreateTargetParams,
    DetachFromTargetParams,
    DisposeBrowserContextParams,
    GetTargetInfoParams,
    GetTargetsParams,
    SetAutoAttachParams,
    SetDiscoverTargetsParams,
    SetRemoteLocationsParams,
    TargetMethod,
)

if TYPE_CHECKING:
    from pydoll.protocol.browser.types import WindowState
    from pydoll.protocol.target.methods import (
        ActivateTargetCommand,
        AttachToBrowserTargetCommand,
        AttachToTargetCommand,
        CloseTargetCommand,
        CreateBrowserContextCommand,
        CreateTargetCommand,
        DetachFromTargetCommand,
        DisposeBrowserContextCommand,
        GetBrowserContextsCommand,
        GetTargetInfoCommand,
        GetTargetsCommand,
        SetAutoAttachCommand,
        SetDiscoverTargetsCommand,
        SetRemoteLocationsCommand,
    )
    from pydoll.protocol.target.types import RemoteLocation


class TargetCommands:
    """
    A class for managing browser targets using Chrome DevTools Protocol.

    The Target domain of CDP supports additional targets discovery and allows to attach to them.
    Targets can represent browser tabs, windows, frames, web workers, service workers, etc.
    The domain provides methods to create, discover, and control these targets.

    This class provides methods to create commands for interacting with browser targets,
    including creating, activating, attaching to, and closing targets through CDP commands.
    """

    @staticmethod
    def activate_target(target_id: str) -> ActivateTargetCommand:
        """
        Builds the command that activates (focuses) a target.

        Args:
            target_id: ID of the target to activate.

        Returns:
            ActivateTargetCommand: A CDP command whose params carry the ID as ``targetId``.
        """
        return Command(
            method=TargetMethod.ACTIVATE_TARGET,
            params=ActivateTargetParams(targetId=target_id),
        )

    @staticmethod
    def attach_to_target(target_id: str, flatten: Optional[bool] = None) -> AttachToTargetCommand:
        """
        Builds the command that attaches to the target with the given ID.

        Args:
            target_id: ID of the target to attach to.
            flatten: If true, enables "flat" access to the session via specifying the
                sessionId attribute in the commands. The original documentation
                recommends it because the non-flattened mode is being deprecated
                (see https://crbug.com/991325). When None, ``flatten`` is left out of
                the params.

        Returns:
            AttachToTargetCommand: The CDP command to attach to the target; its response
                is expected to contain a sessionId.
        """
        attach_params = AttachToTargetParams(targetId=target_id)
        # flatten is optional on the wire; include it only when explicitly given.
        if flatten is not None:
            attach_params['flatten'] = flatten
        return Command(
            method=TargetMethod.ATTACH_TO_TARGET,
            params=attach_params,
        )

    @staticmethod
    def close_target(target_id: str) -> CloseTargetCommand:
        """
        Builds the command that closes a target.

        Per the original documentation, a page or tab target is closed as if its close
        button had been clicked.

        Args:
            target_id: ID of the target to close.

        Returns:
            CloseTargetCommand: A CDP command whose params carry the ID as ``targetId``;
                its response is expected to contain a success flag.
        """
        return Command(
            method=TargetMethod.CLOSE_TARGET,
            params=CloseTargetParams(targetId=target_id),
        )

    @staticmethod
    def create_browser_context(
        dispose_on_detach: Optional[bool] = None,
        proxy_server: Optional[str] = None,
        proxy_bypass_list: Optional[str] = None,
        origins_with_universal_network_access: Optional[list[str]] = None,
    ) -> CreateBrowserContextCommand:
        """
        Builds the command that creates a new, empty browser context.

        Every argument is optional; an argument left as None is not included in the
        command params at all.

        Args:
            dispose_on_detach: If specified, the context will be disposed when the
                debugging session disconnects.
            proxy_server: Proxy server string, similar to the one passed to the
                --proxy-server command line argument
                (e.g., "socks5://192.168.1.100:1080").
            proxy_bypass_list: Proxy bypass list, similar to the one passed to the
                --proxy-bypass-list command line argument
                (e.g., "*.example.com,localhost").
            origins_with_universal_network_access: List of origins to grant unlimited
                cross-origin access to. Parts of the URL other than those constituting
                the origin are ignored.

        Returns:
            CreateBrowserContextCommand: The CDP command to create a browser context; its
                response is expected to contain the ID of the created context.
        """
        payload = CreateBrowserContextParams()

        # Lifetime of the context.
        if dispose_on_detach is not None:
            payload['disposeOnDetach'] = dispose_on_detach

        # Proxy configuration.
        if proxy_server is not None:
            payload['proxyServer'] = proxy_server
        if proxy_bypass_list is not None:
            payload['proxyBypassList'] = proxy_bypass_list

        # Cross-origin access grants.
        if origins_with_universal_network_access is not None:
            payload['originsWithUniversalNetworkAccess'] = origins_with_universal_network_access

        return Command(
            method=TargetMethod.CREATE_BROWSER_CONTEXT,
            params=payload,
        )

    @staticmethod
    def create_target(
        url: str = 'about:blank',
        left: Optional[int] = None,
        top: Optional[int] = None,
        width: Optional[int] = None,
        height: Optional[int] = None,
        window_state: Optional[WindowState] = None,
        browser_context_id: Optional[str] = None,
        enable_begin_frame_control: Optional[bool] = None,
        new_window: Optional[bool] = None,
        background: Optional[bool] = None,
        for_tab: Optional[bool] = None,
        hidden: Optional[bool] = None,
    ) -> CreateTargetCommand:
        """
        Builds the command that creates a new page (target).

        ``url`` is always sent. Every other argument is optional and is only added to
        the command params when it is not None.

        Args:
            url: The initial URL the page will navigate to. Defaults to 'about:blank'.
            left: Frame left position in device-independent pixels (DIP).
                Requires newWindow to be true or headless mode.
            top: Frame top position in DIP. Requires newWindow to be true or
                headless mode.
            width: Frame width in DIP.
            height: Frame height in DIP.
            window_state: Frame window state: normal, minimized, maximized, or
                fullscreen.
            browser_context_id: The browser context to create the page in.
            enable_begin_frame_control: Whether BeginFrames for this target will be
                controlled via DevTools (headless shell only, not supported on MacOS
                yet).
            new_window: Whether to create a new window or tab (not supported by
                headless shell).
            background: Whether to create the target in background or foreground
                (not supported by headless shell).
            for_tab: Whether to create the target of type "tab".
            hidden: Whether to create a hidden target. The hidden target is observable
                via protocol, but not present in the tab UI strip. Cannot be created
                with forTab:true, newWindow:true or background:false. The life-time of
                the tab is limited to the life-time of the session.

        Returns:
            CreateTargetCommand: The CDP command to create a target; its response is
                expected to contain the ID of the created target.
        """
        target_params = CreateTargetParams(url=url)

        # Frame geometry.
        if left is not None:
            target_params['left'] = left
        if top is not None:
            target_params['top'] = top
        if width is not None:
            target_params['width'] = width
        if height is not None:
            target_params['height'] = height

        # Window state and owning browser context.
        if window_state is not None:
            target_params['windowState'] = window_state
        if browser_context_id is not None:
            target_params['browserContextId'] = browser_context_id

        # Creation flags.
        if enable_begin_frame_control is not None:
            target_params['enableBeginFrameControl'] = enable_begin_frame_control
        if new_window is not None:
            target_params['newWindow'] = new_window
        if background is not None:
            target_params['background'] = background
        if for_tab is not None:
            target_params['forTab'] = for_tab
        if hidden is not None:
            target_params['hidden'] = hidden

        return Command(
            method=TargetMethod.CREATE_TARGET,
            params=target_params,
        )

    @staticmethod
    def detach_from_target(session_id: Optional[str] = None) -> DetachFromTargetCommand:
        """
        Builds the command that detaches a session from its target.

        Args:
            session_id: ID of the session to detach. When None, ``sessionId`` is left
                out of the params.
                NOTE(review): earlier documentation said omitting it detaches all
                sessions; that is decided by the browser and cannot be confirmed
                from this code.

        Returns:
            DetachFromTargetCommand: The CDP command to detach from the target.
        """
        detach_params = DetachFromTargetParams()
        # Send sessionId only when the caller named a session.
        if session_id is not None:
            detach_params['sessionId'] = session_id
        return Command(
            method=TargetMethod.DETACH_FROM_TARGET,
            params=detach_params,
        )

    @staticmethod
    def dispose_browser_context(browser_context_id: str) -> DisposeBrowserContextCommand:
        """
        Builds the command that deletes a browser context.

        Per the original documentation, all pages belonging to the context are closed
        without calling their beforeunload hooks.

        Args:
            browser_context_id: The ID of the browser context to dispose.

        Returns:
            DisposeBrowserContextCommand: A CDP command whose params carry the ID as
                ``browserContextId``.
        """
        return Command(
            method=TargetMethod.DISPOSE_BROWSER_CONTEXT,
            params=DisposeBrowserContextParams(browserContextId=browser_context_id),
        )

    @staticmethod
    def get_browser_contexts() -> GetBrowserContextsCommand:
        """
        Builds the command that lists the browser contexts created with
        createBrowserContext.

        The command is sent with an empty params mapping.

        Returns:
            GetBrowserContextsCommand: The CDP command to get all browser contexts; its
                response is expected to contain an array of browser context IDs.
        """
        return Command(
            method=TargetMethod.GET_BROWSER_CONTEXTS,
            params={},
        )

    @staticmethod
    def get_targets(filter: Optional[list] = None) -> GetTargetsCommand:
        """
        Builds the command that retrieves the list of available targets.

        Args:
            filter: Only targets matching the filter will be reported. When None,
                ``filter`` is left out of the params; per the original documentation
                the filter used for target discovery is then applied if discovery is
                currently enabled.

        Returns:
            GetTargetsCommand: The CDP command to get targets; its response is expected
                to contain a list of TargetInfo objects.
        """
        targets_params = GetTargetsParams()
        # Forward the filter untouched, but only when one was provided.
        if filter is not None:
            targets_params['filter'] = filter
        return Command(
            method=TargetMethod.GET_TARGETS,
            params=targets_params,
        )

    @staticmethod
    def set_auto_attach(
        auto_attach: bool,
        wait_for_debugger_on_start: bool = False,
        flatten: Optional[bool] = None,
        filter: Optional[list] = None,
    ) -> SetAutoAttachCommand:
        """
        Builds the command that controls automatic attachment to related targets.

        Per the original documentation, related targets are those directly tied to the
        current one (for example, iframes or workers). Turning the option on also
        attaches to all existing related targets; turning it off detaches from all
        currently attached targets.

        Args:
            auto_attach: Whether to auto-attach to related targets.
            wait_for_debugger_on_start: Whether to pause new targets when attaching to
                them. Use Runtime.runIfWaitingForDebugger to run paused targets.
                Always sent; defaults to False.
            flatten: Enables "flat" access to the session via specifying the sessionId
                attribute in the commands. This mode is preferred; the non-flattened
                mode is being deprecated (see crbug.com/991325). Omitted from the
                params when None.
            filter: Only targets matching the filter will be attached. Omitted from
                the params when None.

        Returns:
            SetAutoAttachCommand: The CDP command to set auto-attach behavior.
        """
        attach_params = SetAutoAttachParams(
            autoAttach=auto_attach,
            waitForDebuggerOnStart=wait_for_debugger_on_start,
        )
        # Optional settings are added only when the caller supplied them.
        if flatten is not None:
            attach_params['flatten'] = flatten
        if filter is not None:
            attach_params['filter'] = filter
        return Command(
            method=TargetMethod.SET_AUTO_ATTACH,
            params=attach_params,
        )

    @staticmethod
    def set_discover_targets(
        discover: bool, filter: Optional[list] = None
    ) -> SetDiscoverTargetsCommand:
        """
        Build the command that turns target discovery on or off.

        Controls whether to discover available targets and notify via
        targetCreated/targetInfoChanged/targetDestroyed events, which is useful for
        monitoring when new tabs, workers, or other targets are created or destroyed.

        Args:
            discover: Whether to discover available targets.
            filter: Only targets matching filter will be discovered. If discover is false,
                   filter must be omitted or empty.

        Returns:
            Command: The CDP command to set target discovery.
        """
        # Without a filter the payload carries only the 'discover' flag.
        if filter is None:
            payload = SetDiscoverTargetsParams(discover=discover)
        else:
            payload = SetDiscoverTargetsParams(discover=discover, filter=filter)
        return Command(method=TargetMethod.SET_DISCOVER_TARGETS, params=payload)

    @staticmethod
    def attach_to_browser_target(session_id: str) -> AttachToBrowserTargetCommand:
        """
        Build the command that attaches to the browser target.

        Experimental: attaches to the browser target using flat sessionId mode only.
        The browser target is a special target that represents the browser itself
        rather than a page or other content.

        Args:
            session_id: ID of the session to attach to the browser target
                       (sent as the ``sessionId`` parameter).

        Returns:
            Command: The CDP command to attach to the browser target,
                    which will return a new session ID.
        """
        return Command(
            method=TargetMethod.ATTACH_TO_BROWSER_TARGET,
            params=AttachToBrowserTargetParams(sessionId=session_id),
        )

    @staticmethod
    def get_target_info(target_id: str) -> GetTargetInfoCommand:
        """
        Build the command that fetches information about one target.

        Experimental: returns detailed information about a target, such as its
        type, URL, title, and other properties.

        Args:
            target_id: ID of the target to get information about
                      (sent as the ``targetId`` parameter).

        Returns:
            Command: The CDP command to get target information, which will return
                    a TargetInfo object with details about the target.
        """
        return Command(
            method=TargetMethod.GET_TARGET_INFO,
            params=GetTargetInfoParams(targetId=target_id),
        )

    @staticmethod
    def set_remote_locations(locations: list[RemoteLocation]) -> SetRemoteLocationsCommand:
        """
        Build the command that enables target discovery for remote locations.

        Experimental: enables target discovery for the given remote locations when
        setDiscoverTargets was set to true, e.g. to discover targets on remote
        devices or in different browser instances.

        Args:
            locations: list of remote locations, each containing a host and port.

        Returns:
            Command: The CDP command to set remote locations for target discovery.
        """
        return Command(
            method=TargetMethod.SET_REMOTE_LOCATIONS,
            params=SetRemoteLocationsParams(locations=locations),
        )


================================================
FILE: pydoll/connection/__init__.py
================================================
from pydoll.connection.connection_handler import ConnectionHandler

__all__ = [
    'ConnectionHandler',
]


================================================
FILE: pydoll/connection/connection_handler.py
================================================
from __future__ import annotations

import asyncio
import json
import logging
from contextlib import suppress
from typing import TYPE_CHECKING, cast

import websockets
from websockets.asyncio.client import ClientConnection
from websockets.protocol import State

from pydoll.connection.managers import CommandsManager, EventsManager
from pydoll.exceptions import (
    CommandExecutionTimeout,
    WebSocketConnectionClosed,
)
from pydoll.protocol.base import CDPEvent, Response
from pydoll.utils import get_browser_ws_address

if TYPE_CHECKING:
    from typing import Any, AsyncGenerator, Awaitable, Callable, Coroutine, Optional, Union

    from websockets.asyncio.client import connect as Connect

    from pydoll.protocol.base import Command, T_CommandParams, T_CommandResponse

logger = logging.getLogger(__name__)


class ConnectionHandler:
    """
    WebSocket connection manager for Chrome DevTools Protocol endpoints.

    Handles connection lifecycle, command execution, and event subscription
    for both browser-level and page-level CDP endpoints. The connection is
    opened lazily: the first command (or ping) establishes it and starts a
    background task that reads incoming messages.
    """

    def __init__(
        self,
        connection_port: Optional[int] = None,
        page_id: Optional[str] = None,
        ws_address_resolver: Callable[[int], Coroutine[Any, Any, str]] = get_browser_ws_address,
        ws_connector: type[Connect] = websockets.connect,
        ws_address: Optional[str] = None,
    ):
        """
        Initialize connection handler.

        No network activity happens here; the socket is opened on first use.

        Args:
            connection_port: Browser's debugging server port.
            page_id: Target page ID. If None, connects to browser-level endpoint.
            ws_address_resolver: Function to resolve WebSocket URL from port.
            ws_connector: WebSocket connection factory (mainly for testing).
            ws_address: WebSocket address. It has priority over connection_port and page_id.
        """
        self._connection_port = connection_port
        self._page_id = page_id
        self._ws_address_resolver = ws_address_resolver
        self._ws_connector = ws_connector
        self._ws_address = ws_address
        self._ws_connection: Optional[ClientConnection] = None
        self._command_manager = CommandsManager()
        self._events_handler = EventsManager()
        self._receive_task: Optional[asyncio.Task] = None
        logger.info('ConnectionHandler initialized.')
        logger.debug(
            f'Init params: port={self._connection_port}, page_id={self._page_id}, '
            f'ws_address_set={bool(self._ws_address)}'
        )

    @property
    def network_logs(self):
        """Access captured network request and response logs."""
        return self._events_handler.network_logs

    @property
    def dialog(self):
        """Access currently active JavaScript dialog information."""
        return self._events_handler.dialog

    async def ping(self) -> bool:
        """
        Test if WebSocket connection is active and responsive.

        Returns:
            True if a connection could be ensured and a ping sent without any
            exception being raised, False otherwise.
        """
        # Best-effort probe: any failure simply means "not reachable".
        with suppress(Exception):
            logger.debug('Pinging WebSocket connection')
            await self._ensure_active_connection()
            await cast(ClientConnection, self._ws_connection).ping()
            logger.debug('Ping OK')
            return True
        return False

    async def execute_command(
        self, command: Command[T_CommandParams, T_CommandResponse], timeout: int = 60
    ) -> T_CommandResponse:
        """
        Send CDP command and await response.

        Args:
            command: CDP command to send. Its 'id' key is assigned here.
            timeout: Maximum seconds to wait for response.

        Returns:
            Parsed response object matching command's expected type.

        Raises:
            CommandExecutionTimeout: If browser doesn't respond within timeout.
            WebSocketConnectionClosed: If connection closes during execution.
        """
        await self._ensure_active_connection()
        future = self._command_manager.create_command_future(command)

        try:
            command_str = json.dumps(command)
            ws = cast(ClientConnection, self._ws_connection)
            logger.debug(
                f'Sending command: id={command.get("id")}, method={command.get("method")}, '
                f'timeout={timeout}s'
            )
            # We are inside a coroutine, so the running loop is the right clock source.
            loop = asyncio.get_running_loop()
            start = loop.time()
            await ws.send(command_str)
            response: str = await asyncio.wait_for(future, timeout)
            elapsed = loop.time() - start
            logger.debug(f'Command completed: id={command.get("id")} in {elapsed:.3f}s')
            return json.loads(response)
        except asyncio.TimeoutError as exc:
            logger.error(
                f'Command timeout: id={command.get("id")}, method={command.get("method")}, '
                f'timeout={timeout}s'
            )
            raise CommandExecutionTimeout() from exc
        except websockets.ConnectionClosed as exc:
            await self._handle_connection_loss()
            logger.warning(f'WebSocket connection closed during command: id={command.get("id")}')
            raise WebSocketConnectionClosed() from exc
        finally:
            # Always drop the bookkeeping entry so a failed, timed-out or cancelled
            # command never leaves a stale future behind. On success the entry was
            # already removed when the response was resolved, making this a no-op.
            self._command_manager.remove_pending_command(command['id'])

    async def register_callback(
        self,
        event_name: str,
        callback: Callable[[dict], Awaitable[None]],
        temporary: bool = False,
    ) -> int:
        """
        Register event listener for CDP events.

        Args:
            event_name: CDP event name (e.g., 'Page.loadEventFired').
            callback: Async function called when event occurs.
            temporary: If True, callback removed after first trigger.

        Returns:
            Callback ID for later removal.

        Note:
            Corresponding CDP domain must be enabled before events fire.
        """
        callback_id = self._events_handler.register_callback(event_name, callback, temporary)
        logger.debug(
            f'Registered callback: id={callback_id}, event={event_name}, temporary={temporary}'
        )
        return callback_id

    async def remove_callback(self, callback_id: int) -> bool:
        """
        Remove registered event callback by ID.

        Returns:
            True if a callback with that ID existed and was removed, False otherwise.
        """
        removed = self._events_handler.remove_callback(callback_id)
        logger.debug(f'Removed callback: id={callback_id}, removed={removed}')
        return removed

    async def clear_callbacks(self):
        """Remove all registered event callbacks."""
        logger.debug('Clearing all callbacks')
        self._events_handler.clear_callbacks()

    async def close(self):
        """
        Close WebSocket connection and release resources.

        Callbacks are cleared even when no connection was ever opened.
        """
        await self.clear_callbacks()
        if self._ws_connection is None:
            logger.debug('Close called but no active WebSocket connection')
            return

        # Closing an already-closed socket is not an error for our purposes.
        with suppress(websockets.ConnectionClosed):
            await self._ws_connection.close()
        logger.info('WebSocket connection closed.')

    async def _ensure_active_connection(self):
        """Ensure active connection exists, establishing new one if needed."""
        if self._ws_connection is None or self._ws_connection.state is State.CLOSED:
            logger.debug('No active WebSocket connection; establishing new one')
            await self._establish_new_connection()

    async def _establish_new_connection(self):
        """Create fresh WebSocket connection and start event listening."""
        ws_address = await self._resolve_ws_address()
        logger.info(f'Connecting to {ws_address}')
        self._ws_connection = await self._ws_connector(
            ws_address,
            max_size=1024 * 1024 * 10,  # 10MB
        )
        # Background reader that dispatches command responses and events.
        self._receive_task = asyncio.create_task(self._receive_events())
        logger.debug('WebSocket connection established')

    async def _resolve_ws_address(self):
        """
        Determine the WebSocket address to connect to.

        Resolution order: an explicitly provided address wins; otherwise, with no
        page ID, the browser-level address is obtained from the resolver; otherwise
        a page-level URL is built from the port and page ID.
        """
        if self._ws_address:
            logger.debug('Using provided WebSocket address')
            return self._ws_address
        if not self._page_id:
            resolved = await self._ws_address_resolver(self._connection_port)
            logger.debug(f'Resolved browser-level WebSocket address: {resolved}')
            return resolved
        address = f'ws://localhost:{self._connection_port}/devtools/page/{self._page_id}'
        logger.debug(f'Resolved page-level WebSocket address: {address}')
        return address

    async def _handle_connection_loss(self):
        """Clean up resources after connection loss."""
        if self._ws_connection and self._ws_connection.state is not State.CLOSED:
            await self._ws_connection.close()
        # Forget the socket so the next command opens a fresh one.
        self._ws_connection = None

        if self._receive_task and not self._receive_task.done():
            self._receive_task.cancel()

        logger.info('Connection resources cleaned up')

    async def _receive_events(self):
        """
        Main loop for receiving and processing WebSocket messages.

        A closed connection ends the loop quietly; any other exception is logged
        and re-raised.
        """
        try:
            async for raw_message in self._incoming_messages():
                await self._process_single_message(raw_message)
        except websockets.ConnectionClosed as e:
            logger.info(f'Connection closed gracefully: {e}')
        except Exception as e:
            logger.error(f'Unexpected error in event loop: {e}')
            raise

    async def _incoming_messages(self) -> AsyncGenerator[Union[str, bytes], None]:
        """Generator yielding raw messages from WebSocket connection."""
        # Bind the current socket once: this generator serves exactly that connection.
        ws = cast(ClientConnection, self._ws_connection)

        while ws.state is not State.CLOSED:
            yield await ws.recv()

    async def _process_single_message(self, raw_message: str):
        """
        Process single raw WebSocket message.

        Unparseable or empty messages are dropped; everything else is routed
        either to the command manager (responses) or the events manager (events).
        """
        message = self._parse_message(raw_message)
        if not message:
            return

        if self._is_command_response(message):
            message = cast(Response, message)
            await self._handle_command_message(message)
        else:
            message = cast(CDPEvent, message)
            await self._handle_event_message(message)

    @staticmethod
    def _parse_message(raw_message: str) -> Union[CDPEvent, Response, None]:
        """
        Parse raw message string into JSON object.

        Returns:
            The decoded object, or None (after logging a warning) when the
            message is not valid JSON.
        """
        try:
            return json.loads(raw_message)
        except json.JSONDecodeError:
            logger.warning(f'Failed to parse message: {raw_message[:200]}...')
            return None

    @staticmethod
    def _is_command_response(message: Union[CDPEvent, Response]) -> bool:
        """
        Determine if message is command response or event notification.

        A message counts as a command response when it carries an integer 'id'.
        """
        # .get() yields None for a missing key, which is not an int.
        return isinstance(message.get('id'), int)

    async def _handle_command_message(self, message: Response):
        """Process command response messages."""
        logger.debug(f'Processing command response: {message.get("id")}')
        # The pending future is resolved with the serialized response text.
        self._command_manager.resolve_command(message['id'], json.dumps(message))

    async def _handle_event_message(self, message: CDPEvent):
        """Process event notification messages."""
        event_type = message.get('method', 'unknown-event')
        logger.debug(f'Processing {event_type} event')
        await self._events_handler.process_event(message)

    def __repr__(self):
        """String representation for debugging."""
        return f'ConnectionHandler(port={self._connection_port})'

    def __str__(self):
        """User-friendly string representation."""
        return f'ConnectionHandler(port={self._connection_port})'

    async def __aenter__(self):
        """Async context manager entry."""
        return self

    async def __aexit__(self, exc_type, exc_val, exc_tb):
        """Async context manager exit with cleanup."""
        await self.close()


================================================
FILE: pydoll/connection/managers/__init__.py
================================================
from pydoll.connection.managers.commands_manager import CommandsManager
from pydoll.connection.managers.events_manager import EventsManager

__all__ = [
    'CommandsManager',
    'EventsManager',
]


================================================
FILE: pydoll/connection/managers/commands_manager.py
================================================
from __future__ import annotations

import asyncio
import logging
from typing import TYPE_CHECKING

if TYPE_CHECKING:
    from pydoll.protocol.base import Command

logger = logging.getLogger(__name__)


class CommandsManager:
    """
    Manages command lifecycle and ID assignment for CDP commands.

    Handles command future creation, ID generation, and response resolution
    for asynchronous command execution. IDs start at 1 and increase by one
    for every command prepared through this manager.
    """

    def __init__(self) -> None:
        """Initialize command manager with empty state."""
        # Maps command id -> future awaited by whoever sent that command.
        self._pending_commands: dict[int, asyncio.Future] = {}
        self._id = 1
        logger.debug('CommandsManager initialized')

    def create_command_future(self, command: Command) -> asyncio.Future:
        """
        Create future for command and assign unique ID.

        The command mapping is mutated in place: its 'id' key is set to the
        newly allocated ID.

        Args:
            command: Command to prepare for execution.

        Returns:
            Future that resolves when command completes.
        """
        command_id = self._id
        self._id += 1

        command['id'] = command_id
        future: asyncio.Future = asyncio.Future()
        self._pending_commands[command_id] = future
        logger.debug(
            f'Created future for command id={command["id"]} method={command.get("method")}'
        )
        return future

    def resolve_command(self, response_id: int, result: str):
        """
        Resolve pending command with its result.

        Unknown IDs are ignored. The entry is always removed from the pending
        map; if its future is already finished (for example cancelled by a
        timeout or by cancellation of the waiting task) the late result is
        discarded instead of raising ``asyncio.InvalidStateError``.

        Args:
            response_id: ID of the command the response belongs to.
            result: Payload to deliver to the waiting future.
        """
        future = self._pending_commands.pop(response_id, None)
        if future is None:
            return

        if future.done():
            # Nobody is waiting any more; setting a result would raise.
            logger.debug(f'Discarded late response for finished command id={response_id}')
            return

        future.set_result(result)
        logger.debug(f'Resolved command future id={response_id}')

    def remove_pending_command(self, command_id: int):
        """Remove pending command without resolving (for timeouts/cancellations)."""
        if self._pending_commands.pop(command_id, None) is not None:
            logger.debug(f'Removed pending command id={command_id}')


================================================
FILE: pydoll/connection/managers/events_manager.py
================================================
from __future__ import annotations

import asyncio
import logging
from typing import TYPE_CHECKING, cast

from pydoll.protocol.page.events import (
    JavascriptDialogOpeningEvent,
    JavascriptDialogOpeningEventParams,
)

if TYPE_CHECKING:
    from typing import Any, Callable

    from pydoll.protocol.base import CDPEvent
    from pydoll.protocol.network.events import RequestWillBeSentEvent

logger = logging.getLogger(__name__)


class EventsManager:
    """
    Manages event callbacks, processing, and network logs.

    Handles event callback registration, triggering, and maintains state
    for network logs and dialog information.
    """

    # Upper bound on the number of Network.requestWillBeSent events retained.
    _MAX_NETWORK_LOGS = 10000

    def __init__(self) -> None:
        """Initialize events manager with empty state."""
        # Maps callback id -> {'event': name, 'callback': fn, 'temporary': bool}.
        self._event_callbacks: dict[int, dict] = {}
        self._callback_id = 0
        self.network_logs: list[RequestWillBeSentEvent] = []
        self.dialog = JavascriptDialogOpeningEvent()  # type: ignore
        logger.info('EventsManager initialized')
        logger.debug('Initial state: callbacks=0, logs=0, dialog=empty')

    def register_callback(
        self, event_name: str, callback: Callable[[dict], Any], temporary: bool = False
    ) -> int:
        """
        Register callback for specific event type.

        Args:
            event_name: Event name to listen for.
            callback: Function called when event occurs.
            temporary: If True, callback removed after first trigger.

        Returns:
            Callback ID for later removal.
        """
        self._callback_id += 1
        self._event_callbacks[self._callback_id] = {
            'event': event_name,
            'callback': callback,
            'temporary': temporary,
        }
        logger.info(f"Registered callback '{event_name}' with ID {self._callback_id}")
        logger.debug(
            f'Callback details: temporary={temporary}, total_callbacks={len(self._event_callbacks)}'
        )
        return self._callback_id

    def remove_callback(self, callback_id: int) -> bool:
        """
        Remove callback by ID.

        Returns:
            True if the callback existed and was removed, False (with a warning
            logged) when the ID is unknown.
        """
        if callback_id not in self._event_callbacks:
            logger.warning(f'Callback ID {callback_id} not found')
            return False

        del self._event_callbacks[callback_id]
        logger.info(f'Removed callback ID {callback_id}')
        logger.debug(f'Remaining callbacks: {len(self._event_callbacks)}')
        return True

    def clear_callbacks(self):
        """Remove all registered callbacks."""
        self._event_callbacks.clear()
        logger.info('All callbacks cleared')
        logger.debug('Callbacks store is now empty')

    async def process_event(self, event_data: CDPEvent):
        """
        Process received event and trigger callbacks.

        Handles special events (network requests, dialogs) and updates
        internal state before triggering registered callbacks. Event names are
        compared exactly, so related-but-different events such as
        'Network.requestWillBeSentExtraInfo' are not recorded in the network logs.

        Args:
            event_data: Event message; its 'method' key holds the event name.
        """
        event_name = event_data['method']
        logger.debug(f'Processing event: {event_name}')

        if event_name == 'Network.requestWillBeSent':
            self._update_network_logs(event_data)
        elif event_name == 'Page.javascriptDialogOpening':
            self.dialog = JavascriptDialogOpeningEvent(
                method=event_data['method'],
                params=cast(JavascriptDialogOpeningEventParams, event_data['params']),
            )
        elif event_name == 'Page.javascriptDialogClosed':
            # Reset to the empty placeholder once the dialog is gone.
            self.dialog = JavascriptDialogOpeningEvent()  # type: ignore

        await self._trigger_callbacks(event_name, event_data)

    def _update_network_logs(self, event_data: RequestWillBeSentEvent):
        """Add network event to logs (keeps last 10000 entries)."""
        self.network_logs.append(event_data)
        # Trim in place: avoids copying the whole list on every event and keeps
        # previously handed-out references to the list up to date.
        overflow = len(self.network_logs) - self._MAX_NETWORK_LOGS
        if overflow > 0:
            del self.network_logs[:overflow]

    async def _trigger_callbacks(self, event_name: str, event_data: CDPEvent):
        """
        Trigger all registered callbacks for event, removing temporary ones.

        Coroutine functions are awaited, plain callables are invoked directly.
        An exception raised by one callback is logged and does not prevent the
        remaining callbacks from running.
        """
        callbacks_to_remove = []

        # Iterate over a snapshot: callbacks may register or remove callbacks.
        for cb_id, cb_data in list(self._event_callbacks.items()):
            if cb_data['event'] != event_name:
                continue

            callback = cb_data['callback']
            try:
                if asyncio.iscoroutinefunction(callback):
                    await callback(event_data)
                else:
                    callback(event_data)
            except Exception as e:
                logger.error(f'Error in callback {cb_id}: {str(e)}')

            if cb_data['temporary']:
                callbacks_to_remove.append(cb_id)

        for cb_id in callbacks_to_remove:
            self.remove_callback(cb_id)
        logger.debug(
            f"Triggered callbacks for '{event_name}'. Removed temporaries: {callbacks_to_remove}"
        )


================================================
FILE: pydoll/constants.py
================================================
from enum import Enum, auto


class By(str, Enum):
    """
    String-valued identifiers for selector kinds.

    Each member is also a ``str`` (mixin), so it compares equal to its value.
    NOTE(review): presumably used to choose how elements are located; the call
    sites are outside this block - confirm there.
    """

    CSS_SELECTOR = 'css'
    XPATH = 'xpath'
    CLASS_NAME = 'class_name'
    ID = 'id'
    TAG_NAME = 'tag_name'
    NAME = 'name'


class PageLoadState(str, Enum):
    """
    String-valued page load states.

    Each member is also a ``str`` (mixin), so it compares equal to its value.
    NOTE(review): the values look like the strings of the DOM
    ``document.readyState`` property - confirm against the code that consumes them.
    """

    COMPLETE = 'complete'
    INTERACTIVE = 'interactive'
    LOADING = 'loading'


class ScrollPosition(str, Enum):
    """
    String-valued scroll directions (up, down, left, right).

    Each member is also a ``str`` (mixin), so it compares equal to its value.
    """

    UP = 'up'
    DOWN = 'down'
    LEFT = 'left'
    RIGHT = 'right'


class Scripts:
    ELEMENT_VISIBLE = """
    function() {
        const rect = this.getBoundingClientRect();
        return (
            rect.width > 0 && rect.height > 0
            && getComputedStyle(this).visibility !== 'hidden'
            && getComputedStyle(this).display !== 'none'
        )
    }
    """

    ELEMENT_ON_TOP = """
    function() {
        const rect = this.getBoundingClientRect();
        const x = rect.x + rect.width / 2;
        const y = rect.y + rect.height / 2;
        const elementFromPoint = document.elementFromPoint(x, y);
        if (!elementFromPoint) {
            return false;
        }
        return elementFromPoint === this || this.contains(elementFromPoint);
    }
    """

    ELEMENT_INTERACTIVE = """
    function() {
        const style = window.getComputedStyle(this);
        const rect = this.getBoundingClientRect();
        if (
            rect.width <= 0 ||
            rect.height <= 0 ||
            style.visibility === 'hidden' ||
            style.display === 'none' ||
            style.pointerEvents === 'none'
        ) {
            return false;
        }
        const x = rect.x + rect.width / 2;
        const y = rect.y + rect.height / 2;
        const elementFromPoint = document.elementFromPoint(x, y);
        if (!elementFromPoint || (elementFromPoint !== this && !this.contains(elementFromPoint))) {
            return false;
        }
        if (this.disabled) {
            return false;
        }
        return true;
    }
    """

    CLICK = """
    function(){
        clicked = false;
        this.addEventListener('click', function(){
            clicked = true;
        });
        this.click();
        return clicked;
    }
    """

    CLICK_OPTION_TAG = """
    function() {
        var select = this && this.parentElement ? this.parentElement.closest('select') : null;
        if (!select) { return false; }
        for (var i = 0; i < select.options.length; i++) {
            select.options[i].selected = false;
        }
        this.selected = true;
        select.value = this.value;
        select.dispatchEvent(new Event('input', { bubbles: true }));
        select.dispatchEvent(new Event('change', { bubbles: true }));
        return true;
    }
    """

    BOUNDS = """
    function() {
        return JSON.stringify(this.getBoundingClientRect());
    }
    """

    FIND_RELATIVE_XPATH_ELEMENT = """
        function() {
            return document.evaluate(
                "{escaped_value}", this, null,
                XPathResult.FIRST_ORDERED_NODE_TYPE, null
            ).singleNodeValue;
        }
    """

    FIND_XPATH_ELEMENT = """
        var element = document.evaluate(
            "{escaped_value}", document, null,
            XPathResult.FIRST_ORDERED_NODE_TYPE, null
        ).singleNodeValue;
        element;
    """

    FIND_RELATIVE_XPATH_ELEMENTS = """
        function() {
            var elements = document.evaluate(
                "{escaped_value}", this, null,
                XPathResult.ORDERED_NODE_SNAPSHOT_TYPE, null
            );
            var results = [];
            for (var i = 0; i < elements.snapshotLength; i++) {
                results.push(elements.snapshotItem(i));
            }
            return results;
        }
    """

    FIND_XPATH_ELEMENTS = """
        var elements = document.evaluate(
            "{escaped_value}", document, null,
            XPathResult.ORDERED_NODE_SNAPSHOT_TYPE, null
        );
        var results = [];
        for (var i = 0; i < elements.snapshotLength; i++) {
            results.push(elements.snapshotItem(i));
        }
        results;
    """

    QUERY_SELECTOR = 'document.querySelector("{selector}");'

    RELATIVE_QUERY_SELECTOR = """
        function() {
            return this.querySelector("{selector}");
        }
    """

    QUERY_SELECTOR_ALL = 'document.querySelectorAll("{selector}");'

    RELATIVE_QUERY_SELECTOR_ALL = """
        function() {
            return this.querySelectorAll("{selector}");
        }
    """

    GET_TEXT_BY_XPATH = """
        (() => {
            const node = document.evaluate(
                "{escaped_value}",
                document,
                null,
                XPathResult.FIRST_ORDERED_NODE_TYPE,
                null
            ).singleNodeValue;
            return node ? (node.textContent || "") : "";
        })()
    """

    GET_TEXT_BY_CSS = """
        (() => {
            const el = document.querySelector("{selector}");
            return el ? (el.textContent || "") : "";
        })()
    """

    GET_PARENT_NODE = """
        function() {
            return this.parentElement;
        }
    """

    GET_CHILDREN_NODE = """
        function() {{
            function getChildrenUntilDepth(element, maxDepth, tagFilter = [], currentDepth = 1)
            {{
                if (currentDepth > maxDepth) return [];

                const children = Array.from(element.children);
                let filtered = tagFilter.length === 0
                    ? children
                : children.filter(child => tagFilter.includes(child.tagName.toLowerCase()));

                let allDescendants = [...filtered];

                for (let child of children)
                {{
                    allDescendants.push(
                    ...getChildrenUntilDepth(child, maxDepth, tagFilter, currentDepth + 1)
                    );
                }}

                return allDescendants;
            }}

            return getChildrenUntilDepth(this, {max_depth}, {tag_filter});
        }}
    """

    GET_SIBLINGS_NODE = """
        function() {{
            function getSiblingsUntilDepth(element, tagFilter = [])
            {{
                const parent = element.parentElement;
                const siblings = Array.from(parent.children);
                let filtered = tagFilter.length === 0
                    ? siblings.filter(child => child !== element)
                : siblings.filter(child =>
                    tagFilter.includes(child.tagName.toLowerCase()) && child !== element);

                let allDescendants = [...filtered];

                return allDescendants;
            }}

            return getSiblingsUntilDepth(this, {tag_filter});
        }}
    """

    # str.format() template for an async IIFE that performs `fetch(url, options)`
    # inside the page. `{url}` and `{options}` are pasted in as JavaScript
    # expressions (presumably JSON-encoded by the caller — confirm at call site);
    # doubled braces become literal JS braces.
    #
    # On success the script returns a plain object with: status, ok, url,
    # headers (response headers copied into an object), cookies
    # (document.cookie), content (UTF-8 bytes of the body text as a number
    # array), text, and json (parsed body when the content-type contains
    # 'application/json' and parsing succeeds, otherwise null). A leading
    # `)]}'`-style prefix followed by a newline is stripped from the body first.
    # On failure it returns an object with `error` (stringified) and `status: 0`.
    #
    # NOTE(review): fetch() takes two arguments (resource, options). The third
    # object literal carrying `credentials: 'include'` is ignored, so the
    # credentials mode is whatever `options` specifies or the fetch default.
    # Merging it into `options` would change cross-origin behaviour for
    # existing callers — confirm intent before changing.
    # NOTE(review): the inline comment says cookies come from the set-cookie
    # header, but the code reads `document.cookie`.
    # NOTE(review): the first two entries of `possiblePrefixes` are identical.
    MAKE_REQUEST = """
(async function() {{
    async function makeRequest(url, options) {{
        try {{
            const response = await fetch(url, options, {{
                credentials: 'include',
            }});
            const headers = {{}};
            response.headers.forEach((value, key) => {{
                headers[key] = value;
            }});

            // Extract cookies from set-cookie header
            const cookies = document.cookie;
            let text = await response.text();
            const possiblePrefixes = [")]}}'\\n", ")]}}'\\n", ")]}}\\n"];
            for (let prefix of possiblePrefixes) {{
                if (text.startsWith(prefix)) {{
                    text = text.substring(prefix.length);
                    break;
                }}
            }}
            let content, jsonData;
            const contentType = response.headers.get('content-type') || '';

            if (contentType.includes('application/json')) {{
                try {{
                    jsonData = JSON.parse(text);
                    text = JSON.stringify(jsonData);
                }} catch (e) {{
                    jsonData = null;
                    // Keep original text if parsing fails
                }}
                content = new TextEncoder().encode(text).buffer;
            }} else {{
                // For non-JSON, keep original text handling
                content = new TextEncoder().encode(text).buffer;
                jsonData = null;
            }}

            return {{
                status: response.status,
                ok: response.ok,
                url: response.url,
                headers: headers,
                cookies: cookies,
                content: Array.from(new Uint8Array(content)),
                text: text,
                json: jsonData
            }};
        }} catch (error) {{
            return {{
                error: error.toString(),
                status: 0
            }};
        }}
    }}

    const url = {url};
    const options = {options};
    return await makeRequest(url, options);
}})();
"""

    # str.format() template producing a Promise that scrolls the window by a
    # relative amount. Placeholders: `{behavior}` (compared against 'auto'),
    # `{axis}` (used as the option key passed to window.scrollBy — presumably
    # 'top' or 'left', confirm at call site) and `{distance}`.
    # With behavior 'auto' the promise resolves right after scrollBy(). In every
    # other case the scroll is issued with behavior 'smooth' and the promise
    # resolves on the first 'scrollend' event or after a 2000 ms fallback timer,
    # whichever comes first. The timer is not cancelled when 'scrollend' fires;
    # its later resolve() call has no effect on the already-settled promise.
    SCROLL_BY = """
new Promise((resolve) => {{
    const behavior = '{behavior}';
    if (behavior === 'auto') {{
        window.scrollBy({{
            {axis}: {distance},
            behavior: 'auto'
        }});
        resolve();
    }} else {{
        const onScrollEnd = () => {{
            window.removeEventListener('scrollend', onScrollEnd);
            resolve();
        }};
        window.addEventListener('scrollend', onScrollEnd);
        window.scrollBy({{
            {axis}: {distance},
            behavior: 'smooth'
        }});
        setTimeout(() => {{
            window.removeEventListener('scrollend', onScrollEnd);
            resolve();
        }}, 2000);
    }}
}});
"""

    # str.format() template producing a Promise that scrolls the window to
    # `top: 0`. The only placeholder is `{behavior}`: 'auto' scrolls and
    # resolves immediately; any other value scrolls with behavior 'smooth' and
    # resolves on the first 'scrollend' event or after a 2000 ms fallback timer.
    SCROLL_TO_TOP = """
new Promise((resolve) => {{
    const behavior = '{behavior}';
    if (behavior === 'auto') {{
        window.scrollTo({{
            top: 0,
            behavior: 'auto'
        }});
        resolve();
    }} else {{
        const onScrollEnd = () => {{
            window.removeEventListener('scrollend', onScrollEnd);
            resolve();
        }};
        window.addEventListener('scrollend', onScrollEnd);
        window.scrollTo({{
            top: 0,
            behavior: 'smooth'
        }});
        setTimeout(() => {{
            window.removeEventListener('scrollend', onScrollEnd);
            resolve();
        }}, 2000);
    }}
}});
"""

    # str.format() template producing a Promise that scrolls the window to
    # `top: document.body.scrollHeight`. The only placeholder is `{behavior}`:
    # 'auto' scrolls and resolves immediately; any other value scrolls with
    # behavior 'smooth' and resolves on the first 'scrollend' event or after a
    # 2000 ms fallback timer.
    # NOTE(review): the target uses document.body.scrollHeight only, whereas
    # GET_REMAINING_SCROLL_TO_BOTTOM takes the max of body and documentElement
    # scroll heights — confirm whether the difference is intended.
    SCROLL_TO_BOTTOM = """
new Promise((resolve) => {{
    const behavior = '{behavior}';
    if (behavior === 'auto') {{
        window.scrollTo({{
            top: document.body.scrollHeight,
            behavior: 'auto'
        }});
        resolve();
    }} else {{
        const onScrollEnd = () => {{
            window.removeEventListener('scrollend', onScrollEnd);
            resolve();
        }};
        window.addEventListener('scrollend', onScrollEnd);
        window.scrollTo({{
            top: document.body.scrollHeight,
            behavior: 'smooth'
        }});
        setTimeout(() => {{
            window.removeEventListener('scrollend', onScrollEnd);
            resolve();
        }}, 2000);
    }}
}});
"""

    # JS expression: current vertical scroll offset, falling back from
    # window.scrollY to window.pageYOffset and finally to 0.
    GET_SCROLL_Y = 'window.scrollY || window.pageYOffset || 0'

    # JS IIFE (single braces, so this string is not a str.format() template):
    # returns how far the window can still scroll down, computed as
    # max(body.scrollHeight, documentElement.scrollHeight) - innerHeight -
    # current scroll offset, clamped at 0.
    GET_REMAINING_SCROLL_TO_BOTTOM = """
(function() {
    const scrollHeight = Math.max(
        document.body.scrollHeight,
        document.documentElement.scrollHeight
    );
    const clientHeight = window.innerHeight;
    const scrollTop = window.scrollY || window.pageYOffset || 0;
    return Math.max(0, scrollHeight - clientHeight - scrollTop);
})()
"""

    # JS expression: JSON string of `[x, y]` for the centre of the viewport
    # (half of window.innerWidth and half of window.innerHeight).
    GET_VIEWPORT_CENTER = 'JSON.stringify([window.innerWidth / 2, window.innerHeight / 2])'

    # JS function source (single braces, so not a str.format() template). It
    # reads the target element from `this` and the text from `arguments[0]`.
    #   * INPUT / TEXTAREA: splices the text into `value` between the selection
    #     bounds, places the caret after the inserted text, then dispatches
    #     bubbling 'input' and 'change' events.
    #   * contenteditable: focuses the element, replaces the first selection
    #     range with a text node, collapses the selection after it and
    #     dispatches a bubbling 'input' event.
    # Returns true when one of the two branches handled the element, false
    # otherwise.
    # NOTE(review): `el.selectionStart || el.value.length` treats a caret at
    # index 0 the same as a missing selection, so text is appended at the end
    # in that case. A null-aware fallback would insert at index 0 instead —
    # confirm which behaviour callers expect before changing.
    # NOTE(review): `selection.getRangeAt(0)` throws when the selection has no
    # ranges; the code assumes focus() always yields one.
    INSERT_TEXT = """
    function() {
        const el = this;
        const text = arguments[0];

        // Standard input/textarea
        if (el.tagName === 'INPUT' || el.tagName === 'TEXTAREA') {
            const start = el.selectionStart || el.value.length;
            const end = el.selectionEnd || el.value.length;
            const before = el.value.substring(0, start);
            const after = el.value.substring(end);
            el.value = before + text + after;
            el.selectionStart = el.selectionEnd = start + text.length;
            el.dispatchEvent(new Event('input', { bubbles: true }));
            el.dispatchEvent(new Event('change', { bubbles: true }));
            return true;
        }

        // ContentEditable elements
        if (el.isContentEditable) {
            el.focus();
            const selection = window.getSelection();
            const range = selection.getRangeAt(0);
            range.deleteContents();
            const textNode = document.createTextNode(text);
            range.insertNode(textNode);
            range.setStartAfter(textNode);
            range.setEndAfter(textNode);
            selection.removeAllRanges();
            selection.addRange(range);
            el.dispatchEvent(new Event('input', { bubbles: true }));
            return true;
        }

        return false;
    }
    """

    # JS function source (single braces, so not a str.format() template) that
    # empties the element bound to `this`.
    #   * INPUT / TEXTAREA: sets `value` to '' and dispatches bubbling 'input'
    #     and 'change' events.
    #   * contenteditable: focuses the element, sets `innerHTML` to '' and
    #     dispatches a bubbling 'input' event.
    # Returns true when one of the two branches handled the element, false
    # otherwise.
    CLEAR_INPUT = """
    function() {
        const el = this;

        // Standard input/textarea
        if (el.tagName === 'INPUT' || el.tagName === 'TEXTAREA') {
            el.value = '';
            el.dispatchEvent(new Event('input', { bubbles: true }));
            el.dispatchEvent(new Event('change', { bubbles: true }));
            return true;
        }

        // ContentEditable elements
        if (el.isContentEditable) {
            el.focus();
            el.innerHTML = '';
            el.dispatchEvent(new Event('input', { bubbles: true }));
            return true;
        }

        return false;
    }
    """

    # JS function source (single braces, so not a str.format() template) that
    # reports whether the element bound to `this` accepts text.
    #   * INPUT / TEXTAREA: true unless `disabled` or `readOnly` is set.
    #   * anything else: true when the element or any ancestor reached through
    #     `parentElement` reports `isContentEditable`; false otherwise.
    IS_EDITABLE = """
    function() {
        const el = this;

        // Check standard input elements
        if (el.tagName === 'INPUT' || el.tagName === 'TEXTAREA') {
            return !el.disabled && !el.readOnly;
        }

        // Check contenteditable (including inherited)
        let current = el;
        while (current) {
            if (current.isContentEditable) {
                return true;
            }
            current = current.parentElement;
        }

        return false;
    }
    """

    # JS function source (single braces, so not a str.format() template):
    # returns true only when `this` is set, has a tagName, and that tagName
    # lower-cases to 'option'; the `!!` coerces the result to a boolean.
    IS_OPTION_TAG = """
    function() {
        return !!(this && this.tagName && this.tagName.toLowerCase() === 'option');
    }
    """


class Key(tuple[str, int], Enum):
    """
    Keyboard keys expressed as ``(name, code)`` pairs.

    Every member is itself a ``(str, int)`` tuple (the enum mixes in
    ``tuple[str, int]``), so it can be unpacked directly:
    ``name, code = Key.ENTER``.

    For letters and digits the integer equals the ``keycode`` column of
    ``CHAR_TO_KEY_INFO`` (for example 65 for ``A`` and 48 for ``0``), i.e. it
    looks like the legacy ``KeyboardEvent.keyCode`` / virtual-key code.
    """

    # NOTE(review): some names differ from the `code` strings that
    # CHAR_TO_KEY_INFO uses for the same number ('EqualSign' vs 'Equal' for 187,
    # 'GraveAccent' vs 'Backquote' for 192) — confirm what consumers expect
    # before relying on the string half of these members.

    # Control, navigation and editing keys
    BACKSPACE = ('Backspace', 8)
    TAB = ('Tab', 9)
    ENTER = ('Enter', 13)
    SHIFT = ('Shift', 16)
    CONTROL = ('Control', 17)
    ALT = ('Alt', 18)
    PAUSE = ('Pause', 19)
    CAPSLOCK = ('CapsLock', 20)
    ESCAPE = ('Escape', 27)
    SPACE = ('Space', 32)
    PAGEUP = ('PageUp', 33)
    PAGEDOWN = ('PageDown', 34)
    END = ('End', 35)
    HOME = ('Home', 36)
    ARROWLEFT = ('ArrowLeft', 37)
    ARROWUP = ('ArrowUp', 38)
    ARROWRIGHT = ('ArrowRight', 39)
    ARROWDOWN = ('ArrowDown', 40)
    PRINTSCREEN = ('PrintScreen', 44)
    INSERT = ('Insert', 45)
    DELETE = ('Delete', 46)

    # Digit row
    DIGIT0 = ('0', 48)
    DIGIT1 = ('1', 49)
    DIGIT2 = ('2', 50)
    DIGIT3 = ('3', 51)
    DIGIT4 = ('4', 52)
    DIGIT5 = ('5', 53)
    DIGIT6 = ('6', 54)
    DIGIT7 = ('7', 55)
    DIGIT8 = ('8', 56)
    DIGIT9 = ('9', 57)

    # Letters (the name half is the upper-case letter)
    A = ('A', 65)
    B = ('B', 66)
    C = ('C', 67)
    D = ('D', 68)
    E = ('E', 69)
    F = ('F', 70)
    G = ('G', 71)
    H = ('H', 72)
    I = ('I', 73)  # noqa: E741
    J = ('J', 74)
    K = ('K', 75)
    L = ('L', 76)
    M = ('M', 77)
    N = ('N', 78)
    O = ('O', 79)  # noqa: E741
    P = ('P', 80)
    Q = ('Q', 81)
    R = ('R', 82)
    S = ('S', 83)
    T = ('T', 84)
    U = ('U', 85)
    V = ('V', 86)
    W = ('W', 87)
    X = ('X', 88)
    Y = ('Y', 89)
    Z = ('Z', 90)

    # Meta and context-menu keys
    META = ('Meta', 91)
    METARIGHT = ('MetaRight', 92)
    CONTEXTMENU = ('ContextMenu', 93)

    # Numeric keypad (no member is defined for code 108)
    NUMPAD0 = ('Numpad0', 96)
    NUMPAD1 = ('Numpad1', 97)
    NUMPAD2 = ('Numpad2', 98)
    NUMPAD3 = ('Numpad3', 99)
    NUMPAD4 = ('Numpad4', 100)
    NUMPAD5 = ('Numpad5', 101)
    NUMPAD6 = ('Numpad6', 102)
    NUMPAD7 = ('Numpad7', 103)
    NUMPAD8 = ('Numpad8', 104)
    NUMPAD9 = ('Numpad9', 105)
    NUMPADMULTIPLY = ('NumpadMultiply', 106)
    NUMPADADD = ('NumpadAdd', 107)
    NUMPADSUBTRACT = ('NumpadSubtract', 109)
    NUMPADDECIMAL = ('NumpadDecimal', 110)
    NUMPADDIVIDE = ('NumpadDivide', 111)

    # Function keys
    F1 = ('F1', 112)
    F2 = ('F2', 113)
    F3 = ('F3', 114)
    F4 = ('F4', 115)
    F5 = ('F5', 116)
    F6 = ('F6', 117)
    F7 = ('F7', 118)
    F8 = ('F8', 119)
    F9 = ('F9', 120)
    F10 = ('F10', 121)
    F11 = ('F11', 122)
    F12 = ('F12', 123)

    # Lock keys
    NUMLOCK = ('NumLock', 144)
    SCROLLLOCK = ('ScrollLock', 145)

    # Punctuation keys
    SEMICOLON = ('Semicolon', 186)
    EQUALSIGN = ('EqualSign', 187)
    COMMA = ('Comma', 188)
    MINUS = ('Minus', 189)
    PERIOD = ('Period', 190)
    SLASH = ('Slash', 191)
    GRAVEACCENT = ('GraveAccent', 192)
    BRACKETLEFT = ('BracketLeft', 219)
    BACKSLASH = ('Backslash', 220)
    BRACKETRIGHT = ('BracketRight', 221)
    QUOTE = ('Quote', 222)

class BrowserType(Enum):
    """Identifies a browser flavour: Chrome or Edge."""

    # auto() assigns consecutive integers starting at 1; the numeric values
    # carry no meaning of their own, so compare members rather than values.
    CHROME = auto()
    EDGE = auto()


class TypoType(str, Enum):
    """Types of realistic typing errors."""

    # Members are plain strings as well (the enum mixes in ``str``), so they
    # compare equal to their literal value, e.g. TypoType.SKIP == 'skip'.
    # The per-member meanings below are inferred from the names only; the code
    # that consumes them is outside this chunk — TODO confirm.
    ADJACENT = 'adjacent'  # presumably a neighbouring key hit instead (cf. QWERTY_NEIGHBORS)
    TRANSPOSE = 'transpose'  # presumably two consecutive characters swapped
    DOUBLE = 'double'  # presumably a character typed twice
    SKIP = 'skip'  # presumably a character left out
    MISSED_SPACE = 'missed_space'  # presumably a space left out between words


# Default typo probability (0.02, i.e. 2%). Presumably the per-character chance
# of injecting one of the TypoType errors while typing; the consumer is outside
# this chunk — TODO confirm the exact unit.
DEFAULT_TYPO_PROBABILITY = 0.02


# Mapping from typeable character to (key, code, keycode).
# key:     DOM KeyboardEvent.key value
# code:    DOM KeyboardEvent.code (physical key on US QWERTY)
# keycode: legacy KeyboardEvent.keyCode / virtual key code
#
# Lowercase and uppercase letters share the same code/keycode; only `key` differs.
# Shifted symbol variants (e.g. '!' from '1') use the base key's code/keycode.
#
# Coverage is limited to the characters listed below (ASCII letters, digits,
# US-layout punctuation, space, newline and tab). Any other character is absent
# from the dict, so a plain `CHAR_TO_KEY_INFO[ch]` lookup raises KeyError.
# The table records no modifier state: whether Shift is needed for a character
# is not stored here.
CHAR_TO_KEY_INFO: dict[str, tuple[str, str, int]] = {
    # Letters (lowercase)
    'a': ('a', 'KeyA', 65),
    'b': ('b', 'KeyB', 66),
    'c': ('c', 'KeyC', 67),
    'd': ('d', 'KeyD', 68),
    'e': ('e', 'KeyE', 69),
    'f': ('f', 'KeyF', 70),
    'g': ('g', 'KeyG', 71),
    'h': ('h', 'KeyH', 72),
    'i': ('i', 'KeyI', 73),
    'j': ('j', 'KeyJ', 74),
    'k': ('k', 'KeyK', 75),
    'l': ('l', 'KeyL', 76),
    'm': ('m', 'KeyM', 77),
    'n': ('n', 'KeyN', 78),
    'o': ('o', 'KeyO', 79),
    'p': ('p', 'KeyP', 80),
    'q': ('q', 'KeyQ', 81),
    'r': ('r', 'KeyR', 82),
    's': ('s', 'KeyS', 83),
    't': ('t', 'KeyT', 84),
    'u': ('u', 'KeyU', 85),
    'v': ('v', 'KeyV', 86),
    'w': ('w', 'KeyW', 87),
    'x': ('x', 'KeyX', 88),
    'y': ('y', 'KeyY', 89),
    'z': ('z', 'KeyZ', 90),
    # Letters (uppercase)
    'A': ('A', 'KeyA', 65),
    'B': ('B', 'KeyB', 66),
    'C': ('C', 'KeyC', 67),
    'D': ('D', 'KeyD', 68),
    'E': ('E', 'KeyE', 69),
    'F': ('F', 'KeyF', 70),
    'G': ('G', 'KeyG', 71),
    'H': ('H', 'KeyH', 72),
    'I': ('I', 'KeyI', 73),
    'J': ('J', 'KeyJ', 74),
    'K': ('K', 'KeyK', 75),
    'L': ('L', 'KeyL', 76),
    'M': ('M', 'KeyM', 77),
    'N': ('N', 'KeyN', 78),
    'O': ('O', 'KeyO', 79),
    'P': ('P', 'KeyP', 80),
    'Q': ('Q', 'KeyQ', 81),
    'R': ('R', 'KeyR', 82),
    'S': ('S', 'KeyS', 83),
    'T': ('T', 'KeyT', 84),
    'U': ('U', 'KeyU', 85),
    'V': ('V', 'KeyV', 86),
    'W': ('W', 'KeyW', 87),
    'X': ('X', 'KeyX', 88),
    'Y': ('Y', 'KeyY', 89),
    'Z': ('Z', 'KeyZ', 90),
    # Digits
    '0': ('0', 'Digit0', 48),
    '1': ('1', 'Digit1', 49),
    '2': ('2', 'Digit2', 50),
    '3': ('3', 'Digit3', 51),
    '4': ('4', 'Digit4', 52),
    '5': ('5', 'Digit5', 53),
    '6': ('6', 'Digit6', 54),
    '7': ('7', 'Digit7', 55),
    '8': ('8', 'Digit8', 56),
    '9': ('9', 'Digit9', 57),
    # Shifted digits (symbols on number row)
    ')': (')', 'Digit0', 48),
    '!': ('!', 'Digit1', 49),
    '@': ('@', 'Digit2', 50),
    '#': ('#', 'Digit3', 51),
    '$': ('$', 'Digit4', 52),
    '%': ('%', 'Digit5', 53),
    '^': ('^', 'Digit6', 54),
    '&': ('&', 'Digit7', 55),
    '*': ('*', 'Digit8', 56),
    '(': ('(', 'Digit9', 57),
    # Punctuation and symbols (unshifted)
    ' ': (' ', 'Space', 32),
    '-': ('-', 'Minus', 189),
    '=': ('=', 'Equal', 187),
    '[': ('[', 'BracketLeft', 219),
    ']': (']', 'BracketRight', 221),
    '\\': ('\\', 'Backslash', 220),
    ';': (';', 'Semicolon', 186),
    "'": ("'", 'Quote', 222),
    '`': ('`', 'Backquote', 192),
    ',': (',', 'Comma', 188),
    '.': ('.', 'Period', 190),
    '/': ('/', 'Slash', 191),
    # Punctuation and symbols (shifted)
    '_': ('_', 'Minus', 189),
    '+': ('+', 'Equal', 187),
    '{': ('{', 'BracketLeft', 219),
    '}': ('}', 'BracketRight', 221),
    '|': ('|', 'Backslash', 220),
    ':': (':', 'Semicolon', 186),
    '"': ('"', 'Quote', 222),
    '~': ('~', 'Backquote', 192),
    '<': ('<', 'Comma', 188),
    '>': ('>', 'Period', 190),
    '?': ('?', 'Slash', 191),
    # Whitespace
    '\n': ('Enter', 'Enter', 13),
    '\t': ('Tab', 'Tab', 9),
}


# Adjacency table: maps a character to the characters treated as its
# neighbouring keys. Keys are the unshifted digits, lower-case letters, a subset
# of punctuation and the space character; upper-case letters, shifted symbols
# and characters such as '`' and '\\' have no entry.
# The relation is not fully symmetric: ' ' lists 'c', 'v', 'b', 'n', 'm' as
# neighbours, but none of those letters lists ' ' back.
# Presumably consumed when generating TypoType.ADJACENT typos — the consumer is
# outside this chunk, TODO confirm.
QWERTY_NEIGHBORS: dict[str, list[str]] = {
    '1': ['2', 'q'],
    '2': ['1', '3', 'q', 'w'],
    '3': ['2', '4', 'w', 'e'],
    '4': ['3', '5', 'e', 'r'],
    '5': ['4', '6', 'r', 't'],
    '6': ['5', '7', 't', 'y'],
    '7': ['6', '8', 'y', 'u'],
    '8': ['7', '9', 'u', 'i'],
    '9': ['8', '0', 'i', 'o'],
    '0': ['9', '-', 'o', 'p'],
    '-': ['0', '=', 'p', '['],
    '=': ['-', '[', ']'],
    'q': ['1', '2', 'w', 'a', 's'],
    'w': ['q', '2', '3', 'e', 'a', 's', 'd'],
    'e': ['w', '3', '4', 'r', 's', 'd', 'f'],
    'r': ['e', '4', '5', 't', 'd', 'f', 'g'],
    't': ['r', '5', '6', 'y', 'f', 'g', 'h'],
    'y': ['t', '6', '7', 'u', 'g', 'h', 'j'],
    'u': ['y', '7', '8', 'i', 'h', 'j', 'k'],
    'i': ['u', '8', '9', 'o', 'j', 'k', 'l'],
    'o': ['i', '9', '0', 'p', 'k', 'l', ';'],
    'p': ['o', '0', '-', '[', 'l', ';', "'"],
    '[': ['p', '-', '=', ']', ';', "'"],
    ']': ['[', '=', "'"],
    'a': ['q', 'w', 's', 'z', 'x'],
    's': ['q', 'w', 'e', 'a', 'd', 'z', 'x', 'c'],
    'd': ['w', 'e', 'r', 's', 'f', 'x', 'c', 'v'],
    'f': ['e', 'r', 't', 'd', 'g', 'c', 'v', 'b'],
    'g': ['r', 't', 'y', 'f', 'h', 'v', 'b', 'n'],
    'h': ['t', 'y', 'u', 'g', 'j', 'b', 'n', 'm'],
    'j': ['y', 'u', 'i', 'h', 'k', 'n', 'm', ','],
    'k': ['u', 'i', 'o', 'j', 'l', 'm', ',', '.'],
    'l': ['i', 'o', 'p', 'k', ';', ',', '.', '/'],
    ';': ['o', 'p', '[', 'l', "'", '.', '/'],
    "'": ['p', '[', ']', ';', '/'],
    'z': ['a', 's', 'x'],
    'x': ['z', 'a', 's', 'd', 'c'],
    'c': ['x', 's', 'd', 'f', 'v'],
    'v': ['c', 'd', 'f', 'g', 'b'],
    'b': ['v', 'f', 'g', 'h', 'n'],
    'n': ['b', 'g', 'h', 'j', 'm'],
    'm': ['n', 'h', 'j', 'k', ','],
    ',': ['m', 'j', 'k', 'l', '.'],
    '.': [',', 'k', 'l', ';', '/'],
    '/': ['.', 'l', ';', "'"],
    ' ': ['c', 'v', 'b', 'n', 'm'],
}


================================================
FILE: pydoll/decorators.py
================================================
import asyncio
import inspect
import logging
import traceback
from functools import wraps
from typing import Any, Callable, Coroutine, List, Optional, Type, TypeVar, Union

logger = logging.getLogger(__name__)

T = TypeVar('T')


class RetryConfig:
    """
    Retry policy: how often to retry, on which exceptions, and how to wait.

    The instance only stores settings and offers small helpers (delay
    computation, callback invocation, exception matching); the retry loop
    itself lives in the code that uses this object.
    """

    # Substrings of the TypeError raised when the callback was called with one
    # positional argument more than it accepts (bound method / zero-arg function).
    _ARITY_MISMATCH_MARKERS = (
        'takes 1 positional argument but 2 were given',
        'takes 0 positional arguments but 1 was given',
    )

    def __init__(
        self,
        max_retries: int = 5,
        exceptions: Union[Type[Exception], List[Type[Exception]]] = Exception,
        on_retry: Optional[Callable] = None,
        delay: float = 0,
        exponential_backoff: bool = False,
    ):
        """
        Store the retry settings.

        Args:
            max_retries: Number of retries allowed after the first attempt.
            exceptions: Exception type, or list/tuple of types, that qualifies
                for a retry.
            on_retry: Optional callback invoked between attempts. It may be a
                coroutine function or a plain function, and may accept either
                the caller instance or no argument at all.
            delay: Base delay in seconds between attempts (0 disables waiting).
            exponential_backoff: If True, the delay is multiplied by
                ``2 ** attempt``.
        """
        self.max_retries = max_retries
        self.exceptions = exceptions
        self.on_retry = on_retry
        self.delay = delay
        self.exponential_backoff = exponential_backoff

    def calculate_delay(self, attempt: int) -> float:
        """
        Return the number of seconds to wait before the given attempt.

        Args:
            attempt: Attempt number used as the exponent when exponential
                backoff is enabled.

        Returns:
            0 when no delay is configured, ``delay * 2 ** attempt`` with
            exponential backoff, otherwise ``delay``.
        """
        if not self.delay:
            return 0
        multiplier = 2**attempt if self.exponential_backoff else 1
        return self.delay * multiplier

    @staticmethod
    async def _run_callback(callback: Callable[..., Any], *args: Any) -> None:
        """Call ``callback(*args)`` and await the result only if it is awaitable."""
        outcome = callback(*args)
        # A plain (synchronous) callback has already run at this point; only
        # coroutine functions and other awaitable-returning callables need an await.
        if inspect.isawaitable(outcome):
            await outcome

    async def call_callback(self, caller_instance: Any) -> None:
        """
        Invoke the ``on_retry`` callback, if one is configured.

        The callback is first called with ``caller_instance``. If that fails
        with a TypeError whose message indicates one positional argument too
        many, it is called again without arguments. Any other exception
        propagates unchanged.

        Args:
            caller_instance: Object passed to the callback as its single
                positional argument.
        """
        callback = self.on_retry
        if not callback:
            return

        try:
            await self._run_callback(callback, caller_instance)
        except TypeError as e:
            error_msg = str(e)
            if not any(marker in error_msg for marker in self._ARITY_MISMATCH_MARKERS):
                raise
            # The callback does not accept the caller instance: retry bare.
            await self._run_callback(callback)

    async def handle_delay(self, attempt: int) -> None:
        """
        Wait for delay.

        Args:
            attempt (int): The current attempt number
        """
        wait_time = self.calculate_delay(attempt)
        if wait_time:
            await asyncio.sleep(wait_time)

    def is_matching_exception(self, exc: Exception) -> bool:
        """
        Tell whether ``exc`` is an instance of one of the configured types.

        Args:
            exc: The exception raised by the wrapped call.

        Returns:
            True if ``exc`` matches ``exceptions`` (a single type or any entry
            of a list/tuple); an empty list/tuple never matches.
        """
        expected = self.exceptions
        if isinstance(expected, (list, tuple)):
            return isinstance(exc, tuple(expected))
        return isinstance(exc, expected)


def retry(
    max_retries: int = 5,
    exceptions: Union[Type[Exception], List[Type[Exception]]] = Exception,
    on_retry: Optional[Callable] = None,
    delay: float = 0,
    exponential_backoff: bool = False,
    exception_to_raise: Optional[Exception] = None,
):
    """
    Decorator that re-runs a coroutine function when it raises.

    The decorated function is awaited up to ``max_retries + 1`` times. An
    exception that does not match ``exceptions`` is re-raised immediately.
    After a matching failure that still has retries left, the decorator first
    waits (see ``delay``) and then invokes ``on_retry``.
    For greater control, it is a good practice to specify the exceptions that
    should be handled.

    Args:
        max_retries (int): Maximum number of retries after the first attempt.
        exceptions (Union[Type[Exception], List[Type[Exception]]]): Exception types that should be
            handled
        on_retry (Optional[Callable], optional): Function called after each failed attempt that
            will be retried. It receives the first positional argument of the decorated call
            (``self`` for methods), or ``None`` when there is none.
        delay (float): Delay between attempts in seconds
        exponential_backoff (bool): If True, increase the delay exponentially. The wait before
            retry number ``k`` (1-based) is ``delay * 2 ** k``.
        exception_to_raise (Optional[Exception]): Exception raised instead of the last caught one
            once every attempt has failed; the last caught exception is attached as its cause.

    Raises:
        Exception: The last matching exception (or ``exception_to_raise``) when all attempts
            fail, or any non-matching exception right away.

    Usage:
        @retry(
            max_retries=3,
            exceptions=[ValueError, TypeError],
            delay=1
        )
        async def my_function():
            ...
    """
    config = RetryConfig(
        max_retries=max_retries,
        exceptions=exceptions,
        on_retry=on_retry,
        delay=delay,
        exponential_backoff=exponential_backoff,
    )

    def decorator(
        func: Callable[..., Coroutine[Any, Any, T]],
    ) -> Callable[..., Coroutine[Any, Any, T]]:
        @wraps(func)
        async def wrapper(*args: Any, **kwargs: Any) -> T:
            last_exception: Optional[Exception] = None
            # For methods this is `self`; it is handed to the on_retry callback.
            caller_instance = args[0] if args else None

            for attempt in range(config.max_retries + 1):
                try:
                    return await func(*args, **kwargs)
                except Exception as exc:
                    logger.error(
                        f'Error trying to execute the function {func.__name__}: '
                        f'{traceback.format_exc()}'
                    )
                    if not config.is_matching_exception(exc):
                        raise

                    last_exception = exc

                    # No waiting or callback after the final attempt.
                    if attempt < config.max_retries:
                        await config.handle_delay(attempt + 1)
                        await config.call_callback(caller_instance)

            if last_exception is None:
                # Only reachable when the loop body never ran (negative max_retries).
                raise RuntimeError('Unreachable: all retries exhausted without exception')

            if exception_to_raise:
                # Keep the real failure visible as __cause__ of the substitute.
                raise exception_to_raise from last_exception
            raise last_exception

        return wrapper

    return decorator


================================================
FILE: pydoll/elements/__init__.py
================================================


================================================
FILE: pydoll/elements/mixins/__init__.py
================================================
from pydoll.elements.mixins.find_elements_mixin import FindElementsMixin

__all__ = [
    'FindElementsMixin',
]


================================================
FILE: pydoll/elements/mixins/find_elements_mixin.py
================================================
from __future__ import annotations

import asyncio
import logging
from typing import TYPE_CHECKING, Optional, Union, cast, overload

from pydoll.commands import (
    DomCommands,
    RuntimeCommands,
)
from pydoll.connection.connection_handler import ConnectionHandler
from pydoll.constants import By, Scripts
from pydoll.elements.utils import SelectorParser
from pydoll.exceptions import ElementNotFound, WaitElementTimeout

if TYPE_CHECKING:
    from typing import Literal, Optional, Union

    from pydoll.elements.web_element import WebElement
    from pydoll.interactions.iframe import IFrameContext
    from pydoll.protocol.base import Command, T_CommandParams, T_CommandResponse
    from pydoll.protocol.dom.methods import DescribeNodeResponse
    from pydoll.protocol.dom.types import Node
    from pydoll.protocol.runtime.methods import (
        CallFunctionOnParams,
        CallFunctionOnResponse,
        EvaluateParams,
        EvaluateResponse,
        GetPropertiesResponse,
    )


logger = logging.getLogger(__name__)


def create_web_element(*args, **kwargs):
    """
    Build a WebElement without importing it at module load time.

    The WebElement class is imported inside the function, on every call, so
    that this module and ``pydoll.elements.web_element`` can depend on each
    other without a circular import. All positional and keyword arguments are
    forwarded unchanged to the WebElement constructor.
    """
    from pydoll.elements.web_element import WebElement as element_cls  # noqa: PLC0415

    new_element = element_cls(*args, **kwargs)
    return new_element


class FindElementsMixin:
    """
    Mixin providing comprehensive element finding and waiting capabilities.

    Implements DOM element location using various selector strategies (CSS, XPath, etc.)
    with support for single/multiple element finding and configurable waiting.
    Classes using this mixin gain powerful element discovery without implementing
    complex location logic themselves.
    """

    _css_only: bool = False

    if TYPE_CHECKING:
        _connection_handler: ConnectionHandler

    @staticmethod
    def _build_text_expression(selector: str, method: str) -> Optional[str]:
        """
        Build JS expression using Scripts to extract textContent based on selector type.

        Thin wrapper: the work is delegated to
        ``SelectorParser.build_text_expression`` and its result is returned
        unchanged.

        Args:
            selector: Selector string forwarded to the parser.
            method: Selector strategy forwarded to the parser.

        Returns:
            Whatever the parser returns; per the annotation, a string or None.
        """
        return SelectorParser.build_text_expression(selector, method)

    # Typing-only overloads for find(): they let a type checker narrow the
    # return type from the literal values of `find_all` and `raise_exc`.
    # The defaults written in these stubs exist for overload matching only; the
    # runtime defaults are those of the implementation that follows.

    # Single element, raising when nothing is found -> WebElement.
    @overload
    async def find(
        self,
        id: Optional[str] = ...,
        class_name: Optional[str] = ...,
        name: Optional[str] = ...,
        tag_name: Optional[str] = ...,
        text: Optional[str] = ...,
        timeout: int = ...,
        find_all: Literal[False] = False,
        raise_exc: Literal[True] = True,
        **attributes,
    ) -> WebElement: ...

    # Single element, not raising -> WebElement or None.
    @overload
    async def find(
        self,
        id: Optional[str] = ...,
        class_name: Optional[str] = ...,
        name: Optional[str] = ...,
        tag_name: Optional[str] = ...,
        text: Optional[str] = ...,
        timeout: int = ...,
        find_all: Literal[False] = False,
        raise_exc: Literal[False] = False,
        **attributes,
    ) -> Optional[WebElement]: ...

    # All matches, raising when nothing is found -> list of WebElement.
    @overload
    async def find(
        self,
        id: Optional[str] = ...,
        class_name: Optional[str] = ...,
        name: Optional[str] = ...,
        tag_name: Optional[str] = ...,
        text: Optional[str] = ...,
        timeout: int = ...,
        find_all: Literal[True] = True,
        raise_exc: Literal[True] = True,
        **attributes,
    ) -> list[WebElement]: ...

    # All matches, not raising -> list of WebElement or None.
    @overload
    async def find(
        self,
        id: Optional[str] = ...,
        class_name: Optional[str] = ...,
        name: Optional[str] = ...,
        tag_name: Optional[str] = ...,
        text: Optional[str] = ...,
        timeout: int = ...,
        find_all: bool = ...,
        raise_exc: bool = ...,
        **attributes,
    ) -> Union[WebElement, list[WebElement], None]: ...

    async def find(
        self,
        id: Optional[str] = None,
        class_name: Optional[str] = None,
        name: Optional[str] = None,
        tag_name: Optional[str] = None,
        text: Optional[str] = None,
        timeout: int = 0,
        find_all: bool = False,
        raise_exc: bool = True,
        **attributes: dict[str, str],
    ) -> Union[WebElement, list[WebElement], None]:
        """
        Find element(s) using combination of common HTML attributes.

        Flexible element location using standard attributes. Multiple attributes
        can be combined for specific selectors (builds XPath when multiple specified).

        Args:
            id: Element ID attribute value.
            class_name: CSS class name to match.
            name: Element name attribute value.
            tag_name: HTML tag name (e.g., "div", "input").
            text: Text content to match within element.
            timeout: Maximum seconds to wait for elements to appear.
            find_all: If True, returns all matches; if False, first match only.
            raise_exc: Whether to raise exception if no elements found.
            **attributes: Additional HTML attributes to match.

        Returns:
            WebElement, list[WebElement], or None based on find_all and raise_exc.

        Raises:
            ValueError: If no search criteria provided.
            ElementNotFound: If no elements found and raise_exc=True.
            WaitElementTimeout: If timeout specified and no elements appear in time.
            NotImplementedError: If called on a ShadowRoot (use query() with CSS instead).
        """
        if self._css_only:
            raise NotImplementedError(
                'find() is not supported on ShadowRoot. Use query() with a CSS selector instead.'
            )

        logger.debug(
            f'find() called with id={id}, class_name={class_name}, name={name}, '
            f'tag_name={tag_name}, text={text}, timeout={timeout}, '
            f'find_all={find_all}, raise_exc={raise_exc}, attrs={attributes}'
        )
        if not any([id, class_name, name, tag_name, text, *attributes.keys()]):
            raise ValueError(
                'At least one of the following arguments must be provided: id, '
                'class_name, name, tag_name, text'
            )

        by_map = {
            'id': By.ID,
            'class_name': By.CLASS_NAME,
            'name': By.NAME,
            'tag_name': By.TAG_NAME,
            'xpath': By.XPATH,
        }
        by, value = self._get_by_and_value(
            by_map, id, class_name, name, tag_name, text, **attributes
        )
        logger.debug(f'find() resolved to by={by} value={value}')
        return await self.find_or_wait_element(
            by, value, timeout=timeout, find_all=find_all, raise_exc=raise_exc
        )

    # Typing-only overloads for query(): they let a type checker narrow the
    # return type from the literal values of `find_all` and `raise_exc`.
    # The defaults written in these stubs exist for overload matching only; the
    # runtime defaults are those of the implementation that follows.

    # Single element, raising when nothing is found -> WebElement.
    @overload
    async def query(
        self,
        expression: str,
        timeout: int = ...,
        find_all: Literal[False] = False,
        raise_exc: Literal[True] = True,
    ) -> WebElement: ...

    # Single element, not raising -> WebElement or None.
    @overload
    async def query(
        self,
        expression: str,
        timeout: int = ...,
        find_all: Literal[False] = False,
        raise_exc: Literal[False] = False,
    ) -> Optional[WebElement]: ...

    # All matches, raising when nothing is found -> list of WebElement.
    @overload
    async def query(
        self,
        expression: str,
        timeout: int = ...,
        find_all: Literal[True] = True,
        raise_exc: Literal[True] = True,
    ) -> list[WebElement]: ...

    # All matches, not raising -> list of WebElement or None.
    @overload
    async def query(
        self,
        expression: str,
        timeout: int = ...,
        find_all: Literal[True] = True,
        raise_exc: Literal[False] = False,
    ) -> Optional[list[WebElement]]: ...

    # Catch-all for non-literal flags -> any of the above.
    @overload
    async def query(
        self,
        expression: str,
        timeout: int = ...,
        find_all: bool = ...,
        raise_exc: bool = ...,
    ) -> Union[WebElement, list[WebElement], None]: ...

    async def query(
        self, expression: str, timeout: int = 0, find_all: bool = False, raise_exc: bool = True
    ) -> Union[WebElement, list[WebElement], None]:
        """
        Locate element(s) from a raw CSS selector or XPath expression.

        The selector strategy is derived from the expression itself via
        ``_get_expression_type``; the search is then delegated to
        ``find_or_wait_element``.

        Args:
            expression: Selector expression (CSS, XPath, ID with #, class with .).
            timeout: Maximum seconds to wait for elements to appear.
            find_all: If True, returns all matches; if False, first match only.
            raise_exc: Whether to raise exception if no elements found.

        Returns:
            WebElement, list[WebElement], or None based on find_all and raise_exc.

        Raises:
            ElementNotFound: If no elements found and raise_exc=True.
            WaitElementTimeout: If timeout specified and no elements appear in time.
            NotImplementedError: If called with XPath on a ShadowRoot.
        """
        # The expression type is only inspected here when the scope is CSS-only.
        xpath_on_css_only_scope = (
            self._css_only and self._get_expression_type(expression) == By.XPATH
        )
        if xpath_on_css_only_scope:
            raise NotImplementedError(
                'XPath is not supported on ShadowRoot. Use a CSS selector instead.'
            )

        logger.debug(
            f'query() called with expression={expression}, timeout={timeout}, '
            f'find_all={find_all}, raise_exc={raise_exc}'
        )
        selector_kind = self._get_expression_type(expression)
        logger.debug(f'query() resolved to by={selector_kind}')

        search = self.find_or_wait_element(
            by=selector_kind,
            value=expression,
            timeout=timeout,
            find_all=find_all,
            raise_exc=raise_exc,
        )
        return await search

    async def find_or_wait_element(
        self,
        by: By,
        value: str,
        timeout: int = 0,
        find_all: bool = False,
        raise_exc: bool = True,
    ) -> Union[WebElement, list[WebElement], None]:
        """
        Locate element(s), optionally polling until they appear.

        XPath and CSS selectors are first split into iframe segments; when more
        than one segment results, the search is handed to
        ``_find_across_iframes``. Otherwise a single lookup is made when
        ``timeout`` is falsy, or the lookup is repeated with 0.5s pauses until
        something is found or the timeout is exceeded. This is the shared
        back end of find() and query().

        Args:
            by: Selector strategy (CSS_SELECTOR, XPATH, ID, etc.).
            value: Selector value to locate element(s).
            timeout: Maximum seconds to wait (0 = no waiting).
            find_all: If True, returns all matches; if False, first match only.
            raise_exc: Whether to raise exception if no elements found.

        Returns:
            WebElement, list[WebElement], or None based on find_all and raise_exc.

        Raises:
            ElementNotFound: If no elements found with timeout=0 and raise_exc=True.
            WaitElementTimeout: If elements not found within timeout and raise_exc=True.
        """
        logger.debug(
            f'find_or_wait_element(): by={by}, value={value}, timeout={timeout}, '
            f'find_all={find_all}, raise_exc={raise_exc}'
        )

        # Only XPath and CSS expressions can span iframe boundaries.
        if by == By.XPATH:
            segments = SelectorParser.parse_iframe_segments_xpath(value)
        elif by == By.CSS_SELECTOR:
            segments = SelectorParser.parse_iframe_segments_css(value)
        else:
            segments = [(by, value)]

        if len(segments) > 1:
            return await self._find_across_iframes(segments, timeout, find_all, raise_exc)

        locate = self._find_elements if find_all else self._find_element
        started_at = asyncio.get_event_loop().time()

        if not timeout:
            logger.debug('No timeout specified; performing single attempt')
            return await locate(by, value, raise_exc=raise_exc)

        while True:
            # Lookups never raise while polling; failure is decided by the clock.
            found = await locate(by, value, raise_exc=False)
            if found:
                if isinstance(found, list):
                    summary = f'Found {len(found)} elements within timeout window'
                else:
                    summary = 'Found 1 element within timeout window'
                logger.debug(summary)
                return found

            timed_out = asyncio.get_event_loop().time() - started_at > timeout
            if not timed_out:
                await asyncio.sleep(0.5)
                continue

            if not raise_exc:
                return None

            logger.error('Timeout while waiting for elements')
            raise WaitElementTimeout(
                f'Timed out after {timeout}s waiting for element '
                f'(by={by.value}, value={value!r})'
            )

    async def _find_across_iframes(
        self,
        segments: list[tuple[By, str]],
        timeout: int,
        find_all: bool,
        raise_exc: bool,
    ) -> Union[WebElement, list[WebElement], None]:
        """
        Retry loop for iframe-crossing element searches.

        Repeatedly calls :meth:`_attempt_find_across_iframes` until the target
        element is found or the *timeout* expires.

        Args:
            segments: Ordered ``(By, selector)`` pairs — one per iframe boundary
                plus a final selector for the target element(s).
            timeout: Maximum seconds to wait (0 = single attempt).
            find_all: If ``True``, the last segment uses ``_find_elements``.
            raise_exc: Whether to raise on failure.

        Returns:
            The found element(s), or ``None`` / ``[]`` on failure.

        Raises:
            ElementNotFound: If ``timeout=0``, nothing found, and ``raise_exc=True``.
            WaitElementTimeout: If timeout expires and ``raise_exc=True``.
        """
        start_time = asyncio.get_event_loop().time()
        selector_repr = ' -> '.join(seg for _, seg in segments)

        while True:
            result = await self._attempt_find_across_iframes(segments, find_all)
            if result is not None and result != []:
                return result

            if not timeout:
                if raise_exc:
                    raise ElementNotFound(f'Element not found across iframes: {selector_repr}')
                return [] if find_all else None

            if asyncio.get_event_loop().time() - start_time > timeout:
                if raise_exc:
                    raise WaitElementTimeout(
                        f'Timed out after {timeout}s waiting for element '
                        f'across iframes: {selector_repr}'
                    )
                return [] if find_all else None

            await asyncio.sleep(0.5)

    async def _attempt_find_across_iframes(
        self,
        segments: list[tuple[By, str]],
        find_all: bool,
    ) -> Union[WebElement, list[WebElement], None]:
        """
        Single attempt to walk iframe segments and find the target element.

        For each intermediate segment, finds a single iframe element and uses it
        as the search context for the next segment. The last segment respects
        *find_all*.

        Args:
            segments: Ordered ``(By, selector)`` pairs.
            find_all: Whether the final segment should return all matches.

        Returns:
            Found element(s) or ``None`` / ``[]`` if any intermediate step fails.
        """
        current_context: FindElementsMixin = self
        for i, (by, selector) in enumerate(segments):
            is_last = i == len(segments) - 1
            if is_last:
                if find_all:
                    result = await current_context._find_elements(by, selector, raise_exc=False)
                    return result if result else []
                return await current_context._find_element(by, selector, raise_exc=False)

            element = await current_context._find_element(by, selector, raise_exc=False)
            if not element or not getattr(element, 'is_iframe', False):
                return None
            current_context = element
        return None

    async def _find_element(
        self, by: By, value: str, raise_exc: bool = True
    ) -> Optional[WebElement]:
        """
        Locate the first element matching the selector.

        The search scope depends on what ``self`` is:
        - an iframe element: the iframe's document object and execution context
          (obtained by awaiting ``iframe_context``) are used;
        - an object exposing ``_object_id``: the search is relative to it;
        - anything else: the search is issued without a context object.

        Args:
            by: Selector strategy (CSS_SELECTOR, XPATH, ID, etc.).
            value: Selector value to locate element.
            raise_exc: Whether to raise ElementNotFound if not found.

        Returns:
            WebElement instance, or None if not found and raise_exc=False.

        Raises:
            ElementNotFound: If element not found and raise_exc=True.
        """
        logger.debug(f'_find_element(): by={by}, value={value}, raise_exc={raise_exc}')

        iframe_context = (
            await cast('WebElement', self).iframe_context
            if getattr(self, 'is_iframe', False)
            else None
        )

        if iframe_context:
            command = self._get_find_element_command(
                by,
                value,
                object_id=iframe_context.document_object_id or '',
                execution_context_id=iframe_context.execution_context_id,
            )
        elif not hasattr(self, '_object_id'):
            command = self._get_find_element_command(by, value)
        else:
            command = self._get_find_element_command(by, value, self._object_id)

        response_for_command: Union[
            EvaluateResponse, CallFunctionOnResponse
        ] = await self._execute_command(command)

        found = self._has_object_id_key(response_for_command)
        if not found and raise_exc:
            logger.debug('Element not found and raise_exc=True')
            raise ElementNotFound()
        if not found:
            return None

        object_id = response_for_command['result']['result']['objectId']
        attributes = await self._get_object_attributes(object_id=object_id)
        logger.debug(f'_find_element() found object_id={object_id}')

        element = create_web_element(
            object_id,
            self._connection_handler,
            by,
            value,
            attributes,
            mouse=getattr(self, '_mouse', None),
        )
        # Children inherit the freshly resolved iframe context, or failing that
        # whatever context this object already carries.
        inherited_context = iframe_context or getattr(self, '_iframe_context', None)
        self._apply_iframe_context_to_element(element, inherited_context)
        return element

    async def _find_elements(self, by: By, value: str, raise_exc: bool = True) -> list[WebElement]:
        """
        Locate every element matching the selector.

        The search scope is chosen the same way as for a single element: the
        iframe's document/execution context when ``self`` is an iframe element,
        relative to ``_object_id`` when ``self`` has one, otherwise without a
        context object. The result object returned by the browser is expanded
        with ``Runtime.getProperties`` and each indexed entry is described and
        wrapped in a WebElement.

        Args:
            by: Selector strategy (CSS_SELECTOR, XPATH, ID, etc.).
            value: Selector value to locate elements.
            raise_exc: Whether to raise ElementNotFound if none found.

        Returns:
            list of WebElement instances (empty if none found and raise_exc=False).

        Raises:
            ElementNotFound: If no elements found and raise_exc=True.
        """
        logger.debug(f'_find_elements(): by={by}, value={value}, raise_exc={raise_exc}')

        iframe_context = None
        if getattr(self, 'is_iframe', False):
            iframe_context = await cast('WebElement', self).iframe_context

        if iframe_context:
            command = self._get_find_elements_command(
                by,
                value,
                object_id=iframe_context.document_object_id or '',
                execution_context_id=iframe_context.execution_context_id,
            )
        elif not hasattr(self, '_object_id'):
            command = self._get_find_elements_command(by, value)
        else:
            command = self._get_find_elements_command(by, value, self._object_id)

        response_for_command: Union[
            EvaluateResponse, CallFunctionOnResponse
        ] = await self._execute_command(command)

        collection_id = response_for_command.get('result', {}).get('result', {}).get('objectId')
        if not collection_id:
            if not raise_exc:
                return []
            logger.debug('No elements found and raise_exc=True')
            raise ElementNotFound()

        query_response: GetPropertiesResponse = await self._execute_command(
            RuntimeCommands.get_properties(object_id=collection_id)
        )
        # Only numerically named properties that carry an objectId are
        # collected as element handles.
        node_object_ids: list[str] = [
            prop['value']['objectId']
            for prop in query_response['result']['result']
            if prop['name'].isdigit() and 'objectId' in prop['value']
        ]

        inherited_context = iframe_context or getattr(self, '_iframe_context', None)
        mouse = getattr(self, '_mouse', None)
        elements = []
        for node_object_id in node_object_ids:
            try:
                node_description = await self._describe_node(object_id=node_object_id)
            except KeyError:
                continue

            attributes = node_description.get('attributes', [])
            attributes.extend(['tag_name', node_description.get('nodeName', '').lower()])

            child = create_web_element(
                node_object_id,
                self._connection_handler,
                by,
                value,
                attributes,
                mouse=mouse,
            )
            self._apply_iframe_context_to_element(child, inherited_context)
            elements.append(child)

        logger.debug(f'_find_elements() returning {len(elements)} elements')
        return elements

    async def _get_object_attributes(self, object_id: str) -> list[str]:
        """
        Get attributes of a DOM node.
        """
        node_description = await self._describe_node(object_id=object_id)
        if not node_description:
            # If the node couldn't be described (e.g., object id doesn't reference a Node),
            # return minimal attributes to keep the flow stable.
            return ['tag_name', '']
        attributes = node_description.get('attributes', [])
        tag_name = node_description.get('nodeName', '').lower()
        attributes.extend(['tag_name', tag_name])
        return attributes

    def _get_by_and_value(
        self,
        by_map: dict[str, By],
        id: Optional[str] = None,
        class_name: Optional[str] = None,
        name: Optional[str] = None,
        tag_name: Optional[str] = None,
        text: Optional[str] = None,
        **attributes,
    ) -> tuple[By, str]:
        """
        Translate keyword search criteria into a ``(By, value)`` pair.

        Resolution order:
        1. A non-empty string passed as ``xpath=...`` is used verbatim.
        2. Exactly one of id / class_name / name / tag_name, with no text and
           no extra attributes, maps straight through *by_map*.
        3. Anything else is combined into a single XPath expression.
        """
        logger.debug(
            f'_get_by_and_value(): id={id}, class_name={class_name}, name={name}, '
            f'tag_name={tag_name}, text={text}, attrs={attributes}'
        )

        xpath_raw = attributes.get('xpath')
        if isinstance(xpath_raw, str) and xpath_raw:
            logger.debug(f'Explicit XPath provided; using raw expression: {xpath_raw}')
            return By.XPATH, xpath_raw

        candidates = (
            ('id', id),
            ('class_name', class_name),
            ('name', name),
            ('tag_name', tag_name),
        )
        provided = [(key, candidate) for key, candidate in candidates if candidate]

        is_simple = len(provided) == 1 and not text and not attributes
        if not is_simple:
            xpath = self._build_xpath(id, class_name, name, tag_name, text, **attributes)
            logger.debug(f'Complex selector resolved to XPath: {xpath}')
            return By.XPATH, xpath

        key, value = provided[0]
        by = by_map[key]
        logger.debug(f'Simple selector resolved: by={by}, value={value}')
        return by, value

    @staticmethod
    def _build_xpath(
        id: Optional[str] = None,
        class_name: Optional[str] = None,
        name: Optional[str] = None,
        tag_name: Optional[str] = None,
        text: Optional[str] = None,
        **attributes: str,
    ) -> str:
        """
        Combine several search criteria into one XPath expression.

        Thin wrapper that forwards every argument unchanged to
        ``SelectorParser.build_xpath``, which owns the actual string building.
        """
        return SelectorParser.build_xpath(
            id=id,
            class_name=class_name,
            name=name,
            tag_name=tag_name,
            text=text,
            **attributes,
        )

    @staticmethod
    def _get_expression_type(expression: str) -> By:
        """
        Classify a selector expression as XPath or CSS.

        Delegates to ``SelectorParser.get_expression_type``:
        - XPath: expression starts with ``./``, ``/`` or ``(/``
        - Anything else: CSS_SELECTOR
        """
        detected = SelectorParser.get_expression_type(expression)
        return detected

    async def _describe_node(self, object_id: str = '') -> Node:
        """
        Fetch the DOM node description for *object_id* via CDP DOM.describeNode.

        Returns the ``node`` payload of the response, or an empty dict when the
        response carries an ``error`` key (for instance when the object id does
        not reference a Node) or when the payload is missing.
        """
        describe_command = DomCommands.describe_node(object_id=object_id)
        response: DescribeNodeResponse = await self._execute_command(describe_command)
        if 'error' not in response:
            return response.get('result', {}).get('node', {})
        # Any describe error is reported as an empty node structure.
        return {}

    def _apply_iframe_context_to_element(
        self, element: WebElement, iframe_context: IFrameContext | None
    ) -> None:
        """
        Propagate iframe context to the newly created element.
        - If the element is also an iframe, configure session routing.
        - Otherwise, inject the iframe's own context.
        """
        if not iframe_context:
            return
        if getattr(element, 'is_iframe', False):
            routing_handler = iframe_context.session_handler or self._connection_handler
            element._routing_session_handler = routing_handler
            element._routing_session_id = iframe_context.session_id
            element._routing_parent_frame_id = iframe_context.frame_id
            return
        element._iframe_context = iframe_context

    def _resolve_routing(self) -> tuple[ConnectionHandler, Optional[str]]:
        """
        Resolve handler and sessionId for the current context (iframe routed or default).
        """
        iframe_context = getattr(self, '_iframe_context', None)
        if iframe_context and getattr(iframe_context, 'session_handler', None):
            return iframe_context.session_handler, getattr(iframe_context, 'session_id', None)
        routing_handler = getattr(self, '_routing_session_handler', None)
        if routing_handler is not None:
            return routing_handler, getattr(self, '_routing_session_id', None)
        return self._connection_handler, None

    async def _execute_command(
        self, command: Command[T_CommandParams, T_CommandResponse]
    ) -> T_CommandResponse:
        """Execute CDP command via resolved handler (60s timeout)."""
        handler, session_id = self._resolve_routing()
        if session_id:
            command['sessionId'] = session_id
        return await handler.execute_command(command, timeout=60)

    def _get_find_element_command(
        self,
        by: By,
        value: str,
        object_id: str = '',
        execution_context_id: Optional[int] = None,
    ):
        """
        Create CDP command for finding single element.

        Handles special cases for different selector types and contexts:
        - CLASS_NAME/ID: converts to CSS selector
        - Relative searches: uses different scripts for context element
        - XPath: requires special handling
        - NAME: converts to XPath expression
        """
        escaped_value = value.replace('"', '\\"')
        command: Union[
            Command[CallFunctionOnParams, CallFunctionOnResponse],
            Command[EvaluateParams, EvaluateResponse],
        ]
        match by:
            case By.CLASS_NAME:
                selector = f'.{escaped_value}'
            case By.ID:
                selector = f'#{escaped_value}'
            case _:
                selector = escaped_value
        if object_id and not by == By.XPATH:
            script = Scripts.RELATIVE_QUERY_SELECTOR.replace('{selector}', selector)
            command = RuntimeCommands.call_function_on(
                function_declaration=script,
                object_id=object_id,
                return_by_value=False,
            )
        elif by == By.XPATH:
            command = self._get_find_element_by_xpath_command(
                value, object_id=object_id, execution_context_id=execution_context_id
            )
        elif by == By.NAME:
            command = self._get_find_element_by_xpath_command(
                f'//*[@name="{escaped_value}"]',
                object_id=object_id,
                execution_context_id=execution_context_id,
            )
        else:
            command = RuntimeCommands.evaluate(
                expression=Scripts.QUERY_SELECTOR.replace('{selector}', selector),
                context_id=execution_context_id,
            )
        return command

    def _get_find_elements_command(
        self,
        by: By,
        value: str,
        object_id: str = '',
        execution_context_id: Optional[int] = None,
    ):
        """
        Create CDP command for finding multiple elements.

        Similar to _get_find_element_command but for multiple element searches.
        Handles same special cases and selector type conversions.
        """
        escaped_value = value.replace('"', '\\"')
        command: Union[
            Command[CallFunctionOnParams, CallFunctionOnResponse],
            Command[EvaluateParams, EvaluateResponse],
        ]
        match by:
            case By.CLASS_NAME:
                selector = f'.{escaped_value}'
            case By.ID:
                selector = f'#{escaped_value}'
            case _:
                selector = escaped_value
        if object_id and not by == By.XPATH:
            script = Scripts.RELATIVE_QUERY_SELECTOR_ALL.replace('{selector}', selector)
            command = RuntimeCommands.call_function_on(
                function_declaration=script,
                object_id=object_id,
                return_by_value=False,
            )
        elif by == By.XPATH:
            command = self._get_find_elements_by_xpath_command(
                value, object_id=object_id, execution_context_id=execution_context_id
            )
        else:
            command = RuntimeCommands.evaluate(
                expression=Scripts.QUERY_SELECTOR_ALL.replace('{selector}', selector),
                context_id=execution_context_id,
            )
        return command

    def _get_find_element_by_xpath_command(
        self,
        xpath: str,
        object_id: str,
        execution_context_id: Optional[int] = None,
    ):
        """
        Build the CDP command that finds a single element by XPath.

        Double quotes in *xpath* are backslash-escaped before the expression is
        substituted into the script template. Without *object_id* the script is
        evaluated in *execution_context_id*; with it, the expression is made
        relative and the script is called on that object.
        """
        quoted_xpath = xpath.replace('"', '\\"')

        if not object_id:
            return RuntimeCommands.evaluate(
                expression=Scripts.FIND_XPATH_ELEMENT.replace('{escaped_value}', quoted_xpath),
                context_id=execution_context_id,
            )

        relative_xpath = self._ensure_relative_xpath(quoted_xpath)
        return RuntimeCommands.call_function_on(
            function_declaration=Scripts.FIND_RELATIVE_XPATH_ELEMENT.replace(
                '{escaped_value}', relative_xpath
            ),
            object_id=object_id,
            return_by_value=False,
        )

    def _get_find_elements_by_xpath_command(
        self,
        xpath: str,
        object_id: str,
        execution_context_id: Optional[int] = None,
    ):
        """
        Build the CDP command that finds all elements matching an XPath.

        Double quotes in *xpath* are backslash-escaped before the expression is
        substituted into the script template. Without *object_id* the script is
        evaluated in *execution_context_id*; with it, the expression is made
        relative and the script is called on that object.
        """
        quoted_xpath = xpath.replace('"', '\\"')

        if not object_id:
            return RuntimeCommands.evaluate(
                expression=Scripts.FIND_XPATH_ELEMENTS.replace('{escaped_value}', quoted_xpath),
                context_id=execution_context_id,
            )

        relative_xpath = self._ensure_relative_xpath(quoted_xpath)
        return RuntimeCommands.call_function_on(
            function_declaration=Scripts.FIND_RELATIVE_XPATH_ELEMENTS.replace(
                '{escaped_value}', relative_xpath
            ),
            object_id=object_id,
            return_by_value=False,
        )

    @staticmethod
    def _ensure_relative_xpath(xpath: str) -> str:
        """
        Return *xpath* in a form usable for context-based (relative) searches.

        Thin wrapper around ``SelectorParser.ensure_relative_xpath``, which
        performs the actual rewrite.
        """
        relative_xpath = SelectorParser.ensure_relative_xpath(xpath)
        return relative_xpath

    @staticmethod
    def _has_object_id_key(response: Union[EvaluateResponse, CallFunctionOnResponse]) -> bool:
        """
        Check if response has objectId key.
        """
        return bool(response.get('result', {}).get('result', {}).get('objectId'))


================================================
FILE: pydoll/elements/shadow_root.py
================================================
from __future__ import annotations

import logging
from typing import TYPE_CHECKING

from pydoll.commands import DomCommands
from pydoll.connection import ConnectionHandler
from pydoll.elements.mixins import FindElementsMixin
from pydoll.protocol.dom.types import ShadowRootType

if TYPE_CHECKING:
    from pydoll.elements.web_element import WebElement
    from pydoll.protocol.dom.methods import GetOuterHTMLResponse

logger = logging.getLogger(__name__)


class ShadowRoot(FindElementsMixin):
    """
    Wrapper around a shadow root node for traversing shadow DOM.

    Element lookup inside the shadow boundary is done with query() and CSS
    selectors. Use query() instead of find() — find() and XPath are not
    supported inside shadow roots.

    Usage:
        shadow_host = await tab.find(id='my-component')
        shadow_root = await shadow_host.get_shadow_root()
        button = await shadow_root.query('#internal-button')
        await button.click()
    """

    _css_only = True

    def __init__(
        self,
        object_id: str,
        connection_handler: ConnectionHandler,
        mode: ShadowRootType = ShadowRootType.OPEN,
        host_element: WebElement | None = None,
    ):
        """
        Create the wrapper and inherit routing state from the host element.

        Args:
            object_id: CDP object ID for the shadow root node.
            connection_handler: Browser connection for CDP commands.
            mode: Shadow root mode (open, closed, or user-agent).
            host_element: Reference to the shadow host element.
        """
        self._object_id = object_id
        self._connection_handler = connection_handler
        self._mode = mode
        self._host_element = host_element

        # Copy the host's iframe/routing context when a host is given; each
        # attribute defaults to None if the host does not define it.
        if host_element:
            for inherited_attr in (
                '_iframe_context',
                '_routing_session_handler',
                '_routing_session_id',
                '_routing_parent_frame_id',
            ):
                setattr(self, inherited_attr, getattr(host_element, inherited_attr, None))

        logger.debug(
            f'ShadowRoot initialized: object_id={self._object_id}, mode={self._mode.value}'
        )

    @property
    def mode(self) -> ShadowRootType:
        """Mode of this shadow root (open, closed, or user-agent)."""
        return self._mode

    @property
    def host_element(self) -> WebElement | None:
        """The shadow host element, or None when it was not provided."""
        return self._host_element

    @property
    async def inner_html(self) -> str:
        """HTML of the shadow root, read via DOM.getOuterHTML on its object id."""
        outer_html_command = DomCommands.get_outer_html(object_id=self._object_id)
        response: GetOuterHTMLResponse = await self._execute_command(outer_html_command)
        return response['result']['outerHTML']

    def __repr__(self) -> str:
        return f'ShadowRoot(mode={self._mode.value}, object_id={self._object_id})'

    def __str__(self) -> str:
        return f'ShadowRoot({self._mode.value})'


================================================
FILE: pydoll/elements/utils/__init__.py
================================================
from pydoll.elements.utils.selector_parser import SelectorParser

__all__ = ['SelectorParser']


================================================
FILE: pydoll/elements/utils/selector_parser.py
================================================
"""
Selector parsing and building utilities for element finding.

Centralises all logic that inspects, builds, or transforms CSS and XPath
selector strings. This keeps the mixin layer focused on orchestration
(finding elements, managing timeouts, issuing CDP commands) while the
pure string-manipulation lives here.
"""

from __future__ import annotations

import logging
import re
from typing import Optional

from pydoll.constants import By, Scripts
from pydoll.utils import normalize_synthetic_xpath

logger = logging.getLogger(__name__)

# ---------------------------------------------------------------------------
# Compiled patterns
# ---------------------------------------------------------------------------

# Matches, case-insensitively and anchored at the start of the string, an
# optional ``axis::`` prefix followed by ``iframe`` that is immediately followed
# by ``[`` or the end of the string.
_IFRAME_XPATH_NODE_RE = re.compile(r'^(?:\w+::)?iframe(?:\[|$)', re.IGNORECASE)
# Matches the standalone word ``iframe`` anywhere in a string (case-insensitive).
# NOTE(review): the name suggests it is applied to grouped/parenthesised XPath
# expressions — confirm at the call site.
_IFRAME_XPATH_GROUPED_RE = re.compile(r'\biframe\b', re.IGNORECASE)
# Captures a leading identifier: one ASCII letter followed by letters, digits
# or hyphens. Presumably the tag name at the start of a CSS selector — verify
# against the caller.
_CSS_TAG_NAME_RE = re.compile(r'^([a-zA-Z][a-zA-Z0-9-]*)')
# ``(prefix, len(prefix))`` pairs. Each prefix is listed before any shorter
# prefix it starts with (``.//`` before ``./``, ``//`` before ``/``).
# NOTE(review): presumably scanned in order so the longest prefix wins — confirm.
_XPATH_PREFIXES: list[tuple[str, int]] = [('.//', 3), ('//', 2), ('./', 2), ('/', 1)]

# Lookup tables for the nesting-depth tracker
# Quote characters mapped to an ``(int, bool)`` pair: 0 for the single quote,
# 1 for the double quote. NOTE(review): the meaning of both fields is defined
# by the consumer of this table — confirm there.
_QUOTE_TRANSITIONS: dict[str, tuple[int, bool]] = {"'": (0, True), '"': (1, True)}
# Bracket characters mapped to ``(int, delta)``: square brackets use 0 and
# parentheses use 1 as the first field; opening characters carry +1 and closing
# characters -1. NOTE(review): first field looks like a counter index — confirm.
_DEPTH_TRANSITIONS: dict[str, tuple[int, int]] = {
    '[': (0, 1),
    ']': (0, -1),
    '(': (1, 1),
    ')': (1, -1),
}


class SelectorParser:
    """
    Stateless helper that parses, builds and classifies CSS / XPath selectors.

    Every method is a ``@staticmethod`` — the class is used purely as a
    namespace to keep the parsing surface area together. ``FindElementsMixin``
    delegates all selector string work here.
    """

    # ------------------------------------------------------------------
    # Expression type detection
    # ------------------------------------------------------------------

    @staticmethod
    def get_expression_type(expression: str) -> By:
        """
        Classify a selector string as XPath or CSS from its leading characters.

        An expression beginning with ``./``, ``/`` or ``(/`` is reported as
        ``By.XPATH``; every other expression falls back to
        ``By.CSS_SELECTOR``.
        """
        xpath_markers = ('./', '/', '(/')
        looks_like_xpath = expression.startswith(xpath_markers)
        return By.XPATH if looks_like_xpath else By.CSS_SELECTOR

    # ------------------------------------------------------------------
    # XPath building from keyword criteria
    # ------------------------------------------------------------------

    @staticmethod
    def build_xpath(
        id: Optional[str] = None,
        class_name: Optional[str] = None,
        name: Optional[str] = None,
        tag_name: Optional[str] = None,
        text: Optional[str] = None,
        **attributes: str,
    ) -> str:
        """
        Build XPath expression from multiple attribute criteria.

        Constructs complex XPath combining multiple conditions with ``and``
        operators. Handles class names correctly for space-separated class
        lists. Uses ``contains()`` for text matching (partial text support).

        Note:
            Attribute names with underscores are automatically converted to
            hyphens to match HTML attribute naming conventions
            (e.g. ``data_test`` -> ``data-test``).
        """
        xpath_conditions: list[str] = []
        base_xpath = f'//{tag_name}' if tag_name else '//*'
        if id:
            xpath_conditions.append(f'@id="{id}"')
        if class_name:
            xpath_conditions.append(
                f'contains(concat(" ", normalize-space(@class), " "), " {class_name} ")'
            )
        if name:
            xpath_conditions.append(f'@name="{name}"')
        if text:
            xpath_conditions.append(f'contains(text(), "{text}")')
        for attribute, value in attributes.items():
            html_attribute = attribute.replace('_', '-')
            xpath_conditions.append(f'@{html_attribute}="{value}"')

        xpath = (
            f'{base_xpath}[{" and ".join(xpath_conditions)}]' if xpath_conditions else base_xpath
        )
        logger.debug(f'build_xpath() -> {xpath}')
        return xpath

    # ------------------------------------------------------------------
    # XPath helpers
    # ------------------------------------------------------------------

    @staticmethod
    def ensure_relative_xpath(xpath: str) -> str:
        """
        Ensure XPath is relative by prepending dot if needed.

        Converts absolute XPath to relative for context-based searches.
        """
        return f'.{xpath}' if not xpath.startswith('.') else xpath

    # ------------------------------------------------------------------
    # JS text-expression builder
    # ------------------------------------------------------------------

    @staticmethod
    def build_text_expression(selector: str, method: str) -> Optional[str]:
        """
        Fill one of the ``Scripts`` text-extraction templates for a selector.

        Args:
            selector: Selector value; converted with ``str()`` before use.
            method: Lookup method name, compared case-insensitively. A falsy
                value is treated as an empty string.

        Returns:
            ``Scripts.GET_TEXT_BY_XPATH`` with ``{escaped_value}`` replaced
            when *method* contains ``xpath`` or equals ``name``; otherwise
            ``Scripts.GET_TEXT_BY_CSS`` with ``{selector}`` replaced. The
            CSS selector is prefixed with ``#`` for ``id`` and ``.`` for
            ``class_name``; every other method uses the value as-is.
        """
        selector_text = str(selector)
        method_key = method.lower() if method else ''

        if 'xpath' in method_key:
            xpath_for_js = normalize_synthetic_xpath(selector_text).replace('"', '\\"')
            return Scripts.GET_TEXT_BY_XPATH.replace('{escaped_value}', xpath_for_js)

        if method_key == 'name':
            name_for_js = selector_text.replace('"', '\\"')
            # NOTE(review): the quotes delimiting the attribute value are
            # inserted unescaped here, unlike the xpath branch above --
            # confirm the script template tolerates that.
            return Scripts.GET_TEXT_BY_XPATH.replace(
                '{escaped_value}', f'//*[@name="{name_for_js}"]'
            )

        # Backslashes are doubled before quotes are escaped so the escaping
        # backslash added for a quote is not doubled again.
        css_body = selector_text.replace('\\', '\\\\').replace('"', '\\"')
        css_prefix = {'id': '#', 'class_name': '.'}.get(method_key, '')
        return Scripts.GET_TEXT_BY_CSS.replace('{selector}', css_prefix + css_body)

    # ------------------------------------------------------------------
    # Iframe-crossing: XPath
    # ------------------------------------------------------------------

    @staticmethod
    def parse_iframe_segments_xpath(expression: str) -> list[tuple[By, str]]:
        """
        Cut an XPath expression into per-document segments at iframe steps.

        The expression is tokenised into steps (``/`` and ``//`` separators,
        ignoring slashes inside quotes, brackets and parentheses). Every step
        recognised as an ``iframe`` step that is not the last step becomes a
        split point; the pieces are then reassembled by
        ``_build_xpath_segments``.

        Args:
            expression: Raw XPath expression.

        Returns:
            List of ``(By.XPATH, segment)`` tuples. The original expression
            is returned as the only segment when it yields no steps or has
            no iframe step before the last one.
        """
        steps = SelectorParser._tokenize_xpath_steps(expression)
        if not steps:
            return [(By.XPATH, expression)]

        last_position = len(steps) - 1
        split_points: list[int] = []
        for position, (_separator, text) in enumerate(steps):
            # A trailing iframe step is the search target itself, not a boundary.
            if SelectorParser._is_iframe_xpath_step(text) and position < last_position:
                split_points.append(position)

        if split_points:
            return SelectorParser._build_xpath_segments(steps, split_points)
        return [(By.XPATH, expression)]

    # ------------------------------------------------------------------
    # Iframe-crossing: CSS
    # ------------------------------------------------------------------

    @staticmethod
    def parse_iframe_segments_css(expression: str) -> list[tuple[By, str]]:
        """
        Cut a CSS selector into per-document segments at iframe compounds.

        The selector is tokenised into compound selectors separated by
        combinators (space, ``>``, ``+``, ``~``), ignoring combinator
        characters inside quotes, brackets and parentheses. Every compound
        whose tag name is ``iframe`` and that is not the last compound
        becomes a split point; the pieces are then reassembled by
        ``_build_css_segments``.

        Args:
            expression: Raw CSS selector.

        Returns:
            List of ``(By.CSS_SELECTOR, segment)`` tuples. The original
            selector is returned as the only segment when it yields no
            compounds or has no iframe compound before the last one.
        """
        compounds = SelectorParser._tokenize_css_compounds(expression)
        if not compounds:
            return [(By.CSS_SELECTOR, expression)]

        last_position = len(compounds) - 1
        split_points: list[int] = []
        for position, (text, _combinator) in enumerate(compounds):
            # A trailing iframe compound is the search target itself, not a boundary.
            if SelectorParser._is_iframe_css_compound(text) and position < last_position:
                split_points.append(position)

        if split_points:
            return SelectorParser._build_css_segments(compounds, split_points)
        return [(By.CSS_SELECTOR, expression)]

    # ==================================================================
    # Private helpers
    # ==================================================================

    @staticmethod
    def _is_at_nesting_depth_zero(
        char: str,
        quote_state: list[bool],
        depth_state: list[int],
    ) -> bool:
        """
        Track quote/bracket/paren nesting and return whether char is at
        depth 0.  Mutates *quote_state* and *depth_state* in place.
        """
        if quote_state[0] or quote_state[1]:
            if quote_state[0]:
                quote_state[0] = char != "'"
            else:
                quote_state[1] = char != '"'
            return False

        if char in _QUOTE_TRANSITIONS:
            index, value = _QUOTE_TRANSITIONS[char]
            quote_state[index] = value
            return False

        if char in _DEPTH_TRANSITIONS:
            index, delta = _DEPTH_TRANSITIONS[char]
            depth_state[index] += delta
            return False

        return depth_state[0] == 0 and depth_state[1] == 0

    # -- XPath tokenizer -----------------------------------------------

    @staticmethod
    def _detect_xpath_leading_separator(expression: str) -> tuple[str, int]:
        """Return ``(separator, start_index)`` for the XPath prefix."""
        if expression.startswith('('):
            return '', 0
        for prefix, length in _XPATH_PREFIXES:
            if expression.startswith(prefix):
                return prefix, length
        return '', 0

    @staticmethod
    def _tokenize_xpath_steps(expression: str) -> list[tuple[str, str]]:
        """Tokenize XPath into ``(separator, step_text)`` pairs."""
        xpath_steps: list[tuple[str, str]] = []
        current_separator, token_start = SelectorParser._detect_xpath_leading_separator(expression)
        char_index = token_start
        quote_state = [False, False]
        depth_state = [0, 0]

        while char_index < len(expression):
            char = expression[char_index]
            at_depth_zero = SelectorParser._is_at_nesting_depth_zero(char, quote_state, depth_state)

            if at_depth_zero and char == '/':
                step_text = expression[token_start:char_index]
                if step_text:
                    xpath_steps.append((current_separator, step_text))
                is_double_slash = (
                    char_index + 1 < len(expression) and expression[char_index + 1] == '/'
                )
                current_separator = '//' if is_double_slash else '/'
                char_index += 2 if is_double_slash else 1
                token_start = char_index
                continue
            char_index += 1

        remaining_text = expression[token_start:]
        if remaining_text:
            xpath_steps.append((current_separator, remaining_text))

        return xpath_steps

    @staticmethod
    def _is_iframe_xpath_step(step_text: str) -> bool:
        """Return whether a single XPath step's node test is ``iframe``."""
        if step_text.startswith('('):
            return bool(_IFRAME_XPATH_GROUPED_RE.search(step_text))
        return bool(_IFRAME_XPATH_NODE_RE.match(step_text))

    @staticmethod
    def _build_xpath_segments(
        xpath_steps: list[tuple[str, str]],
        iframe_split_indices: list[int],
    ) -> list[tuple[By, str]]:
        """
        Reassemble XPath steps into segments split at iframe indices.

        Each split index closes a segment that ends with that step. The very
        first segment keeps the separators exactly as tokenised; every
        segment that starts after a split, and the trailing remainder, has
        its first step prefixed with ``//`` regardless of the original
        separator.

        Args:
            xpath_steps: ``(separator, step_text)`` pairs.
            iframe_split_indices: Indices into *xpath_steps* that end a segment.

        Returns:
            List of ``(By.XPATH, segment)`` tuples in document order.
        """

        def render(first: int, stop: int, force_descendant: bool) -> str:
            """Join steps ``first..stop-1``, optionally forcing ``//`` on the first."""
            pieces: list[str] = []
            for position in range(first, stop):
                separator, text = xpath_steps[position]
                if force_descendant and position == first:
                    separator = '//'
                pieces.append(separator + text)
            return ''.join(pieces)

        result: list[tuple[By, str]] = []
        cursor = 0
        for boundary in iframe_split_indices:
            result.append((By.XPATH, render(cursor, boundary + 1, cursor != 0)))
            cursor = boundary + 1

        step_count = len(xpath_steps)
        if cursor < step_count:
            # Remainder after the last split: always searched with ``//``.
            result.append((By.XPATH, render(cursor, step_count, True)))

        return result

    # -- CSS tokenizer --------------------------------------------------

    @staticmethod
    def _tokenize_css_compounds(expression: str) -> list[tuple[str, str | None]]:
        """Tokenize CSS selector into ``(compound_text, combinator_after)`` pairs."""
        css_compounds: list[tuple[str, str | None]] = []
        token_start = 0
        char_index = 0
        quote_state = [False, False]
        depth_state = [0, 0]

        while char_index < len(expression):
            char = expression[char_index]
            at_depth_zero = SelectorParser._is_at_nesting_depth_zero(char, quote_state, depth_state)

            if at_depth_zero and char in ' >+~':
                compound_text = expression[token_start:char_index]
                if not compound_text.strip():
                    char_index += 1
                    continue
                combinator, char_index = SelectorParser._consume_css_combinator(
                    expression, char_index
                )
                css_compounds.append((compound_text, combinator))
                token_start = char_index
                continue
            char_index += 1

        remaining_text = expression[token_start:].strip()
        if remaining_text:
            css_compounds.append((remaining_text, None))

        return css_compounds

    @staticmethod
    def _consume_css_combinator(expression: str, start: int) -> tuple[str, int]:
        """Consume a CSS combinator region and return ``(combinator, next_index)``."""
        char_index = start
        while char_index < len(expression) and expression[char_index] == ' ':
            char_index += 1
        if char_index < len(expression) and expression[char_index] in '>+~':
            combinator = expression[char_index]
            char_index += 1
            while char_index < len(expression) and expression[char_index] == ' ':
                char_index += 1
        else:
            combinator = ' '
        return combinator, char_index

    @staticmethod
    def _is_iframe_css_compound(compound_text: str) -> bool:
        """Return whether a CSS compound selector's tag name is ``iframe``."""
        stripped = compound_text.strip()
        if stripped and stripped[0] in '.#[:':
            return False
        match = _CSS_TAG_NAME_RE.match(stripped)
        if not match:
            return False
        return match.group(1).lower() == 'iframe'

    @staticmethod
    def _format_css_combinator(combinator: str) -> str:
        """Format a CSS combinator for human-readable output."""
        if combinator == ' ':
            return ' '
        return f' {combinator} '

    @staticmethod
    def _build_css_segments(
        css_compounds: list[tuple[str, str | None]],
        iframe_split_indices: list[int],
    ) -> list[tuple[By, str]]:
        """
        Reassemble CSS compounds into segments split at iframe indices.

        Each split index closes a segment that ends with that compound.
        Inside a segment, neighbouring compounds are joined with the
        combinator recorded after the earlier one (a space when it is
        missing). The combinator that followed a split compound is dropped.

        Args:
            css_compounds: ``(compound_text, combinator_after)`` pairs.
            iframe_split_indices: Indices into *css_compounds* that end a segment.

        Returns:
            List of ``(By.CSS_SELECTOR, segment)`` tuples in document order.
        """

        def render(first: int, stop: int) -> str:
            """Join compounds ``first..stop-1`` with their recorded combinators."""
            pieces: list[str] = []
            for position in range(first, stop):
                if position > first:
                    joiner = css_compounds[position - 1][1] or ' '
                    pieces.append(SelectorParser._format_css_combinator(joiner))
                pieces.append(css_compounds[position][0])
            return ''.join(pieces)

        result: list[tuple[By, str]] = []
        cursor = 0
        for boundary in iframe_split_indices:
            result.append((By.CSS_SELECTOR, render(cursor, boundary + 1)))
            cursor = boundary + 1

        compound_count = len(css_compounds)
        if cursor < compound_count:
            result.append((By.CSS_SELECTOR, render(cursor, compound_count)))

        return result


================================================
FILE: pydoll/elements/web_element.py
================================================
from __future__ import annotations

import asyncio
import json
import logging
import warnings
from pathlib import Path
from typing import TYPE_CHECKING, Optional

import aiofiles

from pydoll.commands import (
    DomCommands,
    InputCommands,
    PageCommands,
    RuntimeCommands,
)
from pydoll.connection import ConnectionHandler
from pydoll.constants import (
    Key,
    Scripts,
)
from pydoll.elements.mixins import FindElementsMixin
from pydoll.elements.shadow_root import ShadowRoot
from pydoll.exceptions import (
    ElementNotAFileInput,
    ElementNotFound,
    ElementNotInteractable,
    ElementNotVisible,
    InvalidFileExtension,
    InvalidIFrame,
    MissingScreenshotPath,
    ShadowRootNotFound,
    WaitElementTimeout,
)
from pydoll.interactions.iframe import IFrameContext, IFrameContextResolver
from pydoll.interactions.keyboard import Keyboard
from pydoll.protocol.dom.types import ShadowRootType
from pydoll.protocol.input.types import (
    KeyEventType,
    KeyModifier,
    MouseButton,
    MouseEventType,
)
from pydoll.protocol.page.types import ScreenshotFormat, Viewport
from pydoll.protocol.runtime.methods import (
    CallFunctionOnResponse,
    EvaluateResponse,
    GetPropertiesResponse,
    SerializationOptions,
)
from pydoll.protocol.runtime.types import CallArgument
from pydoll.utils import (
    decode_base64_to_bytes,
    extract_text_from_html,
    is_script_already_function,
)

if TYPE_CHECKING:
    from pydoll.interactions.mouse import Mouse as MouseType
    from pydoll.protocol.dom.methods import (
        DescribeNodeResponse,
        GetBoxModelResponse,
        GetOuterHTMLResponse,
        ResolveNodeResponse,
    )
    from pydoll.protocol.dom.types import Quad
    from pydoll.protocol.page.methods import CaptureScreenshotResponse
    from pydoll.protocol.runtime.methods import GetPropertiesResponse

logger = logging.getLogger(__name__)


class WebElement(FindElementsMixin):  # noqa: PLR0904
    """
    DOM element wrapper for browser automation.

    Provides comprehensive functionality for element interaction, inspection,
    and manipulation using Chrome DevTools Protocol commands.
    """

    if TYPE_CHECKING:
        _routing_session_handler: Optional[ConnectionHandler]
        _routing_session_id: Optional[str]
        _routing_parent_frame_id: Optional[str]

    def __init__(
        self,
        object_id: str,
        connection_handler: ConnectionHandler,
        method: Optional[str] = None,
        selector: Optional[str] = None,
        attributes_list: Optional[list[str]] = None,
        mouse: Optional['MouseType'] = None,
    ):
        """
        Initialize WebElement wrapper.

        Args:
            object_id: Unique CDP object identifier for this DOM element.
            connection_handler: Connection instance for browser communication.
            method: Search method used to find this element (for debugging).
            selector: Selector string used to find this element (for debugging).
            attributes_list: Flat list of alternating attribute names and values.
                ``None`` (the default) is treated as an empty list; a fresh
                list is created per instance so no default object is shared
                between elements.
            mouse: Optional Mouse instance for humanized click behavior.

        Note:
            Mouse and Keyboard follow different ownership strategies. Mouse is a shared
            instance from Tab, passed down to elements to preserve cursor position state
            across interactions. It dispatches commands through Tab._execute_command, which
            means it has no iframe context awareness. Keyboard is created per-element and
            routes commands through the element's own _execute_command, correctly handling
            iframe routing. For iframe elements, the mouse is intentionally skipped during
            humanized clicks (see click()) to avoid dispatching events to the wrong frame.
        """
        self._object_id = object_id
        self._search_method = method
        self._selector = selector
        self._connection_handler = connection_handler
        self._attributes: dict[str, str] = {}
        # Keyboard and iframe resolver are created lazily on first use.
        self._keyboard: Optional[Keyboard] = None
        self._mouse = mouse
        self._iframe_context: Optional[IFrameContext] = None
        self._iframe_resolver: Optional[IFrameContextResolver] = None
        self._def_attributes([] if attributes_list is None else attributes_list)
        logger.debug(
            f'WebElement initialized: object_id={self._object_id}, '
            f'method={self._search_method}, selector={self._selector}, '
            f'attributes={len(self._attributes)}'
        )

    def _get_keyboard(self) -> Keyboard:
        """Return this element's keyboard controller, creating it on first use."""
        keyboard = self._keyboard
        if keyboard is None:
            keyboard = Keyboard(self)
            self._keyboard = keyboard
        return keyboard

    def _get_iframe_resolver(self) -> IFrameContextResolver:
        """Return this element's iframe context resolver, creating it on first use."""
        resolver = self._iframe_resolver
        if resolver is None:
            resolver = IFrameContextResolver(self)
            self._iframe_resolver = resolver
        return resolver

    @property
    def attributes(self) -> dict[str, str]:
        """Return a new dict copied from the cached attributes on every access."""
        snapshot = dict(self._attributes)
        return snapshot

    @property
    def value(self) -> Optional[str]:
        """Cached ``value`` attribute of the element, or ``None`` when absent."""
        cached = self._attributes
        return cached.get('value')

    @property
    def class_name(self) -> Optional[str]:
        """Cached ``class_name`` entry of the element, or ``None`` when absent."""
        cached = self._attributes
        return cached.get('class_name')

    @property
    def id(self) -> Optional[str]:
        """Cached ``id`` attribute of the element, or ``None`` when absent."""
        cached = self._attributes
        return cached.get('id')

    @property
    def tag_name(self) -> Optional[str]:
        """Cached ``tag_name`` entry of the element, or ``None`` when absent."""
        cached = self._attributes
        return cached.get('tag_name')

    @property
    def is_iframe(self) -> bool:
        """Whether the cached tag name is exactly ``iframe`` or ``frame``."""
        tag = self.tag_name
        return tag == 'iframe' or tag == 'frame'

    @property
    def is_enabled(self) -> bool:
        """Whether the cached attributes contain no ``disabled`` entry."""
        return 'disabled' not in self._attributes

    @property
    async def text(self) -> str:
        """
        Text content of the element.

        Elements inside an iframe are read by running a script that returns
        the trimmed ``textContent``. All other elements have their text
        extracted from the markup returned by ``inner_html`` via
        ``extract_text_from_html(..., strip=True)``.
        """
        if not self._is_inside_iframe():
            markup = await self.inner_html
            extracted = extract_text_from_html(markup, strip=True)
            logger.debug(f'Extracted text length: {len(extracted)}')
            return extracted

        script_result: CallFunctionOnResponse = await self.execute_script(
            'return (this.textContent || "").trim()', return_by_value=True
        )
        payload = script_result.get('result', {}).get('result', {})
        # A missing or null value collapses to an empty string.
        iframe_text = payload.get('value', '') or ''
        logger.debug(f'Extracted text length (iframe ctx): {len(iframe_text)}')
        return iframe_text

    @property
    async def bounds(self) -> Quad:
        """
        Element's bounding box coordinates.

        Issues ``DomCommands.get_box_model`` for this element and returns the
        ``content`` entry of the resulting box model.
        """
        box_model: GetBoxModelResponse = await self._execute_command(
            DomCommands.get_box_model(object_id=self._object_id)
        )
        content_quad = box_model['result']['model']['content']
        logger.debug(f'Bounds retrieved (points={len(content_quad)})')
        return content_quad

    @property
    async def inner_html(self) -> str:
        """
        HTML markup for this element.

        Iframe elements delegate to ``_get_iframe_inner_html``. For every
        other element the value returned is the element's *outer* HTML
        (despite the property name): read through a script when the element
        lives inside an iframe, and through ``DomCommands.get_outer_html``
        otherwise.
        """
        if self.is_iframe:
            return await self._get_iframe_inner_html()

        if not self._is_inside_iframe():
            outer_html_response: GetOuterHTMLResponse = await self._execute_command(
                DomCommands.get_outer_html(object_id=self._object_id)
            )
            return outer_html_response['result']['outerHTML']

        script_result: CallFunctionOnResponse = await self.execute_script(
            'return this.outerHTML', return_by_value=True
        )
        payload = script_result.get('result', {}).get('result', {})
        return payload.get('value', '')

    @property
    async def iframe_context(self) -> Optional[IFrameContext]:
        """
        Resolve and return the iframe context when this element is an iframe.

        The context is resolved again on every access instead of reusing the
        stored one. The result is saved on the element and
        ``_apply_routing_from_context`` is called before it is returned.

        Returns:
            IFrameContext | None: Freshly resolved context, or ``None`` when
            the element is not an iframe.
        """
        if self.is_iframe:
            self._iframe_context = await self._get_iframe_resolver().resolve()
            self._apply_routing_from_context()
            return self._iframe_context
        return None

    def get_attribute(self, name: str) -> Optional[str]:
        """
        Look up an attribute in the element's cached attributes.

        A request for ``class`` is answered from the ``class_name`` entry
        when that entry exists.

        Note:
            Only provides attributes available when element was located.
            For dynamic attributes, consider using JavaScript execution.
        """
        cached = self._attributes
        lookup_key = 'class_name' if name == 'class' and 'class_name' in cached else name
        return cached.get(lookup_key)

    async def get_bounds_using_js(self) -> dict[str, int]:
        """
        Get element bounds by running ``Scripts.BOUNDS`` on the element.

        The script's return value is a JSON string, which is decoded and
        returned as a dict (alternative to the ``bounds`` property).
        """
        script_result = await self.execute_script(Scripts.BOUNDS, return_by_value=True)
        serialized = script_result['result']['result']['value']
        bounds = json.loads(serialized)
        logger.debug(f'Bounds via JS: {bounds}')
        return bounds

    async def get_parent_element(self) -> WebElement:
        """
        Return the parent of this element as a new ``WebElement``.

        The parent shares this element's connection handler and mouse.

        Raises:
            ElementNotFound: If the parent lookup script yields no object id.
        """
        logger.debug(f'Getting parent element for object_id={self._object_id}')
        script_result = await self.execute_script(Scripts.GET_PARENT_NODE)
        if not self._has_object_id_key(script_result):
            raise ElementNotFound(f'Parent element not found for element: {self}')

        parent_object_id = script_result['result']['result']['objectId']
        parent_attributes = await self._get_object_attributes(object_id=parent_object_id)
        logger.debug(f'Parent element resolved: object_id={parent_object_id}')
        return WebElement(
            parent_object_id,
            self._connection_handler,
            attributes_list=parent_attributes,
            mouse=self._mouse,
        )

    async def get_shadow_root(self, timeout: float = 0) -> ShadowRoot:
        """
        Get the shadow root attached to this element.

        Args:
            timeout: Maximum seconds to wait for the shadow root to appear.
                A falsy value means a single attempt. Otherwise the lookup
                is retried every 0.5s until it succeeds or the elapsed time
                exceeds the timeout.

        Returns:
            ShadowRoot instance for traversing the shadow DOM.

        Raises:
            ShadowRootNotFound: If no shadow root is attached (when timeout=0).
            WaitElementTimeout: If timeout > 0 and no shadow root appears
                within the specified duration.
        """
        if not timeout:
            return await self._get_shadow_root()

        def clock() -> float:
            """Read the event loop's clock."""
            return asyncio.get_event_loop().time()

        started_at = clock()
        while True:
            try:
                return await self._get_shadow_root()
            except ShadowRootNotFound:
                pass

            elapsed = clock() - started_at
            if elapsed > timeout:
                raise WaitElementTimeout(
                    f'Timed out after {timeout}s waiting for shadow root on element'
                )

            await asyncio.sleep(0.5)

    async def _get_shadow_root(self) -> ShadowRoot:
        """
        Get the shadow root attached to this element (single attempt).

        Describes the node with ``pierce=True``, takes the first entry of
        its ``shadowRoots`` list, and resolves that entry's backend node id
        into an object id. The mode defaults to ``open`` when the entry
        carries no ``shadowRootType``.

        Raises:
            ShadowRootNotFound: If the node reports no shadow roots, or the
                first shadow root has no backend node id.
        """
        describe_response: DescribeNodeResponse = await self._execute_command(
            DomCommands.describe_node(object_id=self._object_id, depth=1, pierce=True)
        )
        described_node = describe_response.get('result', {}).get('node', {})
        shadow_roots = described_node.get('shadowRoots', [])
        if not shadow_roots:
            raise ShadowRootNotFound()

        first_root = shadow_roots[0]
        backend_node_id = first_root.get('backendNodeId')
        if not backend_node_id:
            raise ShadowRootNotFound('Shadow root found but backend node ID is unavailable')

        resolved: ResolveNodeResponse = await self._execute_command(
            DomCommands.resolve_node(backend_node_id=backend_node_id)
        )
        shadow_object_id = resolved['result']['object']['objectId']
        mode = ShadowRootType(first_root.get('shadowRootType', 'open'))

        logger.debug(f'Shadow root resolved: object_id={shadow_object_id}, mode={mode.value}')
        return ShadowRoot(
            object_id=shadow_object_id,
            connection_handler=self._connection_handler,
            mode=mode,
            host_element=self,
        )

    async def get_children_elements(
        self,
        max_depth: int = 1,
        tag_filter: Optional[list[str]] = None,
        raise_exc: bool = False,
    ) -> list[WebElement]:
        """
        Retrieve all direct and nested child elements of this element.

        Args:
            max_depth (int, optional): Maximum depth to traverse when finding children.
                Defaults to 1 for direct children only.
            tag_filter (list[str], optional): List of HTML tag names to filter results.
                If empty or None, returns all child elements regardless of tag.
                Defaults to None, which is treated as an empty list.
            raise_exc (bool, optional): Raise ``ElementNotFound`` instead of returning
                an empty list when nothing is found. Defaults to False.

        Returns:
            list[WebElement]: List of child WebElement objects found within the specified
                depth and matching the tag filter criteria.

        Raises:
            ElementNotFound: If no child elements are found for this element and raise_exc is True.
        """
        # Build a fresh list per call rather than sharing one default object.
        active_filter: list[str] = [] if tag_filter is None else tag_filter
        logger.debug(
            f'Getting children: max_depth={max_depth}, '
            f'tag_filter={active_filter}, raise_exc={raise_exc}'
        )
        children = await self._get_family_elements(
            script=Scripts.GET_CHILDREN_NODE, max_depth=max_depth, tag_filter=active_filter
        )
        if not children and raise_exc:
            raise ElementNotFound(f'Child element not found for element: {self}')
        logger.debug(f'Children found: {len(children)}')
        return children

    async def get_siblings_elements(
        self, tag_filter: Optional[list[str]] = None, raise_exc: bool = False
    ) -> list[WebElement]:
        """
        Retrieve all sibling elements of this element (elements at the same DOM level).

        Args:
            tag_filter (list[str], optional): List of HTML tag names to filter results.
                If empty or None, returns all sibling elements regardless of tag.
                Defaults to None, which is treated as an empty list.
            raise_exc (bool, optional): Raise ``ElementNotFound`` instead of returning
                an empty list when nothing is found. Defaults to False.

        Returns:
            list[WebElement]: List of sibling WebElement objects that share the same
                parent as this element and match the tag filter criteria.

        Raises:
            ElementNotFound: If no sibling elements are found for this element
            and raise_exc is True.
        """
        # Build a fresh list per call rather than sharing one default object.
        active_filter: list[str] = [] if tag_filter is None else tag_filter
        logger.debug(f'Getting siblings: tag_filter={active_filter}, raise_exc={raise_exc}')
        siblings = await self._get_family_elements(
            script=Scripts.GET_SIBLINGS_NODE, tag_filter=active_filter
        )
        if not siblings and raise_exc:
            raise ElementNotFound(f'Sibling element not found for element: {self}')
        logger.debug(f'Siblings found: {len(siblings)}')
        return siblings

    async def take_screenshot(
        self,
        path: Optional[str | Path] = None,
        quality: int = 100,
        as_base64: bool = False,
    ) -> Optional[str]:
        """
        Capture a screenshot clipped to this element.

        The clip rectangle comes from ``get_bounds_using_js()``. The image format is
        derived from the extension of ``path`` (matched case-insensitively, with
        ``jpg`` treated as ``jpeg``); JPEG is used when no path is given.

        Args:
            path: Destination file; its extension selects the image format.
            quality: Image quality 0-100 (default 100).
            as_base64: Return the image as a base64 string instead of writing a file.
                When True, nothing is written even if ``path`` is supplied.

        Returns:
            Base64 screenshot data if as_base64=True, None otherwise.

        Raises:
            InvalidFileExtension: If the file extension is not supported.
            MissingScreenshotPath: If path is empty and as_base64 is False.
        """
        # NOTE(review): this method performs no explicit scroll; confirm whether
        # get_bounds_using_js() copes with elements outside the viewport.
        if not path and not as_base64:
            raise MissingScreenshotPath()

        # Lower-case the extension so 'shot.PNG' / 'shot.JPG' are accepted like
        # their lower-case spellings instead of being rejected as unsupported.
        if path and isinstance(path, str):
            output_extension = path.split('.')[-1].lower()
        elif path and isinstance(path, Path):
            output_extension = path.suffix.lstrip('.').lower()
        else:
            output_extension = ScreenshotFormat.JPEG

        # Normalize jpg to jpeg (CDP only accepts jpeg)
        if output_extension == 'jpg':
            output_extension = 'jpeg'

        if not ScreenshotFormat.has_value(output_extension):
            raise InvalidFileExtension(f'{output_extension} extension is not supported.')

        file_format = ScreenshotFormat.get_value(output_extension)

        bounds = await self.get_bounds_using_js()
        clip = Viewport(
            x=bounds['x'],
            y=bounds['y'],
            width=bounds['width'],
            height=bounds['height'],
            scale=1,
        )
        logger.debug(
            f'Taking element screenshot: path={path}, quality={quality}, as_base64={as_base64}, '
            f'clip={{x: {clip["x"]}, y: {clip["y"]}, w: {clip["width"]}, h: {clip["height"]}}}'
        )

        screenshot: CaptureScreenshotResponse = await self._connection_handler.execute_command(
            PageCommands.capture_screenshot(format=file_format, clip=clip, quality=quality)
        )

        screenshot_data = screenshot['result']['data']

        if as_base64:
            logger.info('Element screenshot captured and returned as base64')
            return screenshot_data

        if path:
            image_bytes = decode_base64_to_bytes(screenshot_data)
            async with aiofiles.open(str(path), 'wb') as file:
                await file.write(image_bytes)
            logger.info(f'Element screenshot saved: {path}')

        return None

    async def scroll_into_view(self):
        """Send the DomCommands.scroll_into_view_if_needed command for this element."""
        object_id = self._object_id
        scroll_command = DomCommands.scroll_into_view_if_needed(object_id=object_id)
        logger.info(f'Scrolling element into view: object_id={object_id}')
        await self._execute_command(scroll_command)

    async def wait_until(
        self,
        *,
        is_visible: bool = False,
        is_interactable: bool = False,
        timeout: int = 0,
    ):
        """Wait for element to meet specified conditions.

        Raises:
            ValueError: If neither ``is_visible`` nor ``is_interactable`` is True.
            WaitElementTimeout: If the condition is not met within ``timeout``.
        """
        checks_map = [
            (is_visible, self.is_visible),
            (is_interactable, self.is_interactable),
        ]
        checks = [func for flag, func in checks_map if flag]
        if not checks:
            raise ValueError('At least one of is_visible or is_interactable must be True')

        condition_parts = []
        if is_visible:
            condition_parts.append('visible')
        if is_interactable:
            condition_parts.append('interactable')
        condition_msg = ' and '.join(condition_parts)

        logger.info(
            f'Waiting for element: visible={is_visible}, '
            f'interactable={is_interactable}, timeout={timeout}s'
        )
        loop = asyncio.get_event_loop()
        start_time = loop.time()
        while True:
            results = await asyncio.gather(*(check() for check in checks))
            if all(results):
                logger.info(f'Element condition satisfied: {condition_msg}')
                return

            if timeout and loop.time() - start_time > timeout:
                logger.error(f'Timeout waiting for element to become {condition_msg}')
                raise WaitElementTimeout(f'Timed out waiting for element to become {condition_msg}')

            await asyncio.sleep(0.5)

    async def click_using_js(self):
        """
        Click the element by running the ``Scripts.CLICK`` script on it.

        Raises:
            ElementNotVisible: If the element is not visible after scrolling.
            ElementNotInteractable: If the click script reports a falsy result.

        Note:
            <option> elements are delegated to ``_click_option_tag()``.
            Other elements are scrolled into view before the visibility check.
        """
        is_option = await self._is_option_element()
        if is_option:
            return await self._click_option_tag()

        await self.scroll_into_view()

        visible = await self.is_visible()
        if not visible:
            raise ElementNotVisible()

        logger.info(f'Clicking element via JS: object_id={self._object_id}')
        response = await self.execute_script(Scripts.CLICK, return_by_value=True)
        if not response['result']['result']['value']:
            raise ElementNotInteractable()

    async def click(
        self,
        x_offset: int = 0,
        y_offset: int = 0,
        hold_time: float = 0.1,
        humanize: bool = False,
    ):
        """
        Click the element by dispatching mouse events at its center.

        Args:
            x_offset: Horizontal offset added to the element center.
            y_offset: Vertical offset added to the element center.
            hold_time: Seconds between the press and release events (raw path only).
            humanize: When True, a Mouse instance is available and the element has
                no iframe context, the click is delegated to ``self._mouse.click``.
                Otherwise raw mousePressed/mouseReleased events are dispatched.

        Raises:
            ElementNotVisible: If the element is not visible.

        Note:
            <option> elements are delegated to ``_click_option_tag()``.
            Visibility is checked first, then the element is scrolled into view.
        """
        if await self._is_option_element():
            return await self._click_option_tag()

        visible = await self.is_visible()
        if not visible:
            raise ElementNotVisible()

        await self.scroll_into_view()

        try:
            center = self._calculate_center(await self.bounds)
            target_x = center[0] + x_offset
            target_y = center[1] + y_offset
        except KeyError:
            # Fall back to the JS-reported rectangle when the bounds lookup hits a missing key.
            js_bounds = await self.get_bounds_using_js()
            target_x = js_bounds['x'] + js_bounds['width'] / 2 + x_offset
            target_y = js_bounds['y'] + js_bounds['height'] / 2 + y_offset

        in_iframe = getattr(self, '_iframe_context', None) is not None
        if humanize and self._mouse is not None and not in_iframe:
            logger.info(f'Clicking element (humanized): x={target_x}, y={target_y}')
            await self._mouse.click(target_x, target_y)
            return

        logger.info(f'Clicking element: x={target_x}, y={target_y}, hold={hold_time}s')
        click_x = int(target_x)
        click_y = int(target_y)
        # Both commands are built up front; only the event type differs between them.
        press_command, release_command = (
            InputCommands.dispatch_mouse_event(
                type=event_type,
                x=click_x,
                y=click_y,
                button=MouseButton.LEFT,
                click_count=1,
            )
            for event_type in (MouseEventType.MOUSE_PRESSED, MouseEventType.MOUSE_RELEASED)
        )
        await self._execute_command(press_command)
        await asyncio.sleep(hold_time)
        await self._execute_command(release_command)

    async def focus(self):
        """Give this element focus by executing the DomCommands.focus command."""
        focus_command = DomCommands.focus(object_id=self._object_id)
        await self._execute_command(focus_command)

    async def clear(self):
        """
        Empty the element's current value by running ``Scripts.CLEAR_INPUT``.

        On success the cached ``value`` attribute is reset for input and
        textarea elements so it stays in step with the page.

        Raises:
            ElementNotInteractable: If the script reports that the element
                does not accept text input.
        """
        logger.info('Clearing element value')
        response = await self.execute_script(Scripts.CLEAR_INPUT, return_by_value=True)
        cleared = response['result'].get('result', {}).get('value', False)
        if not cleared:
            logger.error('Element does not accept text input')
            raise ElementNotInteractable('Element does not accept text input')

        tag_name = self._attributes.get('tag_name', '').lower()
        if tag_name in {'input', 'textarea'}:
            self._attributes['value'] = ''

    async def insert_text(self, text: str):
        """
        Insert text into the element by running ``Scripts.INSERT_TEXT``.

        Args:
            text: Text passed to the script as its single argument.

        Raises:
            ElementNotInteractable: If the script reports that the element
                does not accept text input.

        Note:
            For input and textarea elements the cached ``value`` attribute is
            overwritten with ``text``; this mirrors the page only when the
            field was empty beforehand.
        """
        logger.info(f'Inserting text (length={len(text)})')
        script_arguments = [CallArgument(value=text)]
        response = await self.execute_script(
            Scripts.INSERT_TEXT, return_by_value=True, arguments=script_arguments
        )
        logger.debug(f'Insert text result: {response}')

        inserted = response['result'].get('result', {}).get('value', False)
        if not inserted:
            logger.error('Element does not accept text input')
            raise ElementNotInteractable('Element does not accept text input')

        # Refresh the cached value so simple assertions need no DOM round-trip.
        tag_name = self._attributes.get('tag_name', '').lower()
        if tag_name in {'input', 'textarea'}:
            self._attributes['value'] = text

    async def set_input_files(self, files: str | Path | list[str | Path]):
        """
        Attach one or more files to a file input element.

        Args:
            files: A single path or a list of paths; every entry is converted
                to ``str`` before being sent.

        Raises:
            ElementNotAFileInput: If the cached attributes do not describe an
                ``<input type="file">`` element.
        """
        is_input_tag = self._attributes.get('tag_name', '').lower() == 'input'
        # The type attribute is only inspected once the tag is known to be <input>.
        if not (is_input_tag and self._attributes.get('type', '').lower() == 'file'):
            raise ElementNotAFileInput()

        if isinstance(files, list):
            files_list = [str(entry) for entry in files]
        else:
            files_list = [str(files)]

        logger.info(f'Setting input files: count={len(files_list)}')
        upload_command = DomCommands.set_file_input_files(
            files=files_list, object_id=self._object_id
        )
        await self._execute_command(upload_command)

    async def type_text(
        self,
        text: str,
        humanize: bool = False,
        interval: Optional[float] = None,
    ):
        """
        Click the element, then type text through the keyboard helper.

        Args:
            text: Text to type into the element.
            humanize: Forwarded to both the click and the keyboard typing call.
            interval: Deprecated. Use humanize=True instead.
        """
        logger.info(f'Typing text (length={len(text)}, humanize={humanize})')
        await self.click(humanize=humanize)
        await self._get_keyboard().type_text(text, humanize=humanize, interval=interval)

    async def key_down(self, key: Key, modifiers: Optional[KeyModifier] = None):
        """
        Dispatch a key-down event for the given key.

        .. deprecated::
            This method is deprecated. Use ``tab.keyboard.down()`` instead.

        Note:
            No release event is sent; follow up with key_up() to complete a keypress.
        """
        deprecation_notice = (
            'WebElement.key_down() is deprecated. '
            'Use tab.keyboard API instead: await tab.keyboard.down(key, modifiers)'
        )
        warnings.warn(deprecation_notice, DeprecationWarning, stacklevel=2)

        name, virtual_code = key
        logger.info(f'Key down: key={name} code={virtual_code} modifiers={modifiers}')
        key_down_command = InputCommands.dispatch_key_event(
            type=KeyEventType.KEY_DOWN,
            key=name,
            windows_virtual_key_code=virtual_code,
            native_virtual_key_code=virtual_code,
            modifiers=modifiers,
        )
        await self._execute_command(key_down_command)

    async def key_up(self, key: Key):
        """
        Dispatch a key-up event (the counterpart of a preceding key_down()).

        .. deprecated::
            This method is deprecated. Use ``tab.keyboard.up()`` instead.
        """
        deprecation_notice = (
            'WebElement.key_up() is deprecated. '
            'Use tab.keyboard API instead: await tab.keyboard.up(key)'
        )
        warnings.warn(deprecation_notice, DeprecationWarning, stacklevel=2)

        name, virtual_code = key
        logger.info(f'Key up: key={name} code={virtual_code}')
        key_up_command = InputCommands.dispatch_key_event(
            type=KeyEventType.KEY_UP,
            key=name,
            windows_virtual_key_code=virtual_code,
            native_virtual_key_code=virtual_code,
        )
        await self._execute_command(key_up_command)

    async def press_keyboard_key(
        self,
        key: Key,
        modifiers: Optional[KeyModifier] = None,
        interval: float = 0.1,
    ):
        """
        Send a key-down, wait ``interval`` seconds, then send the matching key-up.

        .. deprecated::
            This method is deprecated. Use ``tab.keyboard.press()`` instead.

        Better for special keys (Enter, Tab, etc.) than type_text().
        """
        deprecation_notice = (
            'WebElement.press_keyboard_key() is deprecated. '
            'Use tab.keyboard API instead: await tab.keyboard.press(key, modifiers, interval)'
        )
        warnings.warn(deprecation_notice, DeprecationWarning, stacklevel=2)

        await self.key_down(key, modifiers)
        await asyncio.sleep(interval)
        await self.key_up(key)

    async def is_editable(self) -> bool:
        """
        Report whether the element accepts text input.

        Returns:
            The value produced by running ``Scripts.IS_EDITABLE`` on the element.
        """
        response = await self.execute_script(Scripts.IS_EDITABLE, return_by_value=True)
        editable = response['result']['result']['value']
        logger.debug(f'Element editable check: {editable}')
        return editable

    async def is_visible(self):
        """Run ``Scripts.ELEMENT_VISIBLE``; False when the response carries an error."""
        response = await self.execute_script(Scripts.ELEMENT_VISIBLE, return_by_value=True)
        if 'error' in response:
            return False
        value = response.get('result', {}).get('result', {}).get('value', False)
        return bool(value)

    async def is_on_top(self):
        """Run ``Scripts.ELEMENT_ON_TOP``; False when the response carries an error."""
        response = await self.execute_script(Scripts.ELEMENT_ON_TOP, return_by_value=True)
        if 'error' in response:
            return False
        value = response.get('result', {}).get('result', {}).get('value', False)
        return bool(value)

    async def is_interactable(self):
        """Run ``Scripts.ELEMENT_INTERACTIVE``; False when the response carries an error."""
        response = await self.execute_script(Scripts.ELEMENT_INTERACTIVE, return_by_value=True)
        if 'error' in response:
            return False
        value = response.get('result', {}).get('result', {}).get('value', False)
        return bool(value)

    async def execute_script(
        self,
        script: str,
        *,
        arguments: Optional[list[CallArgument]] = None,
        silent: Optional[bool] = None,
        return_by_value: Optional[bool] = None,
        generate_preview: Optional[bool] = None,
        user_gesture: Optional[bool] = None,
        await_promise: Optional[bool] = None,
        execution_context_id: Optional[int] = None,
        object_group: Optional[str] = None,
        throw_on_side_effect: Optional[bool] = None,
        unique_context_id: Optional[str] = None,
        serialization_options: Optional[SerializationOptions] = None,
    ) -> CallFunctionOnResponse:
        """
        Run JavaScript with this element bound as ``this``.

        A script that is not already a function is wrapped in
        ``function(){ ... }`` before being sent. Every keyword option is passed
        through unchanged to ``RuntimeCommands.call_function_on``.

        Args:
            script (str): JavaScript code to execute. Use 'this' to reference this element.
            arguments (Optional[list[CallArgument]]): Arguments handed to the function.
            silent (Optional[bool]): Whether to silence exceptions.
            return_by_value (Optional[bool]): Return the result by value instead of
                by reference.
            generate_preview (Optional[bool]): Whether to generate a preview for the result.
            user_gesture (Optional[bool]): Treat the call as initiated by a user gesture.
            await_promise (Optional[bool]): Whether to await a promise result.
            execution_context_id (Optional[int]): Execution context to call the function in.
            object_group (Optional[str]): Symbolic group name for the result.
            throw_on_side_effect (Optional[bool]): Throw if a side effect cannot be ruled out.
            unique_context_id (Optional[str]): Unique context ID for the function call.
            serialization_options (Optional[SerializationOptions]): Serialization options
                for the result.

        Returns:
            CallFunctionOnResponse: The result of the script execution.

        Examples:
            # Click the element
            await element.execute_script('this.click()')

            # Modify element style
            await element.execute_script('this.style.border = "2px solid red"')

            # Get element text
            result = await element.execute_script('return this.textContent', return_by_value=True)

            # Set element content
            await element.execute_script('this.textContent = "Hello World"')
        """
        if is_script_already_function(script):
            function_declaration = script
        else:
            function_declaration = f'function(){{ {script} }}'

        argument_count = len(arguments) if arguments else 0
        logger.debug(
            f'Executing script on element: return_by_value={return_by_value}, '
            f'length={len(function_declaration)}, args={argument_count}'
        )

        call_options = {
            'function_declaration': function_declaration,
            'object_id': self._object_id,
            'arguments': arguments,
            'silent': silent,
            'return_by_value': return_by_value,
            'generate_preview': generate_preview,
            'user_gesture': user_gesture,
            'await_promise': await_promise,
            'execution_context_id': execution_context_id,
            'object_group': object_group,
            'throw_on_side_effect': throw_on_side_effect,
            'unique_context_id': unique_context_id,
            'serialization_options': serialization_options,
        }
        command = RuntimeCommands.call_function_on(**call_options)
        return await self._execute_command(command)

    def __repr__(self):
        """String representation showing attributes and object ID."""
        attrs = ', '.join(f'{k}={v!r}' for k, v in self._attributes.items())
        return f'{self.__class__.__name__}({attrs})(object_id={self._object_id})'

    def _is_inside_iframe(self) -> bool:
        """Check if this element is inside an iframe context (not the iframe itself)."""
        return self._iframe_context is not None and not self.is_iframe

    async def _get_iframe_inner_html(self) -> str:
        """
        Return the HTML of the document loaded inside this iframe.

        Evaluates ``document.documentElement.outerHTML`` in the iframe's
        execution context; an empty string is returned when the response
        carries no value.

        Raises:
            InvalidIFrame: If the iframe context cannot be resolved.
        """
        context = await self.iframe_context
        if context is None:
            raise InvalidIFrame('Unable to resolve iframe context')

        evaluate_command = RuntimeCommands.evaluate(
            expression='document.documentElement.outerHTML',
            context_id=context.execution_context_id,
            return_by_value=True,
        )
        response: EvaluateResponse = await self._execute_command(evaluate_command)
        return response['result']['result'].get('value', '')

    def _apply_routing_from_context(self) -> None:
        """Apply routing attributes from iframe context.

        After iframe context resolution, commands targeting the *content* of
        the iframe should route through ``_iframe_context`` (handled by
        ``_resolve_routing`` which prioritises ``_iframe_context`` over
        ``_routing_session_*``).

        The ``_routing_session_handler`` / ``_routing_session_id`` attributes
        must be preserved: they identify the parent OOPIF session where the
        ``<iframe>`` *element itself* lives.  The resolver needs them to
        re-describe the element on subsequent re-resolutions.
        """

    async def _click_option_tag(self):
        """Click an <option> element by calling ``Scripts.CLICK_OPTION_TAG`` on it."""
        option_command = RuntimeCommands.call_function_on(
            object_id=self._object_id,
            function_declaration=Scripts.CLICK_OPTION_TAG,
            return_by_value=True,
        )
        await self._execute_command(option_command)

    async def _get_family_elements(
        self, script: str, max_depth: int = 1, tag_filter: list[str] = []
    ) -> list[WebElement]:
        """
        Run a family-lookup script and wrap every returned node in a WebElement.

        Args:
            script (str): Script template; its ``tag_filter`` and ``max_depth``
                placeholders are filled in with ``str.format`` before execution.
            max_depth (int, optional): Value substituted for ``max_depth``. Defaults to 1.
            tag_filter (list[str], optional): Value substituted for ``tag_filter``.
                Defaults to [].

        Returns:
            list[WebElement]: One element per indexed entry of the result that
                carries an object id; empty when the script result has no object id.
        """
        rendered_script = script.format(tag_filter=tag_filter, max_depth=max_depth)
        result = await self.execute_script(rendered_script)
        if not self._has_object_id_key(result):
            return []

        array_object_id = result['result']['result']['objectId']
        properties_response: GetPropertiesResponse = await self._execute_command(
            RuntimeCommands.get_properties(object_id=array_object_id)
        )

        family_elements: list[WebElement] = []
        for entry in properties_response['result']['result']:
            # Keep only numerically named properties that reference a remote object.
            is_indexed_node = entry['name'].isdigit() and 'objectId' in entry['value']
            if is_indexed_node:
                member_object_id = entry['value']['objectId']
                member_attributes = await self._get_object_attributes(
                    object_id=member_object_id
                )
                member = WebElement(
                    member_object_id,
                    self._connection_handler,
                    attributes_list=member_attributes,
                    mouse=self._mouse,
                )
                family_elements.append(member)

        logger.debug(f'Family elements found: {len(family_elements)}')
        return family_elements

    def _def_attributes(self, attributes_list: list[str]):
        """Store a flat ``[name, value, ...]`` list in ``_attributes`` ('class' -> 'class_name')."""
        for index in range(0, len(attributes_list), 2):
            name = attributes_list[index]
            if name == 'class':
                name = 'class_name'
            self._attributes[name] = attributes_list[index + 1]
        logger.debug(f'Attributes defined: count={len(self._attributes)}')

    def _is_option_tag(self):
        """Check if element is an <option> tag."""
        return self._attributes.get('tag_name', '').lower() == 'option'

    async def _is_option_element(self) -> bool:
        """
        Robust check for <option> elements, falling back to JS when tag_name is missing.
        """
        tag = self._attributes.get('tag_name', '')
        if tag:
            return tag.lower() == 'option'

        # Heuristic from original selector/method
        selector = str(getattr(self, '_selector', '') or '')
        method_raw = getattr(self, '_search_method', '')
        method = str(getattr(method_raw, 'value', method_raw) or '').lower()
        if method == 'tag_name' and selector.lower() == 'option':
            return True
        if method == 'xpath' and 'option' in selector.lower():
            return True

        result = await self.execute_script(Scripts.IS_OPTION_TAG, return_by_value=True)
        is_option = result.get('result', {}).get('result', {}).get('value', False)
        if is_option and not self._attributes.get('tag_name'):
            self._attributes['tag_name'] = 'option'
        return bool(is_option)

    @staticmethod
    def _calculate_center(bounds: list) -> tuple:
        """Calculate center point from bounding box coordinates."""
        x_values = [bounds[i] for i in range(0, len(bounds), 2)]
        y_values = [bounds[i] for i in range(1, len(bounds), 2)]
        x_center = sum(x_values) / len(x_values)
        y_center = sum(y_values) / len(y_values)
        return x_center, y_center


================================================
FILE: pydoll/exceptions.py
================================================
"""
Pydoll Exception Classes

This module contains all exception classes used throughout the Pydoll library,
organized into logical categories based on their function and usage patterns.
Each category uses a base class to provide common functionality for related exceptions.
"""


class PydollException(Exception):
    """Base class for all Pydoll exceptions.

    Subclasses supply their default text by overriding the ``message`` class
    attribute; a non-empty ``message`` passed to the constructor replaces it
    for that instance.
    """

    message = 'An error occurred in Pydoll'

    def __init__(self, message: str = ''):
        # An empty message falls back to the class-level default.
        self.message = message or self.message
        # Forward the effective message so ``args`` and ``repr()`` carry it too,
        # including when it was passed by keyword or taken from the default.
        super().__init__(self.message)

    def __str__(self):
        return self.message


class ConnectionException(PydollException):
    """Common parent for errors concerning the connection to the browser."""

    message = 'A connection error occurred'


class ConnectionFailed(ConnectionException):
    """Signals that a connection to the browser could not be established."""

    message = 'Failed to connect to the browser'


class ReconnectionFailed(ConnectionException):
    """Signals that an attempt to reconnect to the browser did not succeed."""

    message = 'Failed to reconnect to the browser'


class WebSocketConnectionClosed(ConnectionException):
    """Signals that the WebSocket connection to the browser closed unexpectedly."""

    message = 'The WebSocket connection is closed'


class NetworkError(ConnectionException):
    """Signals a general network failure while communicating with the browser."""

    message = 'A network error occurred'


class BrowserException(PydollException):
    """Common parent for errors concerning browser process management."""

    message = 'A browser error occurred'


class BrowserNotRunning(BrowserException):
    """Signals an interaction attempt with a browser that is not running."""

    message = 'The browser is not running'


class FailedToStartBrowser(BrowserException):
    """Signals that the browser process could not be started."""

    message = 'Failed to start the browser'


class UnsupportedOS(BrowserException):
    """Signals an attempt to run on an operating system that is not supported."""

    message = 'Unsupported OS'


class NoValidTabFound(BrowserException):
    """Signals that no valid browser tab could be found or created."""

    message = 'No valid attached tab found'


class InvalidConnectionPort(BrowserException):
    """Signals that the supplied connection port is invalid (not a positive integer)."""

    message = 'Connection port must be a positive integer'


class InvalidWebSocketAddress(BrowserException):
    """Signals a WebSocket address that is invalid, or missing where one is required."""

    message = 'Invalid WebSocket address'


class MissingTargetOrWebSocket(BrowserException):
    """Signals a Tab that has neither a target ID nor a WebSocket address available."""

    message = 'Tab has no target ID or WebSocket address'


class ProtocolException(PydollException):
    """Common parent for errors concerning CDP protocol communication."""

    message = 'A protocol error occurred'


class TopLevelTargetRequired(ProtocolException):
    """Signals a command that is only allowed on top-level targets."""

    message = 'Command can only be executed on top-level targets.'


class InvalidCommand(ProtocolException):
    """Signals that an invalid command was sent to the browser."""

    message = 'The command provided is invalid'


class InvalidResponse(ProtocolException):
    """Signals that the browser returned an invalid response."""

    message = 'The response received is invalid'


class ResendCommandFailed(ProtocolException):
    """Signals that resending a previously failed command also failed."""

    message = 'Failed to resend the command'


class CommandExecutionTimeout(ProtocolException):
    """Signals that executing a command timed out."""

    message = 'The command execution timed out'


class InvalidCallback(ProtocolException):
    """Signals that the callback supplied for an event is invalid."""

    message = 'The callback provided is invalid'


class EventNotSupported(ProtocolException):
    """Signals an attempt to subscribe to an event that is not supported."""

    message = 'The event is not supported'


class ElementException(PydollException):
    """Common parent for errors concerning element interactions."""

    message = 'An element interaction error occurred'


class ElementNotFound(ElementException):
    """Signals that an element could not be located in the DOM."""

    message = 'The specified element was not found'


class ElementNotVisible(ElementException):
    """Signals an interaction attempt with an element that is not visible."""

    message = 'The element is not visible'


class ElementNotInteractable(ElementException):
    """Signals an interaction attempt with an element that cannot receive it."""

    message = 'The element is not interactable'


class ClickIntercepted(ElementException):
    """Signals that another element intercepted a click operation."""

    message = 'The click was intercepted'


class ElementNotAFileInput(ElementException):
    """Signals use of file input methods on an element that is not a file input."""

    message = 'The element is not a file input'


class ShadowRootNotFound(ElementException):
    """Signals that the element has no shadow root attached."""

    message = 'No shadow root attached to this element'


class TimeoutException(PydollException):
    """Common parent for errors concerning timeouts."""

    message = 'A timeout occurred'


class PageLoadTimeout(TimeoutException):
    """Signals that a page load operation timed out."""

    message = 'Page load timed out'


class WaitElementTimeout(TimeoutException):
    """Signals that waiting for an element timed out."""

    message = 'Timed out waiting for element to appear'


class DownloadTimeout(TimeoutException):
    """Raised when waiting for a file download to complete times out."""

    message = 'Timed out waiting for download to complete'


class ConfigurationException(PydollException):
    """Base class for exceptions related to configuration and options.

    Catching this class also catches its subclasses, including
    ``InvalidOptionsObject``, ``InvalidBrowserPath``,
    ``ArgumentAlreadyExistsInOptions``, ``ArgumentNotFoundInOptions``,
    ``InvalidFileExtension``, ``InvalidTabInitialization`` and
    ``MissingScreenshotPath``.
    """

    message = 'A configuration error occurred'


class InvalidOptionsObject(ConfigurationException):
    """Raised when an invalid options object is provided."""

    # Class-level description text for this error.
    message = 'The options object provided is invalid'


class InvalidBrowserPath(ConfigurationException):
    """Raised when an invalid browser executable path is provided."""

    # Class-level description text for this error.
    message = 'The browser path provided is invalid'


class ArgumentAlreadyExistsInOptions(ConfigurationException):
    """Raised when attempting to add a duplicate argument to browser options."""

    # Class-level description text for this error.
    message = 'The argument already exists in the options'


class ArgumentNotFoundInOptions(ConfigurationException):
    """Raised when attempting to remove an argument that does not exist in browser options."""

    # Class-level description text for this error.
    message = 'The argument does not exist in the options'


class InvalidFileExtension(ConfigurationException):
    """Raised when an unsupported file extension is provided."""

    # Class-level description text for this error.
    message = 'The file extension provided is not supported'


class InvalidTabInitialization(ConfigurationException):
    """Raised when creating a Tab without connection_port, target_id or ws_address."""

    # Class-level description text for this error.
    message = 'Either connection_port, target_id, or ws_address must be provided'


class MissingScreenshotPath(ConfigurationException):
    """Raised when take_screenshot is called without path and not returning base64."""

    # Class-level description text for this error.
    message = 'path is required when as_base64 is False'


class DialogException(PydollException):
    """Base class for exceptions related to browser dialogs.

    Catching this class also catches ``NoDialogPresent``.
    """

    message = 'A dialog error occurred'


class NoDialogPresent(DialogException):
    """Raised when attempting to interact with a dialog that doesn't exist."""

    # Class-level description text for this error.
    message = 'No dialog present on the page'


class NotAnIFrame(PydollException):
    """Raised when an element is not an iframe.

    Derives directly from ``PydollException``; there is no shared iframe
    base class, so the iframe errors must be caught individually.
    """

    message = 'The element is not an iframe'


class InvalidIFrame(PydollException):
    """Raised when an iframe is not valid.

    ``IFrameContextResolver`` raises it with a specific message when the
    frame id, the isolated world or the document reference of an iframe
    cannot be obtained.
    """

    message = 'The iframe is not valid'


class IFrameNotFound(PydollException):
    """Raised when an iframe is not found.

    Derives directly from ``PydollException``.
    """

    message = 'The iframe was not found'


class NetworkEventsNotEnabled(PydollException):
    """Raised when network events are not enabled.

    Derives directly from ``PydollException``.
    """

    message = 'Network events not enabled'


class RequestException(PydollException):
    """Base class for exceptions related to HTTP requests.

    Catching this class also catches ``HTTPError`` and ``HarRecordingError``.
    """

    message = 'An HTTP request error occurred'


class HTTPError(RequestException):
    """Exception raised for HTTP error responses (4xx and 5xx status codes)."""

    # Class-level description text for this error.
    message = 'An HTTP error occurred'


class HarRecordingError(RequestException):
    """Raised when HAR recording fails."""

    # Class-level description text for this error.
    message = 'HAR recording error occurred'


class ScriptException(PydollException):
    """Base class for exceptions related to JavaScript execution.

    Catching this class also catches ``InvalidScriptWithElement``.
    """

    message = 'A script execution error occurred'


class InvalidScriptWithElement(ScriptException):
    """Raised when a script contains 'argument' but no element is provided."""

    # Class-level description text for this error.
    message = 'Script contains "argument" but no element was provided'


class WrongPrefsDict(PydollException):
    """Raised when the prefs dict provided contains the 'prefs' key.

    Derives directly from ``PydollException`` (it is not part of the
    ``ConfigurationException`` family).
    """

    message = 'The dict can not contain "prefs" key, provide only the prefs options'


class ElementPreconditionError(ElementException):
    """Raised when invalid or missing preconditions are provided for element operations.

    Member of the ``ElementException`` family, so handlers written for
    ``ElementException`` also receive this error.
    """

    message = 'Invalid element preconditions'


================================================
FILE: pydoll/interactions/__init__.py
================================================
from pydoll.constants import DEFAULT_TYPO_PROBABILITY, TypoType
from pydoll.interactions.iframe import IFrameContext, IFrameContextResolver
from pydoll.interactions.keyboard import (
    Keyboard,
    KeyboardAPI,
    TimingConfig,
    TypoConfig,
    TypoResult,
)
from pydoll.interactions.mouse import Mouse, MouseAPI, MouseTimingConfig
from pydoll.interactions.scroll import Scroll, ScrollAPI, ScrollTimingConfig

# Public API of ``pydoll.interactions``: every name listed here is imported
# above. Entries are kept in alphabetical order.
__all__ = [
    'DEFAULT_TYPO_PROBABILITY',
    'IFrameContext',
    'IFrameContextResolver',
    'Keyboard',
    'KeyboardAPI',
    'Mouse',
    'MouseAPI',
    'MouseTimingConfig',
    'Scroll',
    'ScrollAPI',
    'ScrollTimingConfig',
    'TimingConfig',
    'TypoConfig',
    'TypoResult',
    'TypoType',
]


================================================
FILE: pydoll/interactions/iframe.py
================================================
from __future__ import annotations

import logging
from dataclasses import dataclass
from typing import TYPE_CHECKING, Iterable, Optional

from pydoll.commands import DomCommands, PageCommands, RuntimeCommands, TargetCommands
from pydoll.connection import ConnectionHandler
from pydoll.exceptions import InvalidIFrame
from pydoll.protocol.dom.methods import DescribeNodeResponse, GetFrameOwnerResponse
from pydoll.protocol.dom.types import Node
from pydoll.protocol.page.methods import CreateIsolatedWorldResponse, GetFrameTreeResponse
from pydoll.protocol.page.types import Frame, FrameTree
from pydoll.protocol.runtime.methods import EvaluateResponse
from pydoll.protocol.target.methods import AttachToTargetResponse, GetTargetsResponse

if TYPE_CHECKING:
    from pydoll.elements.web_element import WebElement

logger = logging.getLogger(__name__)


@dataclass
class IFrameContext:
    """Context information for an iframe element.

    Built by ``IFrameContextResolver.resolve()``. Only ``frame_id`` is
    required at construction time; the other fields default to ``None`` and
    are filled in as the resolution progresses.
    """

    # Id of the frame the iframe element resolves to.
    frame_id: str
    # URL of the iframe document, when one could be determined.
    document_url: Optional[str] = None
    # Id of the isolated world (execution context) created for the frame.
    execution_context_id: Optional[int] = None
    # Object id of ``document.documentElement`` evaluated in that context.
    document_object_id: Optional[str] = None
    # Handler and session id of the attached target. ``resolve()`` sets them
    # together, and only when the frame was resolved through a separate
    # target session (OOPIF); otherwise both stay ``None``.
    session_handler: Optional[ConnectionHandler] = None
    session_id: Optional[str] = None


class IFrameContextResolver:
    """Resolves iframe context for WebElement."""

    def __init__(self, element: WebElement):
        """Store the iframe element whose context will be resolved.

        Args:
            element: The ``<iframe>`` WebElement. The resolver reads its
                ``_object_id``, ``_connection_handler`` and, when present,
                its ``_routing_session_handler`` / ``_routing_session_id``.
        """
        self._element = element

    async def resolve(self) -> IFrameContext:
        """
        Build the complete iframe context for the wrapped element.

        The element is described on its own (parent) session, the frame id is
        derived from that description (falling back to a frame-owner lookup),
        an OOPIF target session is attached when one matches, and finally an
        isolated world is created in the frame to obtain a reference to its
        ``document.documentElement``.

        Returns:
            IFrameContext with frame_id, document_url, execution_context_id,
            document_object_id and session info for OOPIF targets.

        Raises:
            InvalidIFrame: If unable to resolve the iframe context.
        """
        parent_handler, parent_session_id = self._get_base_session()
        described_node = await self._describe_element_node(parent_handler, parent_session_id)
        metadata = self._extract_frame_metadata(described_node)
        frame_id, document_url, content_frame_id, backend_node_id = metadata

        # No contentDocument frame id: look the frame up through its owner node.
        needs_owner_lookup = not frame_id and backend_node_id is not None
        if needs_owner_lookup:
            frame_id, document_url = await self._resolve_frame_by_owner(
                parent_handler, parent_session_id, backend_node_id, document_url
            )

        oopif_resolution = await self._resolve_oopif_if_needed(
            frame_id,
            content_frame_id,
            backend_node_id,
            current_document_url=document_url,
            base_handler=parent_handler,
            base_session_id=parent_session_id,
        )
        oopif_handler, oopif_session_id, frame_id, document_url = oopif_resolution

        if not frame_id:
            raise InvalidIFrame('Unable to resolve frameId for the iframe element')

        # Session info is only recorded when both halves of the pair exist.
        has_oopif_session = bool(oopif_handler and oopif_session_id)
        context = IFrameContext(
            frame_id=frame_id,
            document_url=document_url,
            session_handler=oopif_handler if has_oopif_session else None,
            session_id=oopif_session_id if has_oopif_session else None,
        )

        # The isolated world lives in the OOPIF session when there is one,
        # otherwise in the session the element itself was found in.
        world_handler = oopif_handler or parent_handler
        world_session_id = oopif_session_id or parent_session_id
        context.execution_context_id = await self._create_isolated_world_for_frame(
            frame_id, world_handler, world_session_id
        )

        context.document_object_id = await self._get_document_object_id(
            context.execution_context_id, context
        )
        return context

    def _get_base_session(self) -> tuple[ConnectionHandler, Optional[str]]:
        """Return the default handler and session id for routing commands."""
        handler = (
            getattr(self._element, '_routing_session_handler', None)
            or self._element._connection_handler
        )
        session_id = getattr(self._element, '_routing_session_id', None)
        return handler, session_id

    async def _describe_element_node(
        self,
        handler: ConnectionHandler,
        session_id: Optional[str],
    ) -> Node:
        """Run ``DOM.describeNode`` for the iframe element on an explicit session.

        The handler/session are passed in on purpose: this bypasses
        ``_resolve_routing()`` which, after a previous resolution, may return
        the iframe *content* session instead of the parent session where the
        element actually lives.

        Returns:
            The ``node`` payload of the response, or an empty dict when the
            response carries an ``error`` key or has no node.
        """
        describe_command = DomCommands.describe_node(object_id=self._element._object_id)
        if session_id:
            describe_command['sessionId'] = session_id
        described: DescribeNodeResponse = await handler.execute_command(describe_command)
        if 'error' not in described:
            return described.get('result', {}).get('node', {})
        return {}

    @staticmethod
    def _extract_frame_metadata(
        node_info: Node,
    ) -> tuple[Optional[str], Optional[str], Optional[str], Optional[int]]:
        """Extract iframe-related metadata from DOM node info.

        Returns:
            Tuple of (frame_id, document_url, content_frame_id, backend_node_id).
            ``content_frame_id`` is the frame ID of the frame *created* by the
            ``<iframe>`` element (``node_info['frameId']`` on frame-owner
            elements).  For same-origin iframes it equals
            ``contentDocument.frameId``; for OOPIFs ``contentDocument`` is
            absent but ``content_frame_id`` is still set by the browser.
        """
        content_document = node_info.get('contentDocument') or {}
        content_frame_id = node_info.get('frameId')
        backend_node_id = node_info.get('backendNodeId')
        frame_id = content_document.get('frameId')
        document_url = (
            content_document.get('documentURL')
            or content_document.get('baseURL')
            or node_info.get('documentURL')
            or node_info.get('baseURL')
        )
        return frame_id, document_url, content_frame_id, backend_node_id

    async def _resolve_frame_by_owner(
        self,
        base_handler: ConnectionHandler,
        base_session_id: Optional[str],
        backend_node_id: int,
        current_document_url: Optional[str],
    ) -> tuple[Optional[str], Optional[str]]:
        """Find the frame owned by ``backend_node_id`` and return its id and URL.

        Returns:
            ``(frame_id, url)`` of the matching frame, with
            ``current_document_url`` used when the frame reports no URL, or
            ``(None, current_document_url)`` when no frame matches.
        """
        matched_frame_id, matched_url = await self._find_frame_by_owner(
            base_handler, base_session_id, backend_node_id
        )
        if matched_frame_id:
            return matched_frame_id, matched_url or current_document_url
        return None, current_document_url

    async def _find_frame_by_owner(
        self,
        handler: ConnectionHandler,
        session_id: Optional[str],
        backend_node_id: int,
    ) -> tuple[Optional[str], Optional[str]]:
        """Scan the frame tree for the frame whose owner node is ``backend_node_id``.

        Every frame that has an id is checked in tree order with one
        frame-owner lookup each; the first match wins.

        Returns:
            ``(frame_id, url)`` of the first matching frame, or
            ``(None, None)`` when nothing matches.
        """
        tree = await self._get_frame_tree_for(handler, session_id)
        for descriptor in self._walk_frames(tree):
            frame_id = descriptor.get('id', '')
            if not frame_id:
                continue
            owner_id = await self._owner_backend_for(handler, session_id, frame_id)
            if owner_id == backend_node_id:
                return frame_id, descriptor.get('url')
        return None, None

    @staticmethod
    async def _get_frame_tree_for(
        handler: ConnectionHandler,
        session_id: Optional[str],
    ) -> FrameTree:
        """Get Page frame tree for the given connection/target.

        Args:
            handler: Connection used to send ``Page.getFrameTree``.
            session_id: Optional target session to route the command to.

        Returns:
            The ``frameTree`` payload, or an empty dict when the response has
            no ``result``/``frameTree`` (for example an error response).
            Callers already treat an empty tree as "no frames", so a target
            that cannot report a frame tree is skipped instead of aborting
            the whole resolution with a ``KeyError``.
        """
        command = PageCommands.get_frame_tree()
        if session_id:
            command['sessionId'] = session_id
        response: GetFrameTreeResponse = await handler.execute_command(command)
        # Tolerant lookups, matching how the sibling helpers read responses.
        return response.get('result', {}).get('frameTree', {})

    @staticmethod
    def _walk_frames(tree: FrameTree) -> Iterable[Frame]:
        """Recursively traverse FrameTree and collect all frame descriptors."""
        if not tree:
            return []
        frames: list[Frame] = [tree['frame']]
        for child_frame in tree.get('childFrames', []) or []:
            frames.extend(IFrameContextResolver._walk_frames(child_frame))
        return [frame_node for frame_node in frames if frame_node]

    @staticmethod
    async def _owner_backend_for(
        handler: ConnectionHandler,
        session_id: Optional[str],
        frame_id: str,
    ) -> Optional[int]:
        """Return the backendNodeId of the DOM element owning ``frame_id``.

        Sends ``DOM.getFrameOwner`` through ``handler`` (routed to
        ``session_id`` when given). Returns ``None`` when the response has
        no ``result`` or no ``backendNodeId``.
        """
        owner_command = DomCommands.get_frame_owner(frame_id=frame_id)
        if session_id:
            owner_command['sessionId'] = session_id
        owner_response: GetFrameOwnerResponse = await handler.execute_command(owner_command)
        result_payload = owner_response.get('result', {})
        return result_payload.get('backendNodeId')

    async def _resolve_oopif_if_needed(
        self,
        current_frame_id: Optional[str],
        content_frame_id: Optional[str],
        backend_node_id: Optional[int],
        current_document_url: Optional[str],
        base_handler: Optional[ConnectionHandler] = None,
        base_session_id: Optional[str] = None,
    ) -> tuple[Optional[ConnectionHandler], Optional[str], Optional[str], Optional[str]]:
        """Resolve OOPIF and routing when needed."""
        if not content_frame_id or (current_frame_id and backend_node_id is None):
            return None, None, current_frame_id, current_document_url

        (
            session_handler,
            session_id,
            resolved_frame_id,
            resolved_url,
        ) = await self._resolve_oopif_by_parent(
            content_frame_id, backend_node_id, base_handler, base_session_id
        )

        if session_handler and session_id and resolved_url:
            return (
                session_handler,
                session_id,
                resolved_frame_id or current_frame_id,
                resolved_url or current_document_url,
            )

        return (
            None,
            None,
            current_frame_id or resolved_frame_id,
            current_document_url or resolved_url,
        )

    async def _resolve_oopif_by_parent(
        self,
        content_frame_id: str,
        backend_node_id: Optional[int],
        base_handler: Optional[ConnectionHandler] = None,
        base_session_id: Optional[str] = None,
    ) -> tuple[Optional[ConnectionHandler], Optional[str], Optional[str], Optional[str]]:
        """Resolve out-of-process iframe using content frame id.

        ``content_frame_id`` is the frame ID of the frame *created* by the
        ``<iframe>`` element (obtained from ``DOM.describeNode``'s
        ``node.frameId``).  For OOPIF targets the root frame of the target
        shares this ID, so we can match directly without needing
        ``DOM.getFrameOwner``.

        When a direct frame-ID match is not possible (e.g. nested sub-frames
        inside the OOPIF), the method falls back to ``DOM.getFrameOwner``
        using the routing handler/session that has DOM visibility into the
        parent context.

        The search runs in two passes over the browser's targets of type
        ``iframe``/``page``:

        1. Targets whose ``parentFrameId`` equals ``content_frame_id``. A
           lone such target is accepted as-is when no ``backend_node_id`` is
           available; otherwise the target's root frame must be owned by
           ``backend_node_id``.
        2. Every such target: direct root-frame-id match, then owner match,
           then a child frame whose ``parentId`` is ``content_frame_id``.

        Returns:
            ``(browser_handler, session_id, frame_id, url)`` for the first
            match (``url`` is ``None`` for a child-frame match), or four
            ``None`` values when nothing matches.
        """
        browser_handler = ConnectionHandler(
            connection_port=self._element._connection_handler._connection_port
        )
        targets_response: GetTargetsResponse = await browser_handler.execute_command(
            TargetCommands.get_targets()
        )
        target_infos = targets_response.get('result', {}).get('targetInfos', [])

        # The handler/session that can resolve DOM.getFrameOwner for the
        # element's context.  When the <iframe> lives inside a nested OOPIF
        # the Tab-level handler has no visibility; we must route through the
        # session that originally found the element.
        owner_handler = base_handler or self._element._connection_handler
        owner_session_id = base_session_id

        frame_target_types = {'iframe', 'page'}
        direct_children = [
            target_info
            for target_info in target_infos
            if target_info.get('type') in frame_target_types
            and target_info.get('parentFrameId') == content_frame_id
        ]
        is_single_child = len(direct_children) == 1

        # Pass 1: targets that report this frame as their parent frame.
        for child_target in direct_children:
            attached = await self._attach_and_read_root(
                browser_handler, child_target['targetId']
            )
            if attached is None:
                continue
            attached_session_id, _, root_frame = attached
            root_frame_id = root_frame.get('id', '')
            if not root_frame_id:
                continue
            match = (browser_handler, attached_session_id, root_frame_id, root_frame.get('url'))

            if backend_node_id is None:
                # Without an owner node to verify against, only an
                # unambiguous (single) child is accepted.
                if is_single_child:
                    return match
                continue

            owner_backend_id = await self._owner_backend_for(
                owner_handler, owner_session_id, root_frame_id
            )
            if owner_backend_id == backend_node_id:
                return match

        # Pass 2: scan every frame-like target.
        for target_info in target_infos:
            if target_info.get('type') not in frame_target_types:
                continue
            attached = await self._attach_and_read_root(
                browser_handler, target_info.get('targetId', '')
            )
            if attached is None:
                continue
            attached_session_id, frame_tree, root_frame = attached
            root_frame_id = root_frame.get('id', '')
            match = (browser_handler, attached_session_id, root_frame_id, root_frame.get('url'))

            # Direct match: the <iframe> element's frameId (content_frame_id)
            # equals this target's root frame ID.  This handles nested OOPIFs
            # where DOM.getFrameOwner cannot be resolved through the main
            # page handler.
            if root_frame_id and root_frame_id == content_frame_id:
                return match

            if root_frame_id and backend_node_id is not None:
                owner_backend_id = await self._owner_backend_for(
                    owner_handler, owner_session_id, root_frame_id
                )
                if owner_backend_id == backend_node_id:
                    return match

            child_frame_id = self._find_child_by_parent(frame_tree, content_frame_id)
            if child_frame_id:
                return browser_handler, attached_session_id, child_frame_id, None

        return None, None, None, None

    async def _attach_and_read_root(
        self,
        browser_handler: ConnectionHandler,
        target_id: str,
    ) -> Optional[tuple[str, FrameTree, Frame]]:
        """Attach to a target and read its frame tree.

        Returns:
            ``(session_id, frame_tree, root_frame)`` for the attached target,
            where ``root_frame`` is an empty dict when the tree has no root
            frame, or ``None`` when attaching yields no session id.
        """
        attach_response: AttachToTargetResponse = await browser_handler.execute_command(
            TargetCommands.attach_to_target(target_id=target_id, flatten=True)
        )
        attached_session_id = attach_response.get('result', {}).get('sessionId')
        if not attached_session_id:
            return None

        frame_tree = await self._get_frame_tree_for(browser_handler, attached_session_id)
        root_frame = (frame_tree or {}).get('frame', {})
        return attached_session_id, frame_tree, root_frame

    @staticmethod
    def _find_child_by_parent(tree: FrameTree, parent_id: str) -> Optional[str]:
        """Find id of child frame whose parentId equals the given one."""
        if not tree:
            return None
        for child in tree.get('childFrames', []) or []:
            child_frame = child.get('frame', {})
            if child_frame.get('parentId') == parent_id:
                return child_frame.get('id')
            found = IFrameContextResolver._find_child_by_parent(child, parent_id)
            if found:
                return found
        return None

    @staticmethod
    async def _create_isolated_world_for_frame(
        frame_id: str,
        handler: ConnectionHandler,
        session_id: Optional[str],
    ) -> int:
        """Create an isolated world in ``frame_id`` and return its context id.

        The world is named ``pydoll::iframe::<frame_id>`` and is created with
        universal access granted. The command is routed to ``session_id``
        when one is given.

        Raises:
            InvalidIFrame: If the response carries no execution context id.
        """
        world_command = PageCommands.create_isolated_world(
            frame_id=frame_id,
            world_name=f'pydoll::iframe::{frame_id}',
            grant_universal_access=True,
        )
        if session_id:
            world_command['sessionId'] = session_id
        world_response: CreateIsolatedWorldResponse = await handler.execute_command(world_command)
        context_id = world_response.get('result', {}).get('executionContextId')
        if context_id:
            return context_id
        raise InvalidIFrame('Unable to create isolated world for iframe')

    async def _get_document_object_id(
        self,
        execution_context_id: int,
        context: IFrameContext,
    ) -> str:
        """Get document.documentElement object id in iframe context.

        The evaluation must travel over the same handler/session in which
        the isolated world was created, because ``execution_context_id`` is
        only meaningful there. ``resolve()`` creates the world through the
        OOPIF session when one exists and through the element's base routing
        session otherwise, so the same fallback is applied here. Using the
        element's plain connection handler without a session id would miss
        the context when the element itself lives in a routed session.

        Args:
            execution_context_id: Id of the isolated world to evaluate in.
            context: Iframe context; its ``session_handler``/``session_id``
                take precedence over the element's base routing session.

        Returns:
            Object id of ``document.documentElement`` in the iframe.

        Raises:
            InvalidIFrame: If the evaluation returns no object id.
        """
        evaluate_command = RuntimeCommands.evaluate(
            expression='document.documentElement',
            context_id=execution_context_id,
        )

        # With no routing session on the element this yields
        # (element._connection_handler, None), i.e. the previous behaviour.
        base_handler, base_session_id = self._get_base_session()
        handler = context.session_handler or base_handler
        session_id = context.session_id or base_session_id
        if session_id:
            evaluate_command['sessionId'] = session_id

        evaluate_response: EvaluateResponse = await handler.execute_command(evaluate_command)

        result_object = evaluate_response.get('result', {}).get('result', {})
        document_object_id = result_object.get('objectId')
        if not document_object_id:
            raise InvalidIFrame('Unable to obtain document reference for iframe')
        return document_object_id


================================================
FILE: pydoll/interactions/keyboard.py
================================================
from __future__ import annotations

import asyncio
import logging
import random
import warnings
from dataclasses import dataclass
from typing import Any, Optional, Protocol, cast

from pydoll.commands import InputCommands
from pydoll.constants import (
    CHAR_TO_KEY_INFO,
    DEFAULT_TYPO_PROBABILITY,
    QWERTY_NEIGHBORS,
    Key,
    TypoType,
)
from pydoll.protocol.input.types import KeyEventType, KeyModifier

logger = logging.getLogger(__name__)


class CommandExecutor(Protocol):
    """Protocol for objects that can execute CDP commands.

    Structural type: any object exposing an awaitable ``_execute_command``
    satisfies it. ``Keyboard`` sends every key event through this method.
    """

    async def _execute_command(self, command: Any) -> Any: ...


@dataclass(frozen=True)
class TypoResult:
    """Result of a typo generation.

    Immutable value object consumed by ``Keyboard._handle_typo``.
    """

    # Which kind of typo to simulate.
    typo_type: TypoType
    # Character to type by mistake; read by the ADJACENT branch of
    # ``Keyboard._handle_typo``. Defaults to an empty string.
    wrong_char: str = ''


@dataclass(frozen=True)
class TimingConfig:
    """Configuration for realistic typing timing.

    Each ``*_min``/``*_max`` pair bounds a delay. ``Keyboard`` draws a value
    with ``random.uniform(min, max)`` and passes it to ``asyncio.sleep``,
    so the values are in seconds. That usage is visible for the
    ``keystroke``, ``mistake_realize``, ``after_correction`` and
    ``double_press`` pairs; the remaining pairs are presumably used the
    same way by code outside this view.
    """

    # Delay between ordinary keystrokes.
    keystroke_min: float = 0.03
    keystroke_max: float = 0.12
    # Presumably the delay around punctuation characters - TODO confirm.
    punctuation_min: float = 0.08
    punctuation_max: float = 0.18
    # Presumably chance and length of a "thinking" pause - TODO confirm.
    thinking_probability: float = 0.02
    thinking_min: float = 0.3
    thinking_max: float = 0.7
    # Presumably chance and length of a "distraction" pause - TODO confirm.
    distraction_probability: float = 0.005
    distraction_min: float = 0.5
    distraction_max: float = 1.2
    # Pause after a wrong keystroke, before it is corrected.
    mistake_realize_min: float = 0.1
    mistake_realize_max: float = 0.25
    # Pause after the backspace(s), before the correct text is typed.
    after_correction_min: float = 0.03
    after_correction_max: float = 0.08
    # Pause after the first press of a doubled character.
    double_press_min: float = 0.02
    double_press_max: float = 0.05
    # Presumably a short hesitation pause - TODO confirm.
    hesitation_min: float = 0.15
    hesitation_max: float = 0.3


@dataclass(frozen=True)
class TypoConfig:
    """Configuration for typo generation weights.

    One weight per typo kind; the defaults add up to 1.0. How the weights
    are combined is decided by the typo generator, which is outside this
    view (presumably a weighted random choice - TODO confirm).
    """

    # Weight of typing a wrong, adjacent key.
    adjacent_weight: float = 0.55
    # Weight of typing two characters in swapped order.
    transpose_weight: float = 0.20
    # Weight of typing a character twice.
    double_weight: float = 0.12
    # Weight of the "skip" typo.
    skip_weight: float = 0.08
    # Weight of the "missed space" typo.
    missed_space_weight: float = 0.05


class Keyboard:
    """
    Keyboard input controller for Tab and WebElement.

    Provides methods for:
    - Tab: Public keyboard simulation (press, down, up, hotkey)
    - WebElement: Private text typing with optional humanization
    """

    PAUSE_CHARS = frozenset(' .,!?;:\n')

    def __init__(
        self,
        executor: CommandExecutor,
        timing: Optional[TimingConfig] = None,
        typo_config: Optional[TypoConfig] = None,
    ):
        """
        Initialize keyboard controller.

        Args:
            executor: Object with _execute_command method (Tab or WebElement).
            timing: Optional custom timing configuration.
            typo_config: Optional custom typo weights configuration.
        """
        self._executor = executor
        self._timing = timing or TimingConfig()
        self._typo_config = typo_config or TypoConfig()
        self._has_focus = hasattr(executor, 'focus')

    async def _ensure_focus(self):
        """Re-focus the executor element before a keystroke if it supports focus."""
        if self._has_focus:
            await self._executor.focus()

    async def press(
        self,
        key: Key,
        modifiers: Optional[KeyModifier] = None,
        interval: float = 0.1,
    ):
        """
        Press and release a key (down + wait + up).

        The modifiers are only sent with the key-down event; the key-up
        event is dispatched without them.

        Args:
            key: Key to press (from Key enum).
            modifiers: Optional key modifiers (Alt=1, Ctrl=2, Meta=4, Shift=8).
            interval: Time to hold the key down in seconds.

        Example:
            await tab.keyboard.press(Key.ENTER)
            await tab.keyboard.press(Key.A, modifiers=KeyModifier.CTRL)
        """
        logger.info(f'Pressing key: {key} with modifiers: {modifiers}')
        await self.down(key, modifiers)
        # Hold the key for ``interval`` seconds before releasing it.
        await asyncio.sleep(interval)
        await self.up(key)

    async def down(self, key: Key, modifiers: Optional[KeyModifier] = None):
        """
        Dispatch a key-down event, leaving the key pressed.

        The key unpacks into a name and a key code; the same code is sent as
        both the Windows and the native virtual key code.

        Args:
            key: Key to press down (from Key enum).
            modifiers: Optional key modifiers.
        """
        name, virtual_key_code = key
        logger.debug(f'Key down: {name}')
        await self._executor._execute_command(
            InputCommands.dispatch_key_event(
                type=KeyEventType.KEY_DOWN,
                key=name,
                windows_virtual_key_code=virtual_key_code,
                native_virtual_key_code=virtual_key_code,
                modifiers=modifiers,
            )
        )

    async def up(self, key: Key):
        """
        Dispatch a key-up event for the given key.

        The key unpacks into a name and a key code; the same code is sent as
        both the Windows and the native virtual key code. No modifiers are
        sent with the event.

        Args:
            key: Key to release (from Key enum).
        """
        name, virtual_key_code = key
        logger.debug(f'Key up: {name}')
        await self._executor._execute_command(
            InputCommands.dispatch_key_event(
                type=KeyEventType.KEY_UP,
                key=name,
                windows_virtual_key_code=virtual_key_code,
                native_virtual_key_code=virtual_key_code,
            )
        )

    async def hotkey(self, key1: Key, key2: Key, key3: Optional[Key] = None):
        """
        Execute a key combination (hotkey) with up to 3 keys.

        The keys are split into modifiers and regular keys. Modifier keys are
        not dispatched as events of their own: their combined value is sent
        with the key-down of every regular key. Regular keys are pressed in
        order and released in reverse order.

        Args:
            key1: First key (usually a modifier like Ctrl, Shift, Alt).
            key2: Second key.
            key3: Optional third key.

        Example:
            await tab.keyboard.hotkey(Key.CONTROL, Key.C)  # Ctrl+C
        """
        logger.info(f'Hotkey: {key1} + {key2}' + (f' + {key3}' if key3 else ''))
        combo = [key1, key2] if key3 is None else [key1, key2, key3]

        modifier_keys, regular_keys = self._split_modifiers_and_keys(combo)
        modifier_mask = self._calculate_modifier_value(modifier_keys)

        for pressed in regular_keys:
            await self.down(pressed, modifiers=modifier_mask)
            await asyncio.sleep(0.05)

        # Keep the whole combination held briefly before releasing.
        await asyncio.sleep(0.1)

        for released in reversed(regular_keys):
            await self.up(released)
            await asyncio.sleep(0.05)

    async def type_text(
        self,
        text: str,
        humanize: bool = False,
        interval: Optional[float] = None,
    ):
        """
        Type text character by character.

        Args:
            text: Text to type.
            humanize: When True, simulates human-like typing with
                variable delays and occasional typos (~2%).
            interval: Deprecated. Use humanize=True instead.

        Example:
            await tab.keyboard.type_text("Hello World", humanize=True)
            await tab.keyboard.type_text("Hello World")
        """
        if interval is not None:
            warnings.warn(
                'The "interval" parameter is deprecated and will be removed '
                'in a future version. Use "humanize=True" for realistic typing.',
                DeprecationWarning,
                stacklevel=2,
            )

        if humanize:
            await self._type_text_humanized(text)
            return

        for current_char in text:
            await self._type_char(current_char)
            await asyncio.sleep(0.05)

    async def _type_text_humanized(self, text: str):
        """Type text with realistic human-like behavior."""
        char_index = 0
        while char_index < len(text):
            current_char = text[char_index]
            next_char = text[char_index + 1] if char_index + 1 < len(text) else None

            should_skip_next = await self._process_char_with_typo(current_char, next_char)

            if should_skip_next:
                char_index += 1

            await self._apply_realistic_delay(current_char)
            char_index += 1

    async def _type_char(self, char: str):
        """Type one character as a key-down/key-up pair, re-focusing first.

        Key name, code and virtual key code come from ``CHAR_TO_KEY_INFO``;
        characters missing from that table fall back to the character itself
        with an empty code and key code 0. Only the key-down event carries
        the text.
        """
        await self._ensure_focus()
        key, code, keycode = CHAR_TO_KEY_INFO.get(char, (char, '', 0))
        # Fields common to the down and up events.
        shared_fields = {
            'key': key,
            'code': code,
            'windows_virtual_key_code': keycode,
            'native_virtual_key_code': keycode,
        }

        await self._executor._execute_command(
            InputCommands.dispatch_key_event(
                type=KeyEventType.KEY_DOWN,
                text=char,
                unmodified_text=char,
                **shared_fields,
            )
        )
        await self._executor._execute_command(
            InputCommands.dispatch_key_event(type=KeyEventType.KEY_UP, **shared_fields)
        )

    async def _type_backspace(self):
        """Re-focus the executor, then press and release Backspace."""
        await self._ensure_focus()
        for dispatch in (self.down, self.up):
            await dispatch(Key.BACKSPACE)

    async def _process_char_with_typo(
        self,
        current_char: str,
        next_char: Optional[str],
    ) -> bool:
        """Type ``current_char``, either cleanly or through a simulated typo.

        Returns:
            True when the following character was typed as part of the typo
            and must be skipped by the caller, False otherwise.
        """
        if self._should_make_typo():
            generated_typo = self._generate_typo(current_char, next_char)
            return await self._handle_typo(current_char, next_char, generated_typo)

        await self._type_char(current_char)
        return False

    async def _handle_typo(
        self,
        current_char: str,
        next_char: Optional[str],
        typo: TypoResult,
    ) -> bool:
        """Act out the given typo for ``current_char``.

        TRANSPOSE needs a following character, and MISSED_SPACE needs the
        current character to be a space with a following character; when
        those conditions are not met (or the typo type is not handled) the
        character is typed normally.

        Returns:
            True when the next character was consumed by the typo
            (TRANSPOSE and MISSED_SPACE), False otherwise.
        """
        kind = typo.typo_type
        skip_next = False

        if kind == TypoType.ADJACENT:
            await self._do_adjacent_typo(current_char, typo.wrong_char)
        elif kind == TypoType.TRANSPOSE and next_char:
            await self._do_transpose_typo(current_char, next_char)
            skip_next = True
        elif kind == TypoType.DOUBLE:
            await self._do_double_typo(current_char)
        elif kind == TypoType.SKIP:
            await self._do_skip_typo(current_char)
        elif kind == TypoType.MISSED_SPACE and current_char == ' ' and next_char:
            await self._do_missed_space_typo(current_char, next_char)
            skip_next = True
        else:
            await self._type_char(current_char)

        return skip_next

    async def _do_adjacent_typo(self, correct_char: str, wrong_char: str):
        """Type wrong adjacent key, pause, backspace, correct."""
        timing = self._timing
        await self._type_char(wrong_char)
        await asyncio.sleep(random.uniform(timing.mistake_realize_min, timing.mistake_realize_max))
        await self._type_backspace()
        await asyncio.sleep(
            random.uniform(timing.after_correction_min, timing.after_correction_max)
        )
        await self._type_char(correct_char)

    async def _do_transpose_typo(self, current_char: str, next_char: str):
        """Type chars in wrong order, then fix."""
        timing = self._timing
        await self._type_char(next_char)
        await asyncio.sleep(random.uniform(timing.keystroke_min, timing.keystroke_max))
        await self._type_char(current_char)

        await asyncio.sleep(random.uniform(timing.mistake_realize_min, timing.mistake_realize_max))
        await self._type_backspace()
        await self._type_backspace()
        await asyncio.sleep(
            random.uniform(timing.after_correction_min, timing.after_correction_max)
        )

        await self._type_char(current_char)
        await asyncio.sleep(random.uniform(timing.keystroke_min, timing.keystroke_max))
        await self._type_char(next_char)

    async def _do_double_typo(self, current_char: str):
        """Type character twice, then backspace."""
        timing = self._timing
        await self._type_char(current_char)
        await asyncio.sleep(random.uniform(timing.double_press_min, timing.double_press_max))
        await self._type_char(current_char)
        await asyncio.sleep(random.uniform(timing.mistake_realize_min, timing.mistake_realize_max))
        await self._type_backspace()

    async def _do_skip_typo(self, current_char: str):
        """Hesitate, then type normally."""
        timing = self._timing
        await asyncio.sleep(random.uniform(timing.hesitation_min, timing.hesitation_max))
        await self._type_char(current_char)

    async def _do_missed_space_typo(self, space_char: str, next_char: str):
        """Miss space, type next char, realize, go back and fix."""
        timing = self._timing
        await self._type_char(next_char)
        await asyncio.sleep(random.uniform(timing.mistake_realize_min, timing.mistake_realize_max))
        await self._type_backspace()
        await asyncio.sleep(
            random.uniform(timing.after_correction_min, timing.after_correction_max)
        )
        await self._type_char(space_char)
        await asyncio.sleep(
            random.uniform(timing.after_correction_min, timing.after_correction_max)
        )
        await self._type_char(next_char)

    async def _apply_realistic_delay(self, typed_char: str):
        """Apply realistic delay after typing a character."""
        timing = self._timing
        delay = random.uniform(timing.keystroke_min, timing.keystroke_max)

        if typed_char in self.PAUSE_CHARS:
            delay += random.uniform(timing.punctuation_min, timing.punctuation_max)

        if random.random() < timing.thinking_probability:
            delay += random.uniform(timing.thinking_min, timing.thinking_max)

        if random.random() < timing.distraction_probability:
            delay += random.uniform(timing.distraction_min, timing.distraction_max)

        await asyncio.sleep(delay)

    @staticmethod
    def _should_make_typo() -> bool:
        """Return True when a fresh random draw falls below ``DEFAULT_TYPO_PROBABILITY``."""
        roll = random.random()
        return roll < DEFAULT_TYPO_PROBABILITY

    def _generate_typo(self, current_char: str, next_char: Optional[str]) -> TypoResult:
        """Generate a realistic typo based on QWERTY layout."""
        typo_type = self._select_typo_type()
        return self._create_typo(typo_type, current_char, next_char)

    def _select_typo_type(self) -> TypoType:
        """
        Draw one typo type at random, weighted by the typo configuration.

        Returns:
            One of ADJACENT, TRANSPOSE, DOUBLE, SKIP or MISSED_SPACE.
        """
        cfg = self._typo_config
        weighted_kinds = (
            (TypoType.ADJACENT, cfg.adjacent_weight),
            (TypoType.TRANSPOSE, cfg.transpose_weight),
            (TypoType.DOUBLE, cfg.double_weight),
            (TypoType.SKIP, cfg.skip_weight),
            (TypoType.MISSED_SPACE, cfg.missed_space_weight),
        )
        kinds, weights = zip(*weighted_kinds)
        (chosen,) = random.choices(kinds, weights=weights, k=1)
        return chosen

    def _create_typo(
        self,
        typo_type: TypoType,
        current_char: str,
        next_char: Optional[str],
    ) -> TypoResult:
        """
        Build the typo description for ``typo_type``.

        Args:
            typo_type: Kind of typo to build.
            current_char: Character being typed.
            next_char: Character that follows, or None if there is none.

        Returns:
            The typo produced by the builder registered for ``typo_type``; a
            SKIP typo when no builder is registered for it.
        """

        def build_adjacent() -> TypoResult:
            return self._create_adjacent_typo(current_char)

        def build_transpose() -> TypoResult:
            return self._create_transpose_typo(current_char, next_char)

        def build_missed_space() -> TypoResult:
            return self._create_missed_space_typo(current_char)

        def build_double() -> TypoResult:
            return TypoResult(typo_type=TypoType.DOUBLE, wrong_char=current_char)

        def build_skip() -> TypoResult:
            return TypoResult(typo_type=TypoType.SKIP)

        builders = {
            TypoType.ADJACENT: build_adjacent,
            TypoType.TRANSPOSE: build_transpose,
            TypoType.MISSED_SPACE: build_missed_space,
            TypoType.DOUBLE: build_double,
            TypoType.SKIP: build_skip,
        }

        try:
            build = builders[typo_type]
        except KeyError:
            # Unregistered type: behave like SKIP.
            build = build_skip
        return build()

    def _create_transpose_typo(self, current_char: str, next_char: Optional[str]) -> TypoResult:
        """Create transpose typo, falling back to adjacent if not possible."""
        if next_char and next_char.isalpha():
            return TypoResult(typo_type=TypoType.TRANSPOSE, wrong_char=next_char)
        return self._create_adjacent_typo(current_char)

    def _create_missed_space_typo(self, current_char: str) -> TypoResult:
        """Create missed space typo, falling back to adjacent if not a space."""
        if current_char == ' ':
            return TypoResult(typo_type=TypoType.MISSED_SPACE)
        return self._create_adjacent_typo(current_char)

    @staticmethod
    def _create_adjacent_typo(original_char: str) -> TypoResult:
        """
        Build a typo that replaces ``original_char`` with a neighbouring key.

        The neighbour is looked up by the lowercased character in
        ``QWERTY_NEIGHBORS`` and upper-cased again when the original was upper
        case. Characters without an entry yield a DOUBLE typo instead.

        Args:
            original_char: Character the user intended to type.
        """
        lookup_key = original_char.lower()

        if lookup_key in QWERTY_NEIGHBORS:
            neighbour = random.choice(QWERTY_NEIGHBORS[lookup_key])
            wrong_char = neighbour.upper() if original_char.isupper() else neighbour
            return TypoResult(typo_type=TypoType.ADJACENT, wrong_char=wrong_char)

        return TypoResult(typo_type=TypoType.DOUBLE, wrong_char=original_char)

    @staticmethod
    def _split_modifiers_and_keys(keys: list[Key]) -> tuple[list[Key], list[Key]]:
        """
        Partition ``keys`` into modifier keys and all other keys.

        Control, Shift, Alt and Meta count as modifiers. Relative order within
        each group is preserved.

        Args:
            keys: Keys to partition.

        Returns:
            ``(modifiers, non_modifiers)``.
        """
        modifier_set = {Key.CONTROL, Key.SHIFT, Key.ALT, Key.META}
        held: list[Key] = []
        pressed: list[Key] = []
        for key in keys:
            bucket = held if key in modifier_set else pressed
            bucket.append(key)
        return held, pressed

    @staticmethod
    def _calculate_modifier_value(modifiers: list[Key]) -> Optional[KeyModifier]:
        """
        Combine modifier keys into a single modifier bitmask.

        Each modifier contributes one bit (Alt=1, Control=2, Meta=4, Shift=8).
        The bits are OR-ed rather than summed so that a modifier listed more
        than once still sets its bit exactly once; summing would carry into a
        different modifier's bit (for example Alt + Alt would equal Control).

        Args:
            modifiers: Modifier keys to combine. Keys without a bit are ignored.

        Returns:
            The combined mask cast to ``KeyModifier``, or None when the list is
            empty or none of the listed keys maps to a bit.
        """
        if not modifiers:
            return None

        modifier_bits = {
            Key.ALT: 1,
            Key.CONTROL: 2,
            Key.META: 4,
            Key.SHIFT: 8,
        }

        value = 0
        for mod in modifiers:
            value |= modifier_bits.get(mod, 0)
        return cast(KeyModifier, value) if value > 0 else None


# Alias: ``KeyboardAPI`` is bound to the same class object as ``Keyboard``.
# NOTE(review): presumably kept so code importing the ``KeyboardAPI`` name keeps working — confirm.
KeyboardAPI = Keyboard


================================================
FILE: pydoll/interactions/mouse.py
================================================
from __future__ import annotations

import asyncio
import logging
import math
import random
from dataclasses import dataclass
from typing import TYPE_CHECKING, Optional

from pydoll.commands import InputCommands, RuntimeCommands
from pydoll.interactions.utils import (
    bezier_2d,
    fitts_duration,
    minimum_jerk,
    random_control_points,
)
from pydoll.protocol.input.types import MouseButton, MouseEventType

if TYPE_CHECKING:
    from pydoll.browser.tab import Tab

# Module-level logger, named after this module via ``__name__``.
logger = logging.getLogger(__name__)


@dataclass(frozen=True)
class MouseTimingConfig:
    """
    Immutable tuning parameters for humanized mouse movement.

    Pause, hold, interval and duration values are passed to ``asyncio.sleep``
    or compared against event-loop time by ``Mouse``, so they are in seconds.
    """

    # Passed as the third and fourth arguments to ``fitts_duration`` when
    # computing how long a move should take.
    # NOTE(review): presumably the intercept and slope of Fitts's Law — confirm.
    fitts_a: float = 0.070
    fitts_b: float = 0.150

    # Base sleep between two dispatched move events, and the +/- range of the
    # uniform jitter added to it (the resulting sleep is floored at 0.001).
    frame_interval: float = 0.012
    frame_interval_variance: float = 0.004

    # Forwarded to ``random_control_points`` when generating Bezier control points.
    curvature_min: float = 0.10
    curvature_max: float = 0.30
    curvature_asymmetry: float = 0.6

    # Also forwarded to ``random_control_points``.
    short_distance_threshold: float = 50.0

    # Standard deviation of the Gaussian noise added to x and y on every frame,
    # before it is scaled by a velocity-dependent factor between 0.2 and 1.0.
    tremor_amplitude: float = 1.0

    # Overshoot is only considered when the move distance exceeds
    # ``overshoot_speed_threshold`` (compared against distance, despite the name)
    # and then happens with ``overshoot_probability``. The overshoot point lies
    # past the target by a fraction of the start-to-target displacement drawn
    # uniformly from [overshoot_distance_min, overshoot_distance_max].
    overshoot_probability: float = 0.70
    overshoot_distance_min: float = 0.03
    overshoot_distance_max: float = 0.12
    overshoot_speed_threshold: float = 200.0

    # Humanized click: pause after arriving and before pressing, time the
    # button is held, and gap between successive clicks of a multi-click.
    pre_click_pause_min: float = 0.05
    pre_click_pause_max: float = 0.20
    click_hold_min: float = 0.05
    click_hold_max: float = 0.15
    double_click_interval_min: float = 0.05
    double_click_interval_max: float = 0.10
    # Humanized drag: pause after pressing and pause before releasing.
    drag_start_pause_min: float = 0.08
    drag_start_pause_max: float = 0.20
    drag_end_pause_min: float = 0.05
    drag_end_pause_max: float = 0.15

    # Per-frame chance of an extra pause during movement and its length range.
    # The pause is added to the movement's start time, so it does not consume
    # any of the movement's duration.
    micro_pause_probability: float = 0.03
    micro_pause_min: float = 0.015
    micro_pause_max: float = 0.04

    # Clamp applied to the duration returned by ``fitts_duration``.
    min_duration: float = 0.08
    max_duration: float = 2.5


class Mouse:
    """
    Mouse controller for a browser tab, with optional humanized simulation.

    Supports moving, clicking, double-clicking, pressing/releasing a button
    and dragging. Every positional operation either dispatches the raw events
    directly or, with ``humanize=True``, imitates a human hand using Bezier
    paths, Fitts's Law durations, a minimum-jerk velocity profile,
    velocity-scaled tremor and occasional overshoot followed by correction.
    """

    _DEBUG_INIT_JS = """
    (() => {
        if (document.getElementById('__pydoll_mouse_debug')) return;
        const canvas = document.createElement('canvas');
        canvas.id = '__pydoll_mouse_debug';
        canvas.style.cssText = 'position:fixed;top:0;left:0;width:100vw;height:100vh;'
            + 'pointer-events:none;z-index:2147483647;';
        canvas.width = window.innerWidth;
        canvas.height = window.innerHeight;
        document.body.appendChild(canvas);
        window.__pydoll_debug_ctx = canvas.getContext('2d');
    })();
    """

    _DEBUG_DOT_JS = """
    (() => {{
        const ctx = window.__pydoll_debug_ctx;
        if (!ctx) return;
        ctx.beginPath();
        ctx.arc({x}, {y}, {radius}, 0, 2 * Math.PI);
        ctx.fillStyle = '{color}';
        ctx.fill();
    }})();
    """

    def __init__(
        self,
        tab: Tab,
        timing: Optional[MouseTimingConfig] = None,
        debug: bool = False,
    ):
        """
        Create a mouse controller bound to ``tab``.

        Args:
            tab: Tab whose ``_execute_command`` receives the mouse commands.
            timing: Timing configuration for humanized movement; a default
                ``MouseTimingConfig`` is created when omitted.
            debug: When True, draw colored dots on the page for moves and presses.
        """
        self._tab = tab
        self._timing = timing if timing else MouseTimingConfig()
        # Last position sent through ``_dispatch_move``; starts at the origin.
        self._position: tuple[float, float] = (0.0, 0.0)
        self._debug = debug
        self._debug_initialized = False

    @property
    def timing(self) -> MouseTimingConfig:
        """Timing configuration currently used for humanized movement."""
        return self._timing

    @timing.setter
    def timing(self, config: MouseTimingConfig) -> None:
        """
        Swap in a new timing configuration.

        Args:
            config: MouseTimingConfig applied to subsequent operations.
        """
        self._timing = config

    @property
    def debug(self) -> bool:
        """True when debug dots are drawn on the page."""
        return self._debug

    @debug.setter
    def debug(self, value: bool) -> None:
        """Enable or disable debug dots; the overlay is re-initialized on next draw."""
        self._debug = value
        self._debug_initialized = False

    async def move(
        self,
        x: float,
        y: float,
        *,
        humanize: bool = False,
    ) -> None:
        """
        Move the cursor to ``(x, y)``.

        Args:
            x: Target X coordinate (CSS pixels).
            y: Target Y coordinate (CSS pixels).
            humanize: Follow a curved, naturally timed path instead of jumping.
        """
        if not humanize:
            await self._dispatch_move(x, y)
            return

        await self._move_humanized(x, y)

    async def click(
        self,
        x: float,
        y: float,
        *,
        button: MouseButton = MouseButton.LEFT,
        click_count: int = 1,
        humanize: bool = False,
    ) -> None:
        """
        Click at ``(x, y)``.

        Args:
            x: Target X coordinate (CSS pixels).
            y: Target Y coordinate (CSS pixels).
            button: Mouse button to click.
            click_count: Number of clicks (2 for double-click).
            humanize: Use human-like movement and click timing.
        """
        if humanize:
            await self._click_humanized(x, y, button, click_count)
            return

        await self._dispatch_move(x, y)
        for phase in (MouseEventType.MOUSE_PRESSED, MouseEventType.MOUSE_RELEASED):
            await self._dispatch_button(phase, button, click_count)

    async def double_click(
        self,
        x: float,
        y: float,
        *,
        button: MouseButton = MouseButton.LEFT,
        humanize: bool = False,
    ) -> None:
        """
        Double-click at ``(x, y)``; shorthand for ``click`` with ``click_count=2``.

        Args:
            x: Target X coordinate (CSS pixels).
            y: Target Y coordinate (CSS pixels).
            button: Mouse button to click.
            humanize: Use human-like movement and click timing.
        """
        await self.click(x, y, button=button, click_count=2, humanize=humanize)

    async def down(self, button: MouseButton = MouseButton.LEFT) -> None:
        """
        Press ``button`` at the current position.

        Args:
            button: Mouse button to press.
        """
        await self._dispatch_button(MouseEventType.MOUSE_PRESSED, button)

    async def up(self, button: MouseButton = MouseButton.LEFT) -> None:
        """
        Release ``button`` at the current position.

        Args:
            button: Mouse button to release.
        """
        await self._dispatch_button(MouseEventType.MOUSE_RELEASED, button)

    async def drag(
        self,
        start_x: float,
        start_y: float,
        end_x: float,
        end_y: float,
        *,
        humanize: bool = False,
    ) -> None:
        """
        Drag with the left button from the start point to the end point.

        Args:
            start_x: Start X coordinate.
            start_y: Start Y coordinate.
            end_x: End X coordinate.
            end_y: End Y coordinate.
            humanize: Use human-like movement and pauses.
        """
        if humanize:
            await self._drag_humanized(start_x, start_y, end_x, end_y)
            return

        left = MouseButton.LEFT
        await self._dispatch_move(start_x, start_y)
        await self._dispatch_button(MouseEventType.MOUSE_PRESSED, left)
        await self._dispatch_move(end_x, end_y)
        await self._dispatch_button(MouseEventType.MOUSE_RELEASED, left)

    async def _move_humanized(self, target_x: float, target_y: float) -> None:
        """Move along a curved path with tremor and optional overshoot, ending exactly on target."""
        origin = self._position
        destination = (target_x, target_y)
        travel = math.hypot(target_x - origin[0], target_y - origin[1])

        # Sub-pixel moves are not worth animating.
        if travel < 1.0:
            await self._dispatch_move(target_x, target_y)
            return

        cfg = self._timing
        raw_duration = fitts_duration(travel, 20.0, cfg.fitts_a, cfg.fitts_b)
        duration = max(cfg.min_duration, min(raw_duration, cfg.max_duration))

        # The random draw only happens for moves longer than the threshold.
        overshoots = (
            travel > cfg.overshoot_speed_threshold and random.random() < cfg.overshoot_probability
        )

        if overshoots:
            await self._move_with_overshoot(origin, destination, duration)
        else:
            cp1, cp2 = self._get_control_points(origin, destination)
            await self._perform_movement_loop(origin, destination, duration, cp1, cp2)

        # The animated path carries tremor noise; finish exactly on the target.
        await self._dispatch_move(target_x, target_y)

    async def _move_with_overshoot(
        self,
        start: tuple[float, float],
        target: tuple[float, float],
        duration: float,
    ) -> None:
        """Travel past the target along the start-to-target direction, then come back."""
        cfg = self._timing
        fraction = random.uniform(cfg.overshoot_distance_min, cfg.overshoot_distance_max)
        dx = target[0] - start[0]
        dy = target[1] - start[1]
        overshoot = (target[0] + dx * fraction, target[1] + dy * fraction)

        # 85% of the time budget goes to the main leg, 15% to the correction.
        legs = (
            (start, overshoot, duration * 0.85),
            (overshoot, target, duration * 0.15),
        )
        for leg_start, leg_end, leg_duration in legs:
            cp1, cp2 = self._get_control_points(leg_start, leg_end)
            await self._perform_movement_loop(leg_start, leg_end, leg_duration, cp1, cp2)

    async def _perform_movement_loop(
        self,
        start: tuple[float, float],
        end: tuple[float, float],
        duration: float,
        cp1: tuple[float, float],
        cp2: tuple[float, float],
    ) -> None:
        """Dispatch move events frame by frame along a Bezier path until ``duration`` elapses."""
        cfg = self._timing
        clock = asyncio.get_running_loop().time
        started_at = clock()
        last_sample = (start[0], start[1], started_at)

        while True:
            now = clock()
            elapsed = now - started_at

            if elapsed >= duration:
                break

            # Time progress is reshaped by minimum-jerk before sampling the curve.
            progress = minimum_jerk(elapsed / duration)
            x, y = bezier_2d(progress, start, cp1, cp2, end)

            sigma = self._compute_tremor_sigma(x, y, now, last_sample, cfg)
            x += random.gauss(0, sigma)
            y += random.gauss(0, sigma)

            await self._dispatch_move(x, y)
            last_sample = (x, y, now)

            jitter = random.uniform(-cfg.frame_interval_variance, cfg.frame_interval_variance)
            await asyncio.sleep(max(0.001, cfg.frame_interval + jitter))

            if random.random() < cfg.micro_pause_probability:
                pause = random.uniform(cfg.micro_pause_min, cfg.micro_pause_max)
                await asyncio.sleep(pause)
                # Shift the start so the pause does not eat into the movement time.
                started_at += pause

    @staticmethod
    def _compute_tremor_sigma(
        x: float,
        y: float,
        now: float,
        prev: tuple[float, float, float],
        config: MouseTimingConfig,
    ) -> float:
        """Return the tremor sigma: full amplitude when slow, down to 20% of it when fast."""
        prev_x, prev_y, prev_time = prev
        dt = now - prev_time
        damping = 1.0
        if dt > 0:
            speed = math.hypot(x - prev_x, y - prev_y) / dt
            damping = max(0.2, 1.0 - speed / 500.0)
        return config.tremor_amplitude * damping

    async def _click_humanized(
        self,
        x: float,
        y: float,
        button: MouseButton,
        click_count: int,
    ) -> None:
        """Move humanly to the point, pause, then press/hold/release ``click_count`` times."""
        cfg = self._timing

        await self._move_humanized(x, y)

        settle = random.uniform(cfg.pre_click_pause_min, cfg.pre_click_pause_max)
        await asyncio.sleep(settle)

        for ordinal in range(1, click_count + 1):
            await self._dispatch_button(MouseEventType.MOUSE_PRESSED, button, ordinal)

            hold_time = random.uniform(cfg.click_hold_min, cfg.click_hold_max)
            await asyncio.sleep(hold_time)

            await self._dispatch_button(MouseEventType.MOUSE_RELEASED, button, ordinal)

            # Gap between clicks, but not after the last one.
            if ordinal < click_count:
                gap = random.uniform(
                    cfg.double_click_interval_min,
                    cfg.double_click_interval_max,
                )
                await asyncio.sleep(gap)

    async def _drag_humanized(
        self,
        start_x: float,
        start_y: float,
        end_x: float,
        end_y: float,
    ) -> None:
        """Drag with human-like approach, grab pause, curved travel and release pause."""
        cfg = self._timing
        drop_point = (end_x, end_y)

        await self._move_humanized(start_x, start_y)
        await self._dispatch_button(MouseEventType.MOUSE_PRESSED, MouseButton.LEFT)

        grab_pause = random.uniform(cfg.drag_start_pause_min, cfg.drag_start_pause_max)
        await asyncio.sleep(grab_pause)

        origin = self._position
        travel = math.hypot(end_x - origin[0], end_y - origin[1])
        raw_duration = fitts_duration(travel, 20.0, cfg.fitts_a, cfg.fitts_b)
        duration = max(cfg.min_duration, min(raw_duration, cfg.max_duration))

        cp1, cp2 = self._get_control_points(origin, drop_point)
        await self._perform_movement_loop(origin, drop_point, duration, cp1, cp2)
        await self._dispatch_move(end_x, end_y)

        release_pause = random.uniform(cfg.drag_end_pause_min, cfg.drag_end_pause_max)
        await asyncio.sleep(release_pause)

        await self._dispatch_button(MouseEventType.MOUSE_RELEASED, MouseButton.LEFT)

    def _get_control_points(
        self,
        start: tuple[float, float],
        end: tuple[float, float],
    ) -> tuple[tuple[float, float], tuple[float, float]]:
        """Ask ``random_control_points`` for two control points using the current config."""
        cfg = self._timing
        return random_control_points(
            start,
            end,
            cfg.curvature_min,
            cfg.curvature_max,
            cfg.curvature_asymmetry,
            cfg.short_distance_threshold,
        )

    async def _dispatch_move(self, x: float, y: float) -> None:
        """Send a mouseMoved event (rounded coordinates) and remember the unrounded position."""
        pixel_x = int(round(x))
        pixel_y = int(round(y))
        command = InputCommands.dispatch_mouse_event(
            type=MouseEventType.MOUSE_MOVED,
            x=pixel_x,
            y=pixel_y,
        )
        await self._tab._execute_command(command)
        self._position = (x, y)

        if not self._debug:
            return
        await self._debug_draw_dot(x, y, radius=2, color='rgba(0,150,255,0.6)')

    async def _dispatch_button(
        self,
        event_type: MouseEventType,
        button: MouseButton,
        click_count: int = 1,
    ) -> None:
        """Send a mousePressed or mouseReleased event at the remembered position."""
        pos_x, pos_y = self._position
        command = InputCommands.dispatch_mouse_event(
            type=event_type,
            x=int(round(pos_x)),
            y=int(round(pos_y)),
            button=button,
            click_count=click_count,
        )
        await self._tab._execute_command(command)

        # Only presses are marked on the debug overlay.
        if not (self._debug and event_type == MouseEventType.MOUSE_PRESSED):
            return
        marker_x, marker_y = self._position
        await self._debug_draw_dot(marker_x, marker_y, radius=6, color='rgba(255,50,50,0.9)')

    async def _debug_draw_dot(self, x: float, y: float, radius: int, color: str) -> None:
        """Draw a dot on the overlay canvas, creating the canvas on first use."""
        if not self._debug_initialized:
            init_command = RuntimeCommands.evaluate(self._DEBUG_INIT_JS)
            await self._tab._execute_command(init_command)
            self._debug_initialized = True

        dot_script = self._DEBUG_DOT_JS.format(
            x=int(round(x)), y=int(round(y)), radius=radius, color=color
        )
        await self._tab._execute_command(RuntimeCommands.evaluate(dot_script))


# Alias: ``MouseAPI`` is bound to the same class object as ``Mouse``.
# NOTE(review): presumably kept so code importing the ``MouseAPI`` name keeps working — confirm.
MouseAPI = Mouse


================================================
FILE: pydoll/interactions/scroll.py
================================================
from __future__ import annotations

import asyncio
import json
import random
from dataclasses import dataclass
from typing import TYPE_CHECKING, Optional

from pydoll.commands import InputCommands, RuntimeCommands
from pydoll.constants import Scripts, ScrollPosition
from pydoll.interactions.utils import CubicBezier
from pydoll.protocol.input.types import MouseEventType
from pydoll.protocol.runtime.methods import EvaluateResponse

if TYPE_CHECKING:
    from pydoll.browser.tab import Tab


@dataclass(frozen=True)
class ScrollTimingConfig:
    """
    Immutable tuning parameters for humanized scrolling.

    Duration, interval and pause values are passed to ``asyncio.sleep`` or
    compared against event-loop time by ``Scroll``, so they are in seconds.
    """

    # Range of the randomly drawn base duration of one scroll gesture. The
    # final duration is additionally scaled by distance and capped at 3.0.
    min_duration: float = 0.5
    max_duration: float = 1.5

    # Unpacked as the four constructor arguments of ``CubicBezier``, whose
    # ``solve`` maps time progress to eased scroll progress.
    bezier_points: tuple[float, float, float, float] = (0.645, 0.045, 0.355, 1.0)

    # Base sleep between two scroll events (jittered by +/- 0.002 per frame).
    frame_interval: float = 0.012

    # Each frame's delta gets a random integer in [-delta_jitter, delta_jitter] added.
    delta_jitter: int = 3

    # Per-frame chance of an extra pause and its length range. The pause is
    # added to the gesture's start time, so it does not consume its duration.
    micro_pause_probability: float = 0.05
    micro_pause_min: float = 0.02
    micro_pause_max: float = 0.05

    # Chance that a gesture aims past its target, and the range of the factor
    # the target distance is multiplied by when it does.
    overshoot_probability: float = 0.15
    overshoot_factor_min: float = 1.02
    overshoot_factor_max: float = 1.08


class Scroll:
    """
    API for controlling page scroll behavior.

    Provides methods for scrolling the page in different directions,
    to specific positions, or by relative distances. Supports humanized
    scrolling with realistic physics simulation.
    """

    def __init__(
        self,
        tab: Tab,
        timing: Optional[ScrollTimingConfig] = None,
    ):
        """
        Initialize the Scroll with a Tab instance.

        Args:
            tab: Tab instance to execute scroll commands on.
            timing: Optional custom timing configuration for humanized scroll.
        """
        self._tab = tab
        self._timing = timing or ScrollTimingConfig()

    async def by(
        self,
        position: ScrollPosition,
        distance: int | float,
        smooth: bool = True,
        humanize: bool = False,
    ):
        """
        Scroll the page by a relative distance in the specified direction.

        Args:
            position: Direction to scroll (UP, DOWN, LEFT, RIGHT).
            distance: Number of pixels to scroll.
            smooth: Use smooth scrolling animation if True, instant if False.
            humanize: Simulate human-like scrolling with momentum and inertia.
        """
        if humanize:
            await self._scroll_humanized(position, distance)
            return

        axis, scroll_distance = self._get_axis_and_distance(position, distance)
        behavior = self._get_behavior(smooth)

        script = Scripts.SCROLL_BY.format(
            axis=axis,
            distance=scroll_distance,
            behavior=behavior,
        )

        await self._execute_script_await_promise(script)

    async def to_top(self, smooth: bool = True, humanize: bool = False):
        """
        Scroll to the top of the page.

        Args:
            smooth: Use the smooth scrolling animation if True, jump instantly if False.
                Ignored when ``humanize`` is True.
            humanize: Reach the top through a series of human-like upward flicks.
        """
        if not humanize:
            script = Scripts.SCROLL_TO_TOP.format(behavior=self._get_behavior(smooth))
            await self._execute_script_await_promise(script)
            return

        await self._scroll_to_end_humanized(ScrollPosition.UP)

    async def to_bottom(self, smooth: bool = True, humanize: bool = False):
        """
        Scroll to the bottom of the page.

        Args:
            smooth: Use the smooth scrolling animation if True, jump instantly if False.
                Ignored when ``humanize`` is True.
            humanize: Reach the bottom through a series of human-like downward flicks.
        """
        if not humanize:
            script = Scripts.SCROLL_TO_BOTTOM.format(behavior=self._get_behavior(smooth))
            await self._execute_script_await_promise(script)
            return

        await self._scroll_to_end_humanized(ScrollPosition.DOWN)

    async def _scroll_to_end_humanized(self, position: ScrollPosition):
        """
        Reach the top or bottom of the page through repeated human-like flicks.

        A person does not cover thousands of pixels in one motion, so the
        distance is split into flicks of randomly capped length with short
        pauses in between. The loop ends once the remaining distance is at most
        30 pixels, or after 10 consecutive rounds in which the remaining
        distance changed by less than 5 pixels.

        Args:
            position: ``ScrollPosition.DOWN`` to head for the bottom; any other
                value measures the current vertical offset, i.e. heads for the top.
        """
        done_threshold = 30
        progress_threshold = 5
        shortest_flick = 100
        stall_limit = 10

        flick_cap = random.uniform(600, 1200)
        previous_remaining = float('inf')
        stalled_rounds = 0
        heading_down = position == ScrollPosition.DOWN

        while True:
            if heading_down:
                remaining = await self._get_remaining_scroll_to_bottom()
            else:
                remaining = await self._get_current_scroll_y()

            if remaining <= done_threshold:
                break

            # Stall guard: give up if the page stops responding to scrolling.
            if abs(remaining - previous_remaining) >= progress_threshold:
                stalled_rounds = 0
            else:
                stalled_rounds += 1
                if stalled_rounds >= stall_limit:
                    break

            previous_remaining = remaining

            flick = min(remaining, flick_cap)
            if flick < shortest_flick and remaining > shortest_flick:
                flick = shortest_flick

            await self._scroll_humanized(position, flick)

            await asyncio.sleep(random.uniform(0.05, 0.15))

            # Fresh cap for the next flick so gestures differ in length.
            flick_cap = random.uniform(600, 1200)

    async def _scroll_humanized(self, position: ScrollPosition, target_distance: float):
        """
        Perform one human-like scroll gesture of roughly ``target_distance`` pixels.

        The gesture may deliberately aim past the target. When it did, and the
        scrolled distance really exceeds the target, a short pause is followed
        by a correction scroll in the opposite direction.

        Args:
            position: Direction to scroll (UP, DOWN, LEFT, RIGHT).
            target_distance: Intended scroll distance in pixels.
        """
        is_vertical = position in {ScrollPosition.UP, ScrollPosition.DOWN}
        direction = -1 if position in {ScrollPosition.UP, ScrollPosition.LEFT} else 1

        planned_distance = self._calculate_effective_distance(target_distance)
        duration = self._calculate_duration(planned_distance)

        travelled = await self._perform_scroll_loop(
            planned_distance, duration, is_vertical, direction
        )

        overshot = planned_distance > target_distance and travelled > target_distance
        if not overshot:
            return

        excess = travelled - target_distance
        await asyncio.sleep(random.uniform(0.1, 0.2))
        await self._scroll_correction(
            is_vertical=is_vertical,
            direction=-direction,
            distance=excess,
        )

    async def _perform_scroll_loop(
        self,
        effective_distance: float,
        duration: float,
        is_vertical: bool,
        direction: int,
    ) -> float:
        """
        Dispatch scroll events frame by frame following a Bezier easing curve.

        On each frame the eased target offset is compared with what has been
        scrolled so far, jitter is added, and the whole-pixel part of the
        difference is dispatched. Only the dispatched whole pixels are counted,
        so the fractional remainder carries over to the next frame instead of
        being lost, and the returned value matches what was actually sent.

        Args:
            effective_distance: Distance to cover, including any planned overshoot.
            duration: Time budget for the gesture in seconds (micro-pauses excluded).
            is_vertical: True to scroll along Y, False to scroll along X.
            direction: Sign applied to each delta.

        Returns:
            Total magnitude of the deltas that were dispatched.
        """
        timing = self._timing
        bezier = CubicBezier(*timing.bezier_points)
        loop = asyncio.get_running_loop()

        start_time = loop.time()
        current_time = 0.0
        scrolled_so_far = 0.0

        while current_time < duration:
            current_time = loop.time() - start_time

            if current_time >= duration:
                break

            eased_progress = bezier.solve(current_time / duration)
            delta = effective_distance * eased_progress - scrolled_so_far
            delta += random.randint(-timing.delta_jitter, timing.delta_jitter)

            # Sub-pixel (or negative, after jitter) deltas are held back until
            # enough distance has accumulated for a whole pixel.
            if delta >= 1:
                signed_step = int(delta * direction)
                await self._dispatch_scroll_event(
                    delta_x=0 if is_vertical else signed_step,
                    delta_y=signed_step if is_vertical else 0,
                )
                # Count what was actually dispatched, not the untruncated float.
                scrolled_so_far += abs(signed_step)

            frame_delay = timing.frame_interval + random.uniform(-0.002, 0.002)
            await asyncio.sleep(frame_delay)

            if random.random() < timing.micro_pause_probability:
                pause_duration = random.uniform(timing.micro_pause_min, timing.micro_pause_max)
                await asyncio.sleep(pause_duration)
                # Shift the start so the pause does not eat into the gesture time.
                start_time += pause_duration

        return scrolled_so_far

    def _calculate_effective_distance(self, target_distance: float) -> float:
        """Calculate effective distance including overshoot."""
        timing = self._timing
        should_overshoot = random.random() < timing.overshoot_probability
        overshoot_factor = (
            random.uniform(timing.overshoot_factor_min, timing.overshoot_factor_max)
            if should_overshoot
            else 1.0
        )
        return target_distance * overshoot_factor

    def _calculate_duration(self, distance: float) -> float:
        """Calculate scroll duration based on distance."""
        timing = self._timing
        base_duration = random.uniform(timing.min_duration, timing.max_duration)
        duration = base_duration * (1 + 0.2 * (distance / 1000))
        return min(duration, 3.0)

    async def _scroll_correction(self, is_vertical: bool, direction: int, distance: float):
        """Perform small correction scroll after overshoot."""
        timing = self._timing
        scrolled = 0.0

        min_correction_velocity = (distance * (0.15)) / timing.frame_interval
        correction_velocity = random.uniform(
            max(200, min_correction_velocity), max(400, min_correction_velocity * 1.5)
        )

        while scrolled < distance:
            frame_delta = correction_velocity * timing.frame_interval
            frame_delta = min(frame_delta, distance - scrolled)

            await self._dispatch_scroll_event(
                delta_x=0 if is_vertical else int(frame_delta * direction),
                delta_y=int(frame_delta * direction) if is_vertical else 0,
            )

            scrolled += frame_delta
            correction_velocity *= 0.85

            await asyncio.sleep(timing.frame_interval)

    async def _dispatch_scroll_event(self, delta_x: int, delta_y: int):
        """Send one mouse wheel event with the given deltas, positioned at the viewport center."""
        center = await self._get_viewport_center()
        wheel_event = InputCommands.dispatch_mouse_event(
            type=MouseEventType.MOUSE_WHEEL,
            x=center[0],
            y=center[1],
            delta_x=delta_x,
            delta_y=delta_y,
        )
        await self._tab._execute_command(wheel_event)

    async def _get_viewport_center(self) -> tuple[int, int]:
        """Get the center coordinates of the viewport.

        Evaluates ``Scripts.GET_VIEWPORT_CENTER`` in the page and parses the
        returned value as a JSON array of two numbers.

        Returns:
            ``(x, y)`` as integers. Falls back to ``(400, 300)`` whenever the
            value is missing, is not valid JSON, is not a two-element list, or
            holds entries that cannot be converted to ``int``.
        """
        command = RuntimeCommands.evaluate(expression=Scripts.GET_VIEWPORT_CENTER)
        result: EvaluateResponse = await self._tab._execute_command(command)

        value_str = result.get('result', {}).get('result', {}).get('value', '[]')
        expected_dimensions = 2
        try:
            value = json.loads(value_str)
            if value and isinstance(value, list) and len(value) == expected_dimensions:
                return (int(value[0]), int(value[1]))
        except (json.JSONDecodeError, TypeError, ValueError, OverflowError):
            # TypeError: non-string payload or None entry; ValueError: non-numeric
            # string or NaN entry; OverflowError: infinite entry. All of them mean
            # the payload is unusable, so use the default center below.
            pass
        return (400, 300)

    async def _get_current_scroll_y(self) -> float:
        """Evaluate ``Scripts.GET_SCROLL_Y`` and return its value as a float (0 if absent)."""
        response: EvaluateResponse = await self._tab._execute_command(
            RuntimeCommands.evaluate(expression=Scripts.GET_SCROLL_Y)
        )
        remote_object = response.get('result', {}).get('result', {})
        return float(remote_object.get('value', 0))

    async def _get_remaining_scroll_to_bottom(self) -> float:
        """Evaluate ``Scripts.GET_REMAINING_SCROLL_TO_BOTTOM`` and return it as a float.

        Yields 0.0 when the response carries no value.
        """
        response: EvaluateResponse = await self._tab._execute_command(
            RuntimeCommands.evaluate(expression=Scripts.GET_REMAINING_SCROLL_TO_BOTTOM)
        )
        remote_object = response.get('result', {}).get('result', {})
        return float(remote_object.get('value', 0))

    @staticmethod
    def _get_axis_and_distance(
        position: ScrollPosition, distance: int | float
    ) -> tuple[str, int | float]:
        """
        Translate a scroll direction into an axis name and a signed distance.

        Args:
            position: Direction to scroll.
            distance: Absolute distance to scroll.

        Returns:
            Tuple of (axis, signed_distance). The axis is 'top' for UP/DOWN and
            'left' for any other position; the distance is negated for UP and LEFT.
        """
        is_vertical = position in {ScrollPosition.UP, ScrollPosition.DOWN}
        if is_vertical:
            negate = position == ScrollPosition.UP
        else:
            negate = position == ScrollPosition.LEFT

        signed_distance = -distance if negate else distance
        return ('top' if is_vertical else 'left'), signed_distance

    @staticmethod
    def _get_behavior(smooth: bool) -> str:
        """
        Convert smooth boolean to CSS scroll behavior value.

        Args:
            smooth: Whether to use smooth scrolling.

        Returns:
            'smooth' if smooth is True, 'auto' otherwise.
        """
        return 'smooth' if smooth else 'auto'

    async def _execute_script_await_promise(self, script: str):
        """
        Evaluate a script with ``await_promise=True`` and return the command response.

        Args:
            script: JavaScript code that returns a Promise.
        """
        return await self._tab._execute_command(
            RuntimeCommands.evaluate(expression=script, await_promise=True)
        )


# Backward compatibility alias: ``ScrollAPI`` is bound to the very same class object as ``Scroll``.
ScrollAPI = Scroll


================================================
FILE: pydoll/interactions/utils.py
================================================
from __future__ import annotations

import math
import random


class CubicBezier:
    """Cubic Bezier curve solver for smooth animation timing.

    Based on UnitBezier from WebKit/Chromium. Maps a time progress value
    to an eased progress value using a cubic Bezier curve.

    Both coordinates are stored as polynomials ``a*t^3 + b*t^2 + c*t`` whose
    coefficients are derived from the two control points, so the curve starts
    at (0, 0) for ``t = 0`` and ends at (1, 1) for ``t = 1``.
    """

    def __init__(self, point1_x: float, point1_y: float, point2_x: float, point2_y: float):
        """Precompute the polynomial coefficients for both axes.

        Args:
            point1_x: X coordinate of the first control point.
            point1_y: Y coordinate of the first control point.
            point2_x: X coordinate of the second control point.
            point2_y: Y coordinate of the second control point.
        """
        self.coefficient_c_x = 3.0 * point1_x
        self.coefficient_b_x = 3.0 * (point2_x - point1_x) - self.coefficient_c_x
        self.coefficient_a_x = 1.0 - self.coefficient_c_x - self.coefficient_b_x

        self.coefficient_c_y = 3.0 * point1_y
        self.coefficient_b_y = 3.0 * (point2_y - point1_y) - self.coefficient_c_y
        self.coefficient_a_y = 1.0 - self.coefficient_c_y - self.coefficient_b_y

    def sample_curve_x(self, time_progress: float) -> float:
        """Evaluate the x polynomial at parameter ``time_progress`` (Horner form)."""
        return (
            (self.coefficient_a_x * time_progress + self.coefficient_b_x) * time_progress
            + self.coefficient_c_x
        ) * time_progress

    def sample_curve_y(self, time_progress: float) -> float:
        """Evaluate the y polynomial at parameter ``time_progress`` (Horner form)."""
        return (
            (self.coefficient_a_y * time_progress + self.coefficient_b_y) * time_progress
            + self.coefficient_c_y
        ) * time_progress

    def sample_curve_derivative_x(self, time_progress: float) -> float:
        """Evaluate dx/dt at parameter ``time_progress``."""
        return (
            3.0 * self.coefficient_a_x * time_progress + 2.0 * self.coefficient_b_x
        ) * time_progress + self.coefficient_c_x

    def solve_curve_x(self, target_x: float, epsilon: float = 1e-6) -> float:
        """Given an x value, find the corresponding t value.

        Tries up to eight Newton-Raphson steps first and falls back to bisection
        on [0, 1] when they do not converge or the derivative vanishes.

        Args:
            target_x: The x value to invert.
            epsilon: Accepted absolute error in x. Also the threshold below which
                the derivative is treated as zero.

        Returns:
            The parameter t whose x is within ``epsilon`` of ``target_x``, or the
            best bisection estimate once the search interval cannot shrink further.
            Inputs below 0 or above 1 that Newton cannot solve are clamped to 0 or 1.
        """
        estimated_t = target_x

        for _ in range(8):
            current_x = self.sample_curve_x(estimated_t) - target_x
            if abs(current_x) < epsilon:
                return estimated_t
            derivative = self.sample_curve_derivative_x(estimated_t)
            # The explicit zero test keeps the division safe even when epsilon is 0.
            if abs(derivative) < epsilon or derivative == 0.0:
                break
            estimated_t -= current_x / derivative

        lower_bound = 0.0
        upper_bound = 1.0
        estimated_t = target_x

        if estimated_t < lower_bound:
            return lower_bound
        if estimated_t > upper_bound:
            return upper_bound

        while lower_bound < upper_bound:
            current_x = self.sample_curve_x(estimated_t)
            if abs(current_x - target_x) < epsilon:
                return estimated_t
            if target_x > current_x:
                lower_bound = estimated_t
            else:
                upper_bound = estimated_t
            midpoint = (upper_bound - lower_bound) * 0.5 + lower_bound
            if midpoint == estimated_t:
                # The interval has collapsed to float resolution; a tolerance that
                # small can never be met, so stop instead of looping forever.
                break
            estimated_t = midpoint

        return estimated_t

    def solve(self, input_x: float) -> float:
        """Get y value for a given x (time progress)."""
        return self.sample_curve_y(self.solve_curve_x(input_x))


def minimum_jerk(t: float) -> float:
    """Evaluate the minimum-jerk position polynomial at normalized time t.

    Computes 10t^3 - 15t^4 + 6t^5, which is 0 at t=0 and 1 at t=1 and gives
    a bell-shaped velocity profile: slow start, peak in the middle, slow end.
    """
    squared = t * t
    cubed = squared * t
    cubic_term = 10.0 * cubed
    quartic_term = 15.0 * cubed * t
    quintic_term = 6.0 * cubed * squared
    return cubic_term - quartic_term + quintic_term


def bezier_2d(
    t: float,
    p0: tuple[float, float],
    p1: tuple[float, float],
    p2: tuple[float, float],
    p3: tuple[float, float],
) -> tuple[float, float]:
    """Return the point of a 2D cubic Bezier curve at parameter t.

    B(t) = (1-t)^3*P0 + 3(1-t)^2*t*P1 + 3(1-t)*t^2*P2 + t^3*P3
    """
    inv = 1.0 - t
    inv_sq = inv * inv
    t_sq = t * t

    # Bernstein weights of the four control points.
    w0 = inv_sq * inv
    w1 = 3.0 * inv_sq * t
    w2 = 3.0 * inv * t_sq
    w3 = t_sq * t

    point_x = w0 * p0[0] + w1 * p1[0] + w2 * p2[0] + w3 * p3[0]
    point_y = w0 * p0[1] + w1 * p1[1] + w2 * p2[1] + w3 * p3[1]
    return (point_x, point_y)


def fitts_duration(
    distance: float,
    target_width: float,
    a: float,
    b: float,
) -> float:
    """Movement time from Fitts's Law: MT = a + b * log2(D/W + 1).

    A non-positive distance short-circuits to the intercept ``a``.
    """
    no_movement = distance <= 0
    if no_movement:
        return a
    ratio = distance / target_width
    index_of_difficulty = math.log2(ratio + 1.0)
    return a + b * index_of_difficulty


def random_control_points(
    start: tuple[float, float],
    end: tuple[float, float],
    curvature_min: float,
    curvature_max: float,
    curvature_asymmetry: float,
    short_distance_threshold: float,
) -> tuple[tuple[float, float], tuple[float, float]]:
    """Pick two random inner control points for a curved path from start to end.

    Each control point sits at a random fraction along the start-end segment and is
    pushed sideways, perpendicular to that segment, by a random share of its length.
    Both points are pushed to the same side; the second one by a damped amount.
    Paths shorter than ``short_distance_threshold`` get proportionally less curvature,
    and paths shorter than 1.0 return ``(start, end)`` unchanged.
    """
    start_x, start_y = start[0], start[1]
    delta_x = end[0] - start_x
    delta_y = end[1] - start_y
    length = math.hypot(delta_x, delta_y)

    if length < 1.0:
        return (start, end)

    # Unit vector perpendicular to the start-end direction.
    normal_x = -delta_y / length
    normal_y = delta_x / length

    curvature_scale = min(1.0, length / short_distance_threshold)
    first_offset = random.uniform(curvature_min, curvature_max) * length * curvature_scale
    second_offset = random.uniform(curvature_min, curvature_max) * length * curvature_scale

    side = random.choice([-1.0, 1.0])
    first_fraction = random.uniform(0.2, curvature_asymmetry)
    second_fraction = random.uniform(curvature_asymmetry, 0.8)

    first_point = (
        start_x + delta_x * first_fraction + normal_x * first_offset * side,
        start_y + delta_y * first_fraction + normal_y * first_offset * side,
    )

    damping = random.uniform(0.3, 1.0)
    second_point = (
        start_x + delta_x * second_fraction + normal_x * second_offset * side * damping,
        start_y + delta_y * second_fraction + normal_y * second_offset * side * damping,
    )

    return (first_point, second_point)


================================================
FILE: pydoll/protocol/__init__.py
================================================
"""Chrome DevTools Protocol implementation."""


================================================
FILE: pydoll/protocol/base.py
================================================
from typing import Generic, TypeVar

# TODO: typeddict comes from typing_extensions
from typing_extensions import NotRequired, TypedDict

# Type variables that parameterize the generic Command, Response and CDPEvent structures below.
T_CommandParams = TypeVar('T_CommandParams')
T_CommandResponse = TypeVar('T_CommandResponse')
T_EventParams = TypeVar('T_EventParams')


class EmptyParams(TypedDict):
    """Empty parameters for commands.

    Declares no keys; it is the params type of commands that take no arguments.
    """

    pass


class EmptyResponse(TypedDict):
    """Empty response for commands.

    Declares no keys; it is the result type of commands that return no payload.
    """

    pass


class Command(TypedDict, Generic[T_CommandParams, T_CommandResponse]):
    """Base structure for all commands.

    Generic over the params type and the response type; only the params type
    appears in a key, the response type is carried purely at the type level.

    Attributes:
        id: Optional integer identifier of the command
        method: The command method name
        params: Optional dictionary of parameters for the command
        sessionId: Optional target session identifier (flattened sessions)
    """

    id: NotRequired[int]
    method: str
    params: NotRequired[T_CommandParams]
    sessionId: NotRequired[str]


class Response(TypedDict, Generic[T_CommandResponse]):
    """Base structure for all responses.

    Generic over the type of the ``result`` payload. ``id`` and ``result`` are
    required keys; ``sessionId`` may be omitted.

    Attributes:
        id: The ID that matches the command ID
        result: The result data for the command
        sessionId: Optional target session identifier (flattened sessions)
    """

    id: int
    result: T_CommandResponse
    sessionId: NotRequired[str]


class CDPEvent(TypedDict, Generic[T_EventParams]):
    """Base structure for all events.

    Generic over the type of the ``params`` payload.

    Attributes:
        method: The event method name (required)
        params: Optional event parameters
        sessionId: Optional target session identifier
    """

    method: str
    params: NotRequired[T_EventParams]
    sessionId: NotRequired[str]


================================================
FILE: pydoll/protocol/browser/__init__.py
================================================
"""Browser domain implementation."""


================================================
FILE: pydoll/protocol/browser/events.py
================================================
from enum import Enum

from typing_extensions import NotRequired, TypedDict

from pydoll.protocol.base import CDPEvent
from pydoll.protocol.browser.types import DownloadProgressState


class BrowserEvent(str, Enum):
    """
    Events from the Browser domain of the Chrome DevTools Protocol.

    This enumeration contains the names of browser-related events that can be
    received from the Chrome DevTools Protocol. These events provide information
    about browser activities and state changes.

    Each member is also a ``str`` whose value is the protocol event name.
    """

    DOWNLOAD_PROGRESS = 'Browser.downloadProgress'
    """
    Fired when download makes progress. The last call has |done| == true.

    Args:
        guid (str): Global unique identifier of the download.
        totalBytes (float): Total expected bytes to download.
        receivedBytes (float): Total bytes received.
        state (str): Download status.
            Allowed values: 'inProgress', 'completed', 'canceled'
        filePath (str, optional): Path of the downloaded file; the key may be absent.
    """

    DOWNLOAD_WILL_BEGIN = 'Browser.downloadWillBegin'
    """
    Fired when page is about to start a download.

    Args:
        frameId (str): Id of the frame that caused the download to begin.
        guid (str): Global unique identifier of the download.
        url (str): URL of the resource being downloaded.
        suggestedFilename (str): Suggested file name of the resource
            (the actual name of the file saved on disk may differ).
    """


class DownloadProgressEventParams(TypedDict):
    """Parameters for the downloadProgress event.

    ``filePath`` is the only key that may be omitted. Both byte counters are
    typed as ``float``.
    """

    guid: str
    totalBytes: float
    receivedBytes: float
    state: DownloadProgressState
    filePath: NotRequired[str]


class DownloadWillBeginEventParams(TypedDict):
    """Parameters for the downloadWillBegin event; all four string keys are required."""

    frameId: str
    guid: str
    url: str
    suggestedFilename: str


# Event aliases: the generic CDPEvent envelope bound to each event's params type.
DownloadProgressEvent = CDPEvent[DownloadProgressEventParams]
DownloadWillBeginEvent = CDPEvent[DownloadWillBeginEventParams]


================================================
FILE: pydoll/protocol/browser/methods.py
================================================
from enum import Enum

from typing_extensions import NotRequired, TypedDict

from pydoll.protocol.base import Command, EmptyParams, EmptyResponse, Response
from pydoll.protocol.browser.types import (
    Bounds,
    BrowserCommandId,
    BrowserContextID,
    DownloadBehavior,
    Histogram,
    PermissionDescriptor,
    PermissionSetting,
    PermissionType,
    PrivacySandboxAPI,
    WindowID,
)


class BrowserMethod(str, Enum):
    """Browser domain method names.

    Each member's value is the ``Browser.<method>`` string of the corresponding
    command; members are also ``str`` instances because of the ``str`` mixin.
    Members are listed alphabetically.
    """

    ADD_PRIVACY_SANDBOX_COORDINATOR_KEY_CONFIG = 'Browser.addPrivacySandboxCoordinatorKeyConfig'
    ADD_PRIVACY_SANDBOX_ENROLLMENT_OVERRIDE = 'Browser.addPrivacySandboxEnrollmentOverride'
    CANCEL_DOWNLOAD = 'Browser.cancelDownload'
    CLOSE = 'Browser.close'
    CRASH = 'Browser.crash'
    CRASH_GPU_PROCESS = 'Browser.crashGpuProcess'
    EXECUTE_BROWSER_COMMAND = 'Browser.executeBrowserCommand'
    GET_BROWSER_COMMAND_LINE = 'Browser.getBrowserCommandLine'
    GET_HISTOGRAM = 'Browser.getHistogram'
    GET_HISTOGRAMS = 'Browser.getHistograms'
    GET_VERSION = 'Browser.getVersion'
    GET_WINDOW_BOUNDS = 'Browser.getWindowBounds'
    GET_WINDOW_FOR_TARGET = 'Browser.getWindowForTarget'
    GRANT_PERMISSIONS = 'Browser.grantPermissions'
    RESET_PERMISSIONS = 'Browser.resetPermissions'
    SET_CONTENTS_SIZE = 'Browser.setContentsSize'
    SET_DOCK_TILE = 'Browser.setDockTile'
    SET_DOWNLOAD_BEHAVIOR = 'Browser.setDownloadBehavior'
    SET_PERMISSION = 'Browser.setPermission'
    SET_WINDOW_BOUNDS = 'Browser.setWindowBounds'


class SetPermissionParams(TypedDict):
    """Parameters for setting permission settings for given origin.

    ``permission`` and ``setting`` are required; ``origin`` and
    ``browserContextId`` may be omitted.
    """

    permission: PermissionDescriptor
    setting: PermissionSetting
    origin: NotRequired[str]
    browserContextId: NotRequired[BrowserContextID]


class GrantPermissionsParams(TypedDict):
    """Parameters for granting specific permissions to the given origin.

    ``permissions`` is a required list of ``PermissionType`` members; ``origin``
    and ``browserContextId`` may be omitted.
    """

    permissions: list[PermissionType]
    origin: NotRequired[str]
    browserContextId: NotRequired[BrowserContextID]


class ResetPermissionsParams(TypedDict):
    """Parameters for resetting all permission management for all origins.

    The single key, ``browserContextId``, may be omitted.
    """

    browserContextId: NotRequired[BrowserContextID]


class SetDownloadBehaviorParams(TypedDict):
    """Parameters for setting the behavior when downloading a file.

    Only ``behavior`` is required; ``browserContextId``, ``downloadPath`` and
    ``eventsEnabled`` may be omitted.
    """

    behavior: DownloadBehavior
    browserContextId: NotRequired[BrowserContextID]
    downloadPath: NotRequired[str]
    eventsEnabled: NotRequired[bool]


class CancelDownloadParams(TypedDict):
    """Parameters for cancelling a download if in progress.

    ``guid`` is required; ``browserContextId`` may be omitted.
    """

    guid: str
    browserContextId: NotRequired[BrowserContextID]


class GetHistogramsParams(TypedDict):
    """Parameters for getting Chrome histograms.

    Both keys, ``query`` and ``delta``, may be omitted.
    """

    query: NotRequired[str]
    delta: NotRequired[bool]


class GetHistogramParams(TypedDict):
    """Parameters for getting a Chrome histogram by name.

    ``name`` is required; ``delta`` may be omitted.
    """

    name: str
    delta: NotRequired[bool]


class GetWindowBoundsParams(TypedDict):
    """Parameters for getting position and size of the browser window.

    ``windowId`` is required and typed as ``WindowID``.
    """

    windowId: WindowID


class GetWindowForTargetParams(TypedDict):
    """Parameters for getting the browser window that contains the devtools target.

    The single key, ``targetId``, may be omitted.
    """

    targetId: NotRequired[str]  # Target.TargetID


class SetWindowBoundsParams(TypedDict):
    """Parameters for setting position and/or size of the browser window.

    Both keys are required; ``bounds`` is a ``Bounds`` dict whose own keys are
    all optional.
    """

    windowId: WindowID
    bounds: Bounds


class SetContentsSizeParams(TypedDict):
    """Parameters for setting size of the browser contents.

    ``windowId`` is required; ``width`` and ``height`` may be omitted.
    """

    windowId: WindowID
    width: NotRequired[int]
    height: NotRequired[int]


class SetDockTileParams(TypedDict):
    """Parameters for setting dock tile details, platform-specific.

    Both keys, ``badgeLabel`` and ``image``, may be omitted.
    """

    badgeLabel: NotRequired[str]
    image: NotRequired[str]  # Png encoded image (base64)


class ExecuteBrowserCommandParams(TypedDict):
    """Parameters for invoking custom browser commands used by telemetry.

    ``commandId`` is required and must be a ``BrowserCommandId`` member.
    """

    commandId: BrowserCommandId


class AddPrivacySandboxEnrollmentOverrideParams(TypedDict):
    """Parameters for allowing a site to use privacy sandbox features without enrollment.

    The single key, ``url``, is required.
    """

    url: str


class AddPrivacySandboxCoordinatorKeyConfigParams(TypedDict):
    """Parameters for configuring encryption keys for privacy sandbox API.

    ``api``, ``coordinatorOrigin`` and ``keyConfig`` are required;
    ``browserContextId`` may be omitted.
    """

    api: PrivacySandboxAPI
    coordinatorOrigin: str
    keyConfig: str
    browserContextId: NotRequired[BrowserContextID]


# Result types
class GetVersionResult(TypedDict):
    """Result for getVersion command; all five keys are required strings."""

    protocolVersion: str
    product: str
    revision: str
    userAgent: str
    jsVersion: str


class GetBrowserCommandLineResult(TypedDict):
    """Result for getBrowserCommandLine command; ``arguments`` is a list of strings."""

    arguments: list[str]


class GetHistogramsResult(TypedDict):
    """Result for getHistograms command; ``histograms`` is a list of ``Histogram`` dicts."""

    histograms: list[Histogram]


class GetHistogramResult(TypedDict):
    """Result for getHistogram command; ``histogram`` is a single ``Histogram`` dict."""

    histogram: Histogram


class GetWindowBoundsResult(TypedDict):
    """Result for getWindowBounds command; ``bounds`` is a ``Bounds`` dict."""

    bounds: Bounds


class GetWindowForTargetResult(TypedDict):
    """Result for getWindowForTarget command.

    Carries the ``windowId`` together with that window's ``bounds``; both keys
    are required.
    """

    windowId: WindowID
    bounds: Bounds


# Response types: the generic Response envelope bound to each command's result payload.
GetVersionResponse = Response[GetVersionResult]
GetBrowserCommandLineResponse = Response[GetBrowserCommandLineResult]
GetHistogramsResponse = Response[GetHistogramsResult]
GetHistogramResponse = Response[GetHistogramResult]
GetWindowBoundsResponse = Response[GetWindowBoundsResult]
GetWindowForTargetResponse = Response[GetWindowForTargetResult]


# Command types: Command[<params type>, <response type>] for every Browser method.
# Commands without arguments use EmptyParams; commands that return no payload use
# Response[EmptyResponse].
AddPrivacySandboxCoordinatorKeyConfigCommand = Command[
    AddPrivacySandboxCoordinatorKeyConfigParams, Response[EmptyResponse]
]
AddPrivacySandboxEnrollmentOverrideCommand = Command[
    AddPrivacySandboxEnrollmentOverrideParams, Response[EmptyResponse]
]
CancelDownloadCommand = Command[CancelDownloadParams, Response[EmptyResponse]]
CloseCommand = Command[EmptyParams, Response[EmptyResponse]]
CrashCommand = Command[EmptyParams, Response[EmptyResponse]]
CrashGpuProcessCommand = Command[EmptyParams, Response[EmptyResponse]]
ExecuteBrowserCommandCommand = Command[ExecuteBrowserCommandParams, Response[EmptyResponse]]
GetBrowserCommandLineCommand = Command[EmptyParams, GetBrowserCommandLineResponse]
GetHistogramCommand = Command[GetHistogramParams, GetHistogramResponse]
GetHistogramsCommand = Command[GetHistogramsParams, GetHistogramsResponse]
GetVersionCommand = Command[EmptyParams, GetVersionResponse]
GetWindowBoundsCommand = Command[GetWindowBoundsParams, GetWindowBoundsResponse]
GetWindowForTargetCommand = Command[GetWindowForTargetParams, GetWindowForTargetResponse]
GrantPermissionsCommand = Command[GrantPermissionsParams, Response[EmptyResponse]]
ResetPermissionsCommand = Command[ResetPermissionsParams, Response[EmptyResponse]]
SetContentsSizeCommand = Command[SetContentsSizeParams, Response[EmptyResponse]]
SetDockTileCommand = Command[SetDockTileParams, Response[EmptyResponse]]
SetDownloadBehaviorCommand = Command[SetDownloadBehaviorParams, Response[EmptyResponse]]
SetPermissionCommand = Command[SetPermissionParams, Response[EmptyResponse]]
SetWindowBoundsCommand = Command[SetWindowBoundsParams, Response[EmptyResponse]]


================================================
FILE: pydoll/protocol/browser/types.py
================================================
from enum import Enum

from typing_extensions import TypedDict

# Identifier aliases: plain ``str`` / ``int`` at runtime, named for readability in annotations.
BrowserContextID = str
WindowID = int


class WindowState(str, Enum):
    """The state of the browser window.

    Members are ``str`` instances whose values are the lowercase state names.
    """

    NORMAL = 'normal'
    MINIMIZED = 'minimized'
    MAXIMIZED = 'maximized'
    FULLSCREEN = 'fullscreen'


class DownloadBehavior(str, Enum):
    """Download behavior options.

    Used as the type of the ``behavior`` key of ``Browser.setDownloadBehavior``
    parameters. Members are ``str`` instances.
    """

    DENY = 'deny'
    ALLOW = 'allow'
    ALLOW_AND_NAME = 'allowAndName'
    DEFAULT = 'default'


class DownloadProgressState(str, Enum):
    """Download progress state.

    Type of the ``state`` key of the ``Browser.downloadProgress`` event parameters.
    """

    IN_PROGRESS = 'inProgress'
    COMPLETED = 'completed'
    CANCELED = 'canceled'


class Bounds(TypedDict, total=False):
    """Browser window bounds information.

    Declared with ``total=False``, so every key is optional.
    """

    left: int  # The offset from the left edge of the screen to the window in pixels.
    top: int  # The offset from the top edge of the screen to the window in pixels.
    width: int  # The window width in pixels.
    height: int  # The window height in pixels.
    windowState: WindowState  # The window state. Default to normal.


class PermissionType(str, Enum):
    """Permission types.

    Members are ``str`` instances whose values are the camelCase permission
    names; they are the element type of ``GrantPermissionsParams.permissions``.
    Members are listed alphabetically.
    """

    AR = 'ar'
    AUDIO_CAPTURE = 'audioCapture'
    AUTOMATIC_FULLSCREEN = 'automaticFullscreen'
    BACKGROUND_FETCH = 'backgroundFetch'
    BACKGROUND_SYNC = 'backgroundSync'
    CAMERA_PAN_TILT_ZOOM = 'cameraPanTiltZoom'
    CAPTURED_SURFACE_CONTROL = 'capturedSurfaceControl'
    CLIPBOARD_READ_WRITE = 'clipboardReadWrite'
    CLIPBOARD_SANITIZED_WRITE = 'clipboardSanitizedWrite'
    DISPLAY_CAPTURE = 'displayCapture'
    DURABLE_STORAGE = 'durableStorage'
    GEOLOCATION = 'geolocation'
    HAND_TRACKING = 'handTracking'
    IDLE_DETECTION = 'idleDetection'
    KEYBOARD_LOCK = 'keyboardLock'
    LOCAL_FONTS = 'localFonts'
    LOCAL_NETWORK_ACCESS = 'localNetworkAccess'
    MIDI = 'midi'
    MIDI_SYSEX = 'midiSysex'
    NFC = 'nfc'
    NOTIFICATIONS = 'notifications'
    PAYMENT_HANDLER = 'paymentHandler'
    PERIODIC_BACKGROUND_SYNC = 'periodicBackgroundSync'
    POINTER_LOCK = 'pointerLock'
    PROTECTED_MEDIA_IDENTIFIER = 'protectedMediaIdentifier'
    SENSORS = 'sensors'
    SMART_CARD = 'smartCard'
    SPEAKER_SELECTION = 'speakerSelection'
    STORAGE_ACCESS = 'storageAccess'
    TOP_LEVEL_STORAGE_ACCESS = 'topLevelStorageAccess'
    VIDEO_CAPTURE = 'videoCapture'
    VR = 'vr'
    WAKE_LOCK_SCREEN = 'wakeLockScreen'
    WAKE_LOCK_SYSTEM = 'wakeLockSystem'
    WEB_APP_INSTALLATION = 'webAppInstallation'
    WEB_PRINTING = 'webPrinting'
    WINDOW_MANAGEMENT = 'windowManagement'


class PermissionSetting(str, Enum):
    """Permission setting values.

    Type of the ``setting`` key of ``SetPermissionParams``.
    """

    GRANTED = 'granted'
    DENIED = 'denied'
    PROMPT = 'prompt'


class PermissionDescriptor(TypedDict, total=False):
    """Definition of PermissionDescriptor defined in the Permissions API.

    See https://w3c.github.io/permissions/#dom-permissiondescriptor.

    Declared with ``total=False``, so no key is enforced by the type checker;
    the per-key comments describe which permission each flag applies to.
    """

    name: str  # Name of permission.
    sysex: bool  # For "midi" permission, may also specify sysex control.
    userVisibleOnly: bool  # For "push" permission, may specify userVisibleOnly.
    allowWithoutSanitization: (
        bool  # For "clipboard" permission, may specify allowWithoutSanitization.
    )
    allowWithoutGesture: bool  # For "fullscreen" permission, must specify allowWithoutGesture:true.
    panTiltZoom: bool  # For "camera" permission, may specify panTiltZoom.


class BrowserCommandId(str, Enum):
    """Browser command ids used by executeBrowserCommand.

    Type of the ``commandId`` key of ``ExecuteBrowserCommandParams``.
    """

    OPEN_TAB_SEARCH = 'openTabSearch'
    CLOSE_TAB_SEARCH = 'closeTabSearch'
    OPEN_GLIC = 'openGlic'


class Bucket(TypedDict):
    """Chrome histogram bucket.

    Describes the half-open range ``[low, high)`` and how many samples fell into it.
    """

    low: int  # Minimum value (inclusive).
    high: int  # Maximum value (exclusive).
    count: int  # Number of samples.


class Histogram(TypedDict):
    """Chrome histogram.

    All four keys are required; ``buckets`` holds ``Bucket`` dicts.
    """

    name: str  # Name.
    sum: int  # Sum of sample values.
    count: int  # Total number of samples.
    buckets: list['Bucket']  # Buckets.


class PrivacySandboxAPI(str, Enum):
    """Privacy Sandbox API types.

    Type of the ``api`` key of ``AddPrivacySandboxCoordinatorKeyConfigParams``.
    Unlike the other enums in this module, the values are PascalCase.
    """

    BIDDING_AND_AUCTION_SERVICES = 'BiddingAndAuctionServices'
    TRUSTED_KEY_VALUE = 'TrustedKeyValue'


================================================
FILE: pydoll/protocol/debugger/types.py
================================================
from typing_extensions import TypedDict


class SearchMatch(TypedDict):
    """A single search match: the line number (typed as ``float``) and that line's content."""

    lineNumber: float
    lineContent: str


================================================
FILE: pydoll/protocol/dom/__init__.py
================================================
"""DOM domain implementation."""


================================================
FILE: pydoll/protocol/dom/events.py
================================================
from enum import Enum

from typing_extensions import TypedDict

from pydoll.protocol.base import CDPEvent
from pydoll.protocol.dom.types import BackendNode, Node, NodeId


class DomEvent(str, Enum):
    """
    Events from the DOM domain of the Chrome DevTools Protocol.

    This enumeration contains the names of DOM-related events that can be
    received from the Chrome DevTools Protocol. These events provide information
    about changes to the DOM structure, attributes, and other DOM-related activities.

    Each member is also a ``str`` whose value is the ``DOM.<event>`` name. The string
    literal following a member documents that event's payload; the matching
    ``*EventParams`` TypedDicts in this module declare the same keys.
    """

    ATTRIBUTE_MODIFIED = 'DOM.attributeModified'
    """
    Fired when Element's attribute is modified.

    Args:
        nodeId (NodeId): Id of the node that has changed.
        name (str): Attribute name.
        value (str): Attribute value.
    """

    ATTRIBUTE_REMOVED = 'DOM.attributeRemoved'
    """
    Fired when Element's attribute is removed.

    Args:
        nodeId (NodeId): Id of the node that has changed.
        name (str): Attribute name.
    """

    CHARACTER_DATA_MODIFIED = 'DOM.characterDataModified'
    """
    Mirrors DOMCharacterDataModified event.

    Args:
        nodeId (NodeId): Id of the node that has changed.
        characterData (str): New text value.
    """

    CHILD_NODE_COUNT_UPDATED = 'DOM.childNodeCountUpdated'
    """
    Fired when Container's child node count has changed.

    Args:
        nodeId (NodeId): Id of the node that has changed.
        childNodeCount (int): New node count.
    """

    CHILD_NODE_INSERTED = 'DOM.childNodeInserted'
    """
    Mirrors DOMNodeInserted event.

    Args:
        parentNodeId (NodeId): Id of the node that has changed.
        previousNodeId (NodeId): Id of the previous sibling.
        node (Node): Inserted node data.
    """

    CHILD_NODE_REMOVED = 'DOM.childNodeRemoved'
    """
    Mirrors DOMNodeRemoved event.

    Args:
        parentNodeId (NodeId): Parent id.
        nodeId (NodeId): Id of the node that has been removed.
    """

    DISTRIBUTED_NODES_UPDATED = 'DOM.distributedNodesUpdated'
    """
    Called when distribution is changed.

    Args:
        insertionPointId (NodeId): Insertion point where distributed nodes were updated.
        distributedNodes (array[BackendNode]): Distributed nodes for given insertion point.
    """

    DOCUMENT_UPDATED = 'DOM.documentUpdated'
    """
    Fired when Document has been totally updated. Node ids are no longer valid.
    """

    INLINE_STYLE_INVALIDATED = 'DOM.inlineStyleInvalidated'
    """
    Fired when Element's inline style is modified via a CSS property modification.

    Args:
        nodeIds (array[NodeId]): Ids of the nodes for which the inline styles have been invalidated.
    """

    PSEUDO_ELEMENT_ADDED = 'DOM.pseudoElementAdded'
    """
    Called when a pseudo element is added to an element.

    Args:
        parentId (NodeId): Pseudo element's parent element id.
        pseudoElement (Node): The added pseudo element.
    """

    PSEUDO_ELEMENT_REMOVED = 'DOM.pseudoElementRemoved'
    """
    Called when a pseudo element is removed from an element.

    Args:
        parentId (NodeId): Pseudo element's parent element id.
        pseudoElementId (NodeId): The removed pseudo element id.
    """

    SCROLLABLE_FLAG_UPDATED = 'DOM.scrollableFlagUpdated'
    """
    Fired when a node's scrollability state changes.

    Args:
        nodeId (DOM.NodeId): The id of the node.
        isScrollable (bool): If the node is scrollable.
    """

    SHADOW_ROOT_POPPED = 'DOM.shadowRootPopped'
    """
    Called when shadow root is popped from the element.

    Args:
        hostId (NodeId): Host element id.
        rootId (NodeId): Shadow root id.
    """

    SHADOW_ROOT_PUSHED = 'DOM.shadowRootPushed'
    """
    Called when shadow root is pushed into the element.

    Args:
        hostId (NodeId): Host element id.
        root (Node): Shadow root.
    """

    SET_CHILD_NODES = 'DOM.setChildNodes'
    """
    Fired when backend wants to provide client with the missing DOM structure.
    This happens upon most of the calls requesting node ids.

    Args:
        parentId (NodeId): Parent node id to populate with children.
        nodes (array[Node]): Child nodes array.
    """

    TOP_LAYER_ELEMENTS_UPDATED = 'DOM.topLayerElementsUpdated'
    """
    Called when top layer elements are changed.
    """


# Event parameter types
class AttributeModifiedEventParams(TypedDict):
    """Parameters for attributeModified event.

    Identifies the node and carries the attribute's name and value; all keys
    are required.
    """

    nodeId: NodeId
    name: str
    value: str


class AttributeRemovedEventParams(TypedDict):
    """Payload of the ``attributeRemoved`` DOM event.

    All keys are required (the TypedDict is total).
    """

    nodeId: NodeId  # node the event refers to
    name: str  # attribute name


class CharacterDataModifiedEventParams(TypedDict):
    """Payload of the ``characterDataModified`` DOM event.

    All keys are required (the TypedDict is total).
    """

    nodeId: NodeId  # node the event refers to
    characterData: str  # text carried by the event


class ChildNodeCountUpdatedEventParams(TypedDict):
    """Payload of the ``childNodeCountUpdated`` DOM event.

    All keys are required (the TypedDict is total).
    """

    nodeId: NodeId  # node the event refers to
    childNodeCount: int  # child count reported by the event


class ChildNodeInsertedEventParams(TypedDict):
    """Payload of the ``childNodeInserted`` DOM event.

    All keys are required (the TypedDict is total).
    """

    parentNodeId: NodeId  # parent that received the new child
    # NOTE(review): presumably the sibling preceding the inserted node — confirm in CDP docs.
    previousNodeId: NodeId
    node: Node  # the inserted node description


class ChildNodeRemovedEventParams(TypedDict):
    """Payload of the ``childNodeRemoved`` DOM event.

    All keys are required (the TypedDict is total).
    """

    parentNodeId: NodeId  # parent the child was removed from
    nodeId: NodeId  # id of the removed child


class DistributedNodesUpdatedEventParams(TypedDict):
    """Payload of the ``distributedNodesUpdated`` DOM event.

    All keys are required (the TypedDict is total).
    """

    insertionPointId: NodeId  # id of the insertion point the event refers to
    distributedNodes: list[BackendNode]  # backend-node descriptors carried by the event


class DocumentUpdatedEventParams(TypedDict):
    """Payload of the ``documentUpdated`` DOM event; it declares no keys."""


class InlineStyleInvalidatedEventParams(TypedDict):
    """Payload of the ``inlineStyleInvalidated`` DOM event."""

    nodeIds: list[NodeId]  # ids of the nodes whose inline styles have been invalidated


class PseudoElementAddedEventParams(TypedDict):
    """Payload of the ``pseudoElementAdded`` DOM event.

    All keys are required (the TypedDict is total).
    """

    parentId: NodeId  # pseudo element's parent element id
    pseudoElement: Node  # the added pseudo element


class PseudoElementRemovedEventParams(TypedDict):
    """Payload of the ``pseudoElementRemoved`` DOM event.

    All keys are required (the TypedDict is total).
    """

    parentId: NodeId  # pseudo element's parent element id
    pseudoElementId: NodeId  # id of the removed pseudo element


class ScrollableFlagUpdatedEventParams(TypedDict):
    """Payload of the ``scrollableFlagUpdated`` DOM event.

    All keys are required (the TypedDict is total).
    """

    nodeId: NodeId  # id of the node whose scrollability changed
    isScrollable: bool  # whether the node is scrollable


class ShadowRootPoppedEventParams(TypedDict):
    """Payload of the ``shadowRootPopped`` DOM event.

    All keys are required (the TypedDict is total).
    """

    hostId: NodeId  # host element id
    rootId: NodeId  # shadow root id


class ShadowRootPushedEventParams(TypedDict):
    """Payload of the ``shadowRootPushed`` DOM event.

    All keys are required (the TypedDict is total).
    """

    hostId: NodeId  # host element id
    root: Node  # the pushed shadow root


class SetChildNodesEventParams(TypedDict):
    """Payload of the ``setChildNodes`` DOM event.

    All keys are required (the TypedDict is total).
    """

    parentId: NodeId  # parent node id to populate with children
    nodes: list[Node]  # child nodes array


class TopLayerElementsUpdatedEventParams(TypedDict):
    """Payload of the ``topLayerElementsUpdated`` DOM event; it declares no keys."""


# Event types
# One alias per DOM event: the generic CDPEvent parameterized with that
# event's params TypedDict.
AttributeModifiedEvent = CDPEvent[AttributeModifiedEventParams]
AttributeRemovedEvent = CDPEvent[AttributeRemovedEventParams]
CharacterDataModifiedEvent = CDPEvent[CharacterDataModifiedEventParams]
ChildNodeCountUpdatedEvent = CDPEvent[ChildNodeCountUpdatedEventParams]
ChildNodeInsertedEvent = CDPEvent[ChildNodeInsertedEventParams]
ChildNodeRemovedEvent = CDPEvent[ChildNodeRemovedEventParams]
DistributedNodesUpdatedEvent = CDPEvent[DistributedNodesUpdatedEventParams]
DocumentUpdatedEvent = CDPEvent[DocumentUpdatedEventParams]
InlineStyleInvalidatedEvent = CDPEvent[InlineStyleInvalidatedEventParams]
PseudoElementAddedEvent = CDPEvent[PseudoElementAddedEventParams]
PseudoElementRemovedEvent = CDPEvent[PseudoElementRemovedEventParams]
ScrollableFlagUpdatedEvent = CDPEvent[ScrollableFlagUpdatedEventParams]
ShadowRootPoppedEvent = CDPEvent[ShadowRootPoppedEventParams]
ShadowRootPushedEvent = CDPEvent[ShadowRootPushedEventParams]
SetChildNodesEvent = CDPEvent[SetChildNodesEventParams]
TopLayerElementsUpdatedEvent = CDPEvent[TopLayerElementsUpdatedEventParams]


================================================
FILE: pydoll/protocol/dom/methods.py
================================================
from enum import Enum

from typing_extensions import TypedDict

from pydoll.protocol.base import Command, EmptyParams, EmptyResponse, Response
from pydoll.protocol.dom.types import (
    BackendNodeId,
    BoxModel,
    CSSComputedStyleProperty,
    DetachedElementInfo,
    IncludeWhitespace,
    LogicalAxes,
    Node,
    NodeId,
    PhysicalAxes,
    Quad,
    Rect,
    RelationType,
)
from pydoll.protocol.page.types import FrameId
from pydoll.protocol.runtime.types import (
    ExecutionContextId,
    RemoteObject,
    RemoteObjectId,
    StackTrace,
)


class DomMethod(str, Enum):
    """DOM domain method names.

    Each member's value is the ``DOM.<method>`` string for that command.
    Because the enum mixes in ``str``, members compare equal to their raw
    string values.
    """

    COLLECT_CLASS_NAMES_FROM_SUBTREE = 'DOM.collectClassNamesFromSubtree'
    COPY_TO = 'DOM.copyTo'
    DESCRIBE_NODE = 'DOM.describeNode'
    DISABLE = 'DOM.disable'
    DISCARD_SEARCH_RESULTS = 'DOM.discardSearchResults'
    ENABLE = 'DOM.enable'
    FOCUS = 'DOM.focus'
    FORCE_SHOW_POPOVER = 'DOM.forceShowPopover'
    GET_ANCHOR_ELEMENT = 'DOM.getAnchorElement'
    GET_ATTRIBUTES = 'DOM.getAttributes'
    GET_BOX_MODEL = 'DOM.getBoxModel'
    GET_CONTAINER_FOR_NODE = 'DOM.getContainerForNode'
    GET_CONTENT_QUADS = 'DOM.getContentQuads'
    GET_DETACHED_DOM_NODES = 'DOM.getDetachedDomNodes'
    GET_DOCUMENT = 'DOM.getDocument'
    GET_ELEMENT_BY_RELATION = 'DOM.getElementByRelation'
    GET_FILE_INFO = 'DOM.getFileInfo'
    GET_FLATTENED_DOCUMENT = 'DOM.getFlattenedDocument'
    GET_FRAME_OWNER = 'DOM.getFrameOwner'
    GET_NODE_FOR_LOCATION = 'DOM.getNodeForLocation'
    GET_NODE_STACK_TRACES = 'DOM.getNodeStackTraces'
    GET_NODES_FOR_SUBTREE_BY_STYLE = 'DOM.getNodesForSubtreeByStyle'
    GET_OUTER_HTML = 'DOM.getOuterHTML'
    GET_QUERYING_DESCENDANTS_FOR_CONTAINER = 'DOM.getQueryingDescendantsForContainer'
    GET_RELAYOUT_BOUNDARY = 'DOM.getRelayoutBoundary'
    GET_SEARCH_RESULTS = 'DOM.getSearchResults'
    GET_TOP_LAYER_ELEMENTS = 'DOM.getTopLayerElements'
    HIDE_HIGHLIGHT = 'DOM.hideHighlight'
    HIGHLIGHT_NODE = 'DOM.highlightNode'
    HIGHLIGHT_RECT = 'DOM.highlightRect'
    MARK_UNDOABLE_STATE = 'DOM.markUndoableState'
    MOVE_TO = 'DOM.moveTo'
    PERFORM_SEARCH = 'DOM.performSearch'
    PUSH_NODE_BY_PATH_TO_FRONTEND = 'DOM.pushNodeByPathToFrontend'
    PUSH_NODES_BY_BACKEND_IDS_TO_FRONTEND = 'DOM.pushNodesByBackendIdsToFrontend'
    QUERY_SELECTOR = 'DOM.querySelector'
    QUERY_SELECTOR_ALL = 'DOM.querySelectorAll'
    REDO = 'DOM.redo'
    REMOVE_ATTRIBUTE = 'DOM.removeAttribute'
    REMOVE_NODE = 'DOM.removeNode'
    REQUEST_CHILD_NODES = 'DOM.requestChildNodes'
    REQUEST_NODE = 'DOM.requestNode'
    RESOLVE_NODE = 'DOM.resolveNode'
    SCROLL_INTO_VIEW_IF_NEEDED = 'DOM.scrollIntoViewIfNeeded'
    SET_ATTRIBUTE_VALUE = 'DOM.setAttributeValue'
    SET_ATTRIBUTES_AS_TEXT = 'DOM.setAttributesAsText'
    SET_FILE_INPUT_FILES = 'DOM.setFileInputFiles'
    SET_INSPECTED_NODE = 'DOM.setInspectedNode'
    SET_NODE_NAME = 'DOM.setNodeName'
    SET_NODE_STACK_TRACES_ENABLED = 'DOM.setNodeStackTracesEnabled'
    SET_NODE_VALUE = 'DOM.setNodeValue'
    SET_OUTER_HTML = 'DOM.setOuterHTML'
    UNDO = 'DOM.undo'


class CollectClassNamesFromSubtreeParams(TypedDict):
    """Parameters for the ``collectClassNamesFromSubtree`` command.

    ``nodeId`` is required (the TypedDict is total).
    """

    nodeId: NodeId


class CopyToParams(TypedDict, total=False):
    """Parameters for the ``copyTo`` command.

    Declared with ``total=False``, so every key is optional to the type checker.
    NOTE(review): presumably only ``insertBeforeNodeId`` is optional on the wire —
    confirm against the CDP DOM reference.
    """

    nodeId: NodeId
    targetNodeId: NodeId
    insertBeforeNodeId: NodeId


class DescribeNodeParams(TypedDict, total=False):
    """Parameters for the ``describeNode`` command.

    Declared with ``total=False``, so every key is optional to the type checker.
    """

    # Three alternative handles for the node.
    # NOTE(review): presumably the caller supplies one of them — confirm.
    nodeId: NodeId
    backendNodeId: BackendNodeId
    objectId: RemoteObjectId
    depth: int
    pierce: bool


class ScrollIntoViewIfNeededParams(TypedDict, total=False):
    """Parameters for the ``scrollIntoViewIfNeeded`` command.

    Declared with ``total=False``, so every key is optional to the type checker.
    """

    # Three alternative handles for the node.
    # NOTE(review): presumably the caller supplies one of them — confirm.
    nodeId: NodeId
    backendNodeId: BackendNodeId
    objectId: RemoteObjectId
    rect: Rect


class DiscardSearchResultsParams(TypedDict):
    """Parameters for the ``discardSearchResults`` command.

    ``searchId`` is required (the TypedDict is total).
    """

    searchId: str


class EnableParams(TypedDict, total=False):
    """Parameters for the DOM ``enable`` command.

    Declared with ``total=False``, so ``includeWhitespace`` may be omitted.
    """

    includeWhitespace: IncludeWhitespace


class FocusParams(TypedDict, total=False):
    """Parameters for the ``focus`` command.

    Declared with ``total=False``, so every key is optional to the type checker.
    """

    # Three alternative handles for the node.
    # NOTE(review): presumably the caller supplies one of them — confirm.
    nodeId: NodeId
    backendNodeId: BackendNodeId
    objectId: RemoteObjectId


class GetAttributesParams(TypedDict):
    """Parameters for the ``getAttributes`` command.

    ``nodeId`` is required (the TypedDict is total).
    """

    nodeId: NodeId


class GetBoxModelParams(TypedDict, total=False):
    """Parameters for the ``getBoxModel`` command.

    Declared with ``total=False``, so every key is optional to the type checker.
    """

    # Three alternative handles for the node.
    # NOTE(review): presumably the caller supplies one of them — confirm.
    nodeId: NodeId
    backendNodeId: BackendNodeId
    objectId: RemoteObjectId


class GetContentQuadsParams(TypedDict, total=False):
    """Parameters for the ``getContentQuads`` command.

    Declared with ``total=False``, so every key is optional to the type checker.
    """

    # Three alternative handles for the node.
    # NOTE(review): presumably the caller supplies one of them — confirm.
    nodeId: NodeId
    backendNodeId: BackendNodeId
    objectId: RemoteObjectId


class GetDocumentParams(TypedDict, total=False):
    """Parameters for the ``getDocument`` command.

    Declared with ``total=False``, so both keys may be omitted.
    """

    depth: int
    pierce: bool


class GetFlattenedDocumentParams(TypedDict, total=False):
    """Parameters for the ``getFlattenedDocument`` command.

    Declared with ``total=False``, so both keys may be omitted.
    """

    depth: int
    pierce: bool


class GetNodesForSubtreeByStyleParams(TypedDict, total=False):
    """Parameters for the ``getNodesForSubtreeByStyle`` command.

    Declared with ``total=False``, so every key is optional to the type checker.
    """

    nodeId: NodeId
    computedStyles: list[CSSComputedStyleProperty]  # name/value pairs to match
    pierce: bool


class GetNodeForLocationParams(TypedDict, total=False):
    """Parameters for the ``getNodeForLocation`` command.

    Declared with ``total=False``, so every key is optional to the type checker.
    NOTE(review): ``x`` and ``y`` are presumably mandatory on the wire — confirm.
    """

    x: int
    y: int
    includeUserAgentShadowDOM: bool
    ignorePointerEventsNone: bool


class GetOuterHTMLParams(TypedDict, total=False):
    """Parameters for the ``getOuterHTML`` command.

    Declared with ``total=False``, so every key is optional to the type checker.
    """

    # Three alternative handles for the node.
    # NOTE(review): presumably the caller supplies one of them — confirm.
    nodeId: NodeId
    backendNodeId: BackendNodeId
    objectId: RemoteObjectId
    includeShadowDOM: bool


class GetRelayoutBoundaryParams(TypedDict):
    """Parameters for the ``getRelayoutBoundary`` command.

    ``nodeId`` is required (the TypedDict is total).
    """

    nodeId: NodeId


class GetSearchResultsParams(TypedDict):
    """Parameters for the ``getSearchResults`` command.

    All keys are required (the TypedDict is total).
    """

    searchId: str
    # NOTE(review): index-range bounds; inclusive/exclusive semantics not visible here.
    fromIndex: int
    toIndex: int


class MoveToParams(TypedDict, total=False):
    """Parameters for the ``moveTo`` command.

    Declared with ``total=False``, so every key is optional to the type checker.
    NOTE(review): presumably only ``insertBeforeNodeId`` is optional on the wire —
    confirm against the CDP DOM reference.
    """

    nodeId: NodeId
    targetNodeId: NodeId
    insertBeforeNodeId: NodeId


class PerformSearchParams(TypedDict, total=False):
    """Parameters for the ``performSearch`` command.

    Declared with ``total=False``, so every key is optional to the type checker.
    NOTE(review): ``query`` is presumably mandatory on the wire — confirm.
    """

    query: str
    includeUserAgentShadowDOM: bool


class PushNodeByPathToFrontendParams(TypedDict):
    """Parameters for the ``pushNodeByPathToFrontend`` command.

    ``path`` is required (the TypedDict is total).
    """

    path: str


class PushNodesByBackendIdsToFrontendParams(TypedDict):
    """Parameters for the ``pushNodesByBackendIdsToFrontend`` command.

    ``backendNodeIds`` is required (the TypedDict is total).
    """

    backendNodeIds: list[BackendNodeId]


class QuerySelectorParams(TypedDict):
    """Parameters for the ``querySelector`` command.

    All keys are required (the TypedDict is total).
    """

    nodeId: NodeId  # node the query is issued on
    selector: str  # selector string


class QuerySelectorAllParams(TypedDict):
    """Parameters for the ``querySelectorAll`` command.

    All keys are required (the TypedDict is total).
    """

    nodeId: NodeId  # node the query is issued on
    selector: str  # selector string


class GetElementByRelationParams(TypedDict):
    """Parameters for the ``getElementByRelation`` command.

    All keys are required (the TypedDict is total).
    """

    nodeId: NodeId
    relation: RelationType  # which relation to follow from the node


class RemoveAttributeParams(TypedDict):
    """Parameters for the ``removeAttribute`` command.

    All keys are required (the TypedDict is total).
    """

    nodeId: NodeId
    name: str  # attribute name


class RemoveNodeParams(TypedDict):
    """Parameters for the ``removeNode`` command.

    ``nodeId`` is required (the TypedDict is total).
    """

    nodeId: NodeId


class RequestChildNodesParams(TypedDict, total=False):
    """Parameters for the ``requestChildNodes`` command.

    Declared with ``total=False``, so every key is optional to the type checker.
    NOTE(review): ``nodeId`` is presumably mandatory on the wire — confirm.
    """

    nodeId: NodeId
    depth: int
    pierce: bool


class RequestNodeParams(TypedDict):
    """Parameters for the ``requestNode`` command.

    ``objectId`` is required (the TypedDict is total).
    """

    objectId: RemoteObjectId


class ResolveNodeParams(TypedDict, total=False):
    """Parameters for the ``resolveNode`` command.

    Declared with ``total=False``, so every key is optional to the type checker.
    """

    nodeId: NodeId
    backendNodeId: BackendNodeId
    objectGroup: str
    executionContextId: ExecutionContextId


class SetAttributeValueParams(TypedDict):
    """Parameters for the ``setAttributeValue`` command.

    All keys are required (the TypedDict is total).
    """

    nodeId: NodeId
    name: str  # attribute name
    value: str  # attribute value


class SetAttributesAsTextParams(TypedDict, total=False):
    """Parameters for the ``setAttributesAsText`` command.

    Declared with ``total=False``, so every key is optional to the type checker.
    NOTE(review): ``nodeId`` and ``text`` are presumably mandatory on the wire —
    confirm against the CDP DOM reference.
    """

    nodeId: NodeId
    text: str
    name: str


class SetFileInputFilesParams(TypedDict, total=False):
    """Parameters for the ``setFileInputFiles`` command.

    Declared with ``total=False``, so every key is optional to the type checker.
    NOTE(review): ``files`` is presumably mandatory on the wire — confirm.
    """

    files: list[str]
    # Three alternative handles for the node.
    # NOTE(review): presumably the caller supplies one of them — confirm.
    nodeId: NodeId
    backendNodeId: BackendNodeId
    objectId: RemoteObjectId


class SetNodeStackTracesEnabledParams(TypedDict):
    """Parameters for the ``setNodeStackTracesEnabled`` command.

    ``enable`` is required (the TypedDict is total).
    """

    enable: bool


class GetNodeStackTracesParams(TypedDict):
    """Parameters for the ``getNodeStackTraces`` command.

    ``nodeId`` is required (the TypedDict is total).
    """

    nodeId: NodeId


class GetFileInfoParams(TypedDict):
    """Parameters for the ``getFileInfo`` command.

    ``objectId`` is required (the TypedDict is total).
    """

    objectId: RemoteObjectId


class SetInspectedNodeParams(TypedDict):
    """Parameters for the ``setInspectedNode`` command.

    ``nodeId`` is required (the TypedDict is total).
    """

    nodeId: NodeId


class SetNodeNameParams(TypedDict):
    """Parameters for the ``setNodeName`` command.

    All keys are required (the TypedDict is total).
    """

    nodeId: NodeId
    name: str  # new node name


class SetNodeValueParams(TypedDict):
    """Parameters for the ``setNodeValue`` command.

    All keys are required (the TypedDict is total).
    """

    nodeId: NodeId
    value: str  # new node value


class SetOuterHTMLParams(TypedDict):
    """Parameters for the ``setOuterHTML`` command.

    All keys are required (the TypedDict is total).
    """

    nodeId: NodeId
    outerHTML: str  # markup to set for the node


class GetFrameOwnerParams(TypedDict):
    """Parameters for the ``getFrameOwner`` command.

    ``frameId`` is required (the TypedDict is total).
    """

    frameId: FrameId


class GetContainerForNodeParams(TypedDict, total=False):
    """Parameters for the ``getContainerForNode`` command.

    Declared with ``total=False``, so every key is optional to the type checker.
    NOTE(review): ``nodeId`` is presumably mandatory on the wire — confirm.
    """

    nodeId: NodeId
    containerName: str
    physicalAxes: PhysicalAxes
    logicalAxes: LogicalAxes
    queriesScrollState: bool
    queriesAnchored: bool


class GetQueryingDescendantsForContainerParams(TypedDict):
    """Parameters for the ``getQueryingDescendantsForContainer`` command.

    ``nodeId`` is required (the TypedDict is total).
    """

    nodeId: NodeId


class GetAnchorElementParams(TypedDict, total=False):
    """Parameters for the ``getAnchorElement`` command.

    Declared with ``total=False``, so every key is optional to the type checker.
    NOTE(review): ``nodeId`` is presumably mandatory on the wire — confirm.
    """

    nodeId: NodeId
    anchorSpecifier: str


class ForceShowPopoverParams(TypedDict):
    """Parameters for the ``forceShowPopover`` command.

    All keys are required (the TypedDict is total).
    """

    nodeId: NodeId
    enable: bool  # on/off flag for the forced state


# Result types
class CollectClassNamesFromSubtreeResult(TypedDict):
    """Result payload of the ``collectClassNamesFromSubtree`` command."""

    classNames: list[str]  # class names returned by the command


class CopyToResult(TypedDict):
    """Result payload of the ``copyTo`` command."""

    nodeId: NodeId  # presumably the id of the created copy — confirm


class DescribeNodeResult(TypedDict):
    """Result payload of the ``describeNode`` command."""

    node: Node  # node description


class GetAttributesResult(TypedDict):
    """Result payload of the ``getAttributes`` command."""

    # NOTE(review): presumably a flat, interleaved name/value list — confirm in CDP docs.
    attributes: list[str]


class GetBoxModelResult(TypedDict):
    """Result payload of the ``getBoxModel`` command."""

    model: BoxModel  # box model of the requested node


class GetContentQuadsResult(TypedDict):
    """Result payload of the ``getContentQuads`` command."""

    quads: list[Quad]  # each Quad is a flat list of floats (see the Quad alias)


class GetDocumentResult(TypedDict):
    """Result payload of the ``getDocument`` command."""

    root: Node  # root node returned by the command


class GetFlattenedDocumentResult(TypedDict):
    """Result payload of the ``getFlattenedDocument`` command."""

    nodes: list[Node]  # nodes returned as a flat list


class GetNodesForSubtreeByStyleResult(TypedDict):
    """Result payload of the ``getNodesForSubtreeByStyle`` command."""

    nodeIds: list[NodeId]  # ids of the nodes returned by the command


class GetNodeForLocationResult(TypedDict, total=False):
    """Result payload of the ``getNodeForLocation`` command.

    Declared with ``total=False``, so consumers must treat every key as
    possibly absent.
    """

    backendNodeId: BackendNodeId
    frameId: FrameId
    nodeId: NodeId


class GetOuterHTMLResult(TypedDict):
    """Result payload of the ``getOuterHTML`` command."""

    outerHTML: str  # markup returned for the node


class GetRelayoutBoundaryResult(TypedDict):
    """Result payload of the ``getRelayoutBoundary`` command."""

    nodeId: NodeId  # id of the relayout boundary node


class GetSearchResultsResult(TypedDict):
    """Result payload of the ``getSearchResults`` command."""

    nodeIds: list[NodeId]  # ids of the search result nodes


class GetTopLayerElementsResult(TypedDict):
    """Result payload of the ``getTopLayerElements`` command."""

    nodeIds: list[NodeId]  # ids of the top layer elements


class GetElementByRelationResult(TypedDict):
    """Result payload of the ``getElementByRelation`` command."""

    nodeId: NodeId  # id of the related element


class MoveToResult(TypedDict):
    """Result payload of the ``moveTo`` command."""

    nodeId: NodeId  # presumably the node's id after the move — confirm


class PerformSearchResult(TypedDict):
    """Result payload of the ``performSearch`` command.

    Both keys are required (the TypedDict is total).
    """

    searchId: str  # same key name as in the getSearchResults/discardSearchResults params
    resultCount: int  # number of results


class PushNodeByPathToFrontendResult(TypedDict):
    """Result payload of the ``pushNodeByPathToFrontend`` command."""

    nodeId: NodeId  # id of the node for the given path


class PushNodesByBackendIdsToFrontendResult(TypedDict):
    """Result payload of the ``pushNodesByBackendIdsToFrontend`` command."""

    # NOTE(review): presumably positionally aligned with the requested backendNodeIds — confirm.
    nodeIds: list[NodeId]


class QuerySelectorResult(TypedDict):
    """Result payload of the ``querySelector`` command."""

    nodeId: NodeId  # id of the query result node


class QuerySelectorAllResult(TypedDict):
    """Result payload of the ``querySelectorAll`` command."""

    nodeIds: list[NodeId]  # ids of the query result nodes


class RequestNodeResult(TypedDict):
    """Result payload of the ``requestNode`` command."""

    nodeId: NodeId  # node id for the given remote object


class ResolveNodeResult(TypedDict):
    """Result payload of the ``resolveNode`` command."""

    object: RemoteObject  # Runtime-domain remote object for the node


class SetNodeNameResult(TypedDict):
    """Result payload of the ``setNodeName`` command."""

    nodeId: NodeId  # presumably the id of the renamed node — confirm


class GetNodeStackTracesResult(TypedDict, total=False):
    """Result payload of the ``getNodeStackTraces`` command.

    Declared with ``total=False``, so ``creation`` may be absent.
    """

    creation: StackTrace


class GetFileInfoResult(TypedDict):
    """Result payload of the ``getFileInfo`` command."""

    path: str  # file path returned by the command


class GetDetachedDomNodesResult(TypedDict):
    """Result payload of the ``getDetachedDomNodes`` command."""

    detachedNodes: list[DetachedElementInfo]  # one entry per detached tree


class GetFrameOwnerResult(TypedDict, total=False):
    """Result payload of the ``getFrameOwner`` command.

    Declared with ``total=False``, so consumers must treat both keys as
    possibly absent.
    """

    backendNodeId: BackendNodeId
    nodeId: NodeId


class GetContainerForNodeResult(TypedDict, total=False):
    """Result payload of the ``getContainerForNode`` command.

    Declared with ``total=False``, so ``nodeId`` may be absent.
    """

    nodeId: NodeId


class GetQueryingDescendantsForContainerResult(TypedDict):
    """Result payload of the ``getQueryingDescendantsForContainer`` command."""

    nodeIds: list[NodeId]  # ids of the descendant nodes returned by the command


class GetAnchorElementResult(TypedDict):
    """Result payload of the ``getAnchorElement`` command."""

    nodeId: NodeId  # id of the anchor element


class ForceShowPopoverResult(TypedDict):
    """Result payload of the ``forceShowPopover`` command."""

    # NOTE(review): meaning of the returned ids is not visible here — see the CDP DOM reference.
    nodeIds: list[NodeId]


# Response types
# One alias per result-bearing command: the generic Response parameterized
# with that command's result TypedDict.
CollectClassNamesFromSubtreeResponse = Response[CollectClassNamesFromSubtreeResult]
CopyToResponse = Response[CopyToResult]
DescribeNodeResponse = Response[DescribeNodeResult]
GetAttributesResponse = Response[GetAttributesResult]
GetBoxModelResponse = Response[GetBoxModelResult]
GetContentQuadsResponse = Response[GetContentQuadsResult]
GetDocumentResponse = Response[GetDocumentResult]
GetFlattenedDocumentResponse = Response[GetFlattenedDocumentResult]
GetNodesForSubtreeByStyleResponse = Response[GetNodesForSubtreeByStyleResult]
GetNodeForLocationResponse = Response[GetNodeForLocationResult]
GetOuterHTMLResponse = Response[GetOuterHTMLResult]
GetRelayoutBoundaryResponse = Response[GetRelayoutBoundaryResult]
GetSearchResultsResponse = Response[GetSearchResultsResult]
GetTopLayerElementsResponse = Response[GetTopLayerElementsResult]
GetElementByRelationResponse = Response[GetElementByRelationResult]
MoveToResponse = Response[MoveToResult]
PerformSearchResponse = Response[PerformSearchResult]
PushNodeByPathToFrontendResponse = Response[PushNodeByPathToFrontendResult]
PushNodesByBackendIdsToFrontendResponse = Response[PushNodesByBackendIdsToFrontendResult]
QuerySelectorResponse = Response[QuerySelectorResult]
QuerySelectorAllResponse = Response[QuerySelectorAllResult]
RequestNodeResponse = Response[RequestNodeResult]
ResolveNodeResponse = Response[ResolveNodeResult]
SetNodeNameResponse = Response[SetNodeNameResult]
GetNodeStackTracesResponse = Response[GetNodeStackTracesResult]
GetFileInfoResponse = Response[GetFileInfoResult]
GetDetachedDomNodesResponse = Response[GetDetachedDomNodesResult]
GetFrameOwnerResponse = Response[GetFrameOwnerResult]
GetContainerForNodeResponse = Response[GetContainerForNodeResult]
GetQueryingDescendantsForContainerResponse = Response[GetQueryingDescendantsForContainerResult]
GetAnchorElementResponse = Response[GetAnchorElementResult]
ForceShowPopoverResponse = Response[ForceShowPopoverResult]


# Command types
# Command[<params type>, <response type>]. Commands without a dedicated result
# use Response[EmptyResponse]; commands without parameters use EmptyParams.
CollectClassNamesFromSubtreeCommand = Command[
    CollectClassNamesFromSubtreeParams, CollectClassNamesFromSubtreeResponse
]
CopyToCommand = Command[CopyToParams, CopyToResponse]
DescribeNodeCommand = Command[DescribeNodeParams, DescribeNodeResponse]
DisableCommand = Command[EmptyParams, Response[EmptyResponse]]
DiscardSearchResultsCommand = Command[DiscardSearchResultsParams, Response[EmptyResponse]]
EnableCommand = Command[EnableParams, Response[EmptyResponse]]
FocusCommand = Command[FocusParams, Response[EmptyResponse]]
ForceShowPopoverCommand = Command[ForceShowPopoverParams, ForceShowPopoverResponse]
GetAnchorElementCommand = Command[GetAnchorElementParams, GetAnchorElementResponse]
GetAttributesCommand = Command[GetAttributesParams, GetAttributesResponse]
GetBoxModelCommand = Command[GetBoxModelParams, GetBoxModelResponse]
GetContainerForNodeCommand = Command[GetContainerForNodeParams, GetContainerForNodeResponse]
GetContentQuadsCommand = Command[GetContentQuadsParams, GetContentQuadsResponse]
# GetDetachedDomNodesResponse is already Response[GetDetachedDomNodesResult];
# pass it directly so the response type is not wrapped in Response twice.
GetDetachedDomNodesCommand = Command[EmptyParams, GetDetachedDomNodesResponse]
GetDocumentCommand = Command[GetDocumentParams, GetDocumentResponse]
GetElementByRelationCommand = Command[GetElementByRelationParams, GetElementByRelationResponse]
GetFileInfoCommand = Command[GetFileInfoParams, GetFileInfoResponse]
GetFlattenedDocumentCommand = Command[GetFlattenedDocumentParams, GetFlattenedDocumentResponse]
GetFrameOwnerCommand = Command[GetFrameOwnerParams, GetFrameOwnerResponse]
GetNodeForLocationCommand = Command[GetNodeForLocationParams, GetNodeForLocationResponse]
GetNodeStackTracesCommand = Command[GetNodeStackTracesParams, GetNodeStackTracesResponse]
GetNodesForSubtreeByStyleCommand = Command[
    GetNodesForSubtreeByStyleParams, GetNodesForSubtreeByStyleResponse
]
GetOuterHTMLCommand = Command[GetOuterHTMLParams, GetOuterHTMLResponse]
GetQueryingDescendantsForContainerCommand = Command[
    GetQueryingDescendantsForContainerParams, GetQueryingDescendantsForContainerResponse
]
GetRelayoutBoundaryCommand = Command[GetRelayoutBoundaryParams, GetRelayoutBoundaryResponse]
GetSearchResultsCommand = Command[GetSearchResultsParams, GetSearchResultsResponse]
GetTopLayerElementsCommand = Command[EmptyParams, GetTopLayerElementsResponse]
HideHighlightCommand = Command[EmptyParams, Response[EmptyResponse]]
# The two highlight commands below are typed with EmptyParams in this module
# (no DOM-specific params TypedDict is declared for them here).
HighlightNodeCommand = Command[EmptyParams, Response[EmptyResponse]]  # redirect to Overlay
HighlightRectCommand = Command[EmptyParams, Response[EmptyResponse]]  # redirect to Overlay
MarkUndoableStateCommand = Command[EmptyParams, Response[EmptyResponse]]
MoveToCommand = Command[MoveToParams, MoveToResponse]
PerformSearchCommand = Command[PerformSearchParams, PerformSearchResponse]
PushNodeByPathToFrontendCommand = Command[
    PushNodeByPathToFrontendParams, PushNodeByPathToFrontendResponse
]
PushNodesByBackendIdsToFrontendCommand = Command[
    PushNodesByBackendIdsToFrontendParams, PushNodesByBackendIdsToFrontendResponse
]
QuerySelectorCommand = Command[QuerySelectorParams, QuerySelectorResponse]
QuerySelectorAllCommand = Command[QuerySelectorAllParams, QuerySelectorAllResponse]
RedoCommand = Command[EmptyParams, Response[EmptyResponse]]
RemoveAttributeCommand = Command[RemoveAttributeParams, Response[EmptyResponse]]
RemoveNodeCommand = Command[RemoveNodeParams, Response[EmptyResponse]]
RequestChildNodesCommand = Command[RequestChildNodesParams, Response[EmptyResponse]]
RequestNodeCommand = Command[RequestNodeParams, RequestNodeResponse]
ResolveNodeCommand = Command[ResolveNodeParams, ResolveNodeResponse]
ScrollIntoViewIfNeededCommand = Command[ScrollIntoViewIfNeededParams, Response[EmptyResponse]]
SetAttributeValueCommand = Command[SetAttributeValueParams, Response[EmptyResponse]]
SetAttributesAsTextCommand = Command[SetAttributesAsTextParams, Response[EmptyResponse]]
SetFileInputFilesCommand = Command[SetFileInputFilesParams, Response[EmptyResponse]]
SetInspectedNodeCommand = Command[SetInspectedNodeParams, Response[EmptyResponse]]
SetNodeNameCommand = Command[SetNodeNameParams, SetNodeNameResponse]
SetNodeStackTracesEnabledCommand = Command[SetNodeStackTracesEnabledParams, Response[EmptyResponse]]
SetNodeValueCommand = Command[SetNodeValueParams, Response[EmptyResponse]]
SetOuterHTMLCommand = Command[SetOuterHTMLParams, Response[EmptyResponse]]
UndoCommand = Command[EmptyParams, Response[EmptyResponse]]


================================================
FILE: pydoll/protocol/dom/types.py
================================================
from enum import Enum
from typing import Annotated, Any

from typing_extensions import TypedDict

# Plain aliases of ``int``: they document intent only and are not distinct
# types to a type checker.
NodeId = int
BackendNodeId = int
# A quad is a flat list of eight floats; the layout is carried as Annotated metadata.
Quad = Annotated[list[float], 'Format: [x1, y1, x2, y2, x3, y3, x4, y4]']


class PseudoType(str, Enum):
    """Pseudo element type.

    Member values are the hyphenated strings below. The enum mixes in ``str``,
    so members compare equal to their raw values.
    """

    FIRST_LINE = 'first-line'
    FIRST_LETTER = 'first-letter'
    CHECKMARK = 'checkmark'
    BEFORE = 'before'
    AFTER = 'after'
    PICKER_ICON = 'picker-icon'
    MARKER = 'marker'
    BACKDROP = 'backdrop'
    COLUMN = 'column'
    SELECTION = 'selection'
    SEARCH_TEXT = 'search-text'
    TARGET_TEXT = 'target-text'
    SPELLING_ERROR = 'spelling-error'
    GRAMMAR_ERROR = 'grammar-error'
    HIGHLIGHT = 'highlight'
    FIRST_LINE_INHERITED = 'first-line-inherited'
    SCROLL_MARKER = 'scroll-marker'
    SCROLL_MARKER_GROUP = 'scroll-marker-group'
    SCROLL_BUTTON = 'scroll-button'
    SCROLLBAR = 'scrollbar'
    SCROLLBAR_THUMB = 'scrollbar-thumb'
    SCROLLBAR_BUTTON = 'scrollbar-button'
    SCROLLBAR_TRACK = 'scrollbar-track'
    SCROLLBAR_TRACK_PIECE = 'scrollbar-track-piece'
    SCROLLBAR_CORNER = 'scrollbar-corner'
    RESIZER = 'resizer'
    INPUT_LIST_BUTTON = 'input-list-button'
    VIEW_TRANSITION = 'view-transition'
    VIEW_TRANSITION_GROUP = 'view-transition-group'
    VIEW_TRANSITION_IMAGE_PAIR = 'view-transition-image-pair'
    VIEW_TRANSITION_GROUP_CHILDREN = 'view-transition-group-children'
    VIEW_TRANSITION_OLD = 'view-transition-old'
    VIEW_TRANSITION_NEW = 'view-transition-new'
    PLACEHOLDER = 'placeholder'
    FILE_SELECTOR_BUTTON = 'file-selector-button'
    DETAILS_CONTENT = 'details-content'
    PICKER = 'picker'
    PERMISSION_ICON = 'permission-icon'


class ShadowRootType(str, Enum):
    """Shadow root type.

    Used as the type of ``Node.shadowRootType``; members are ``str`` instances.
    """

    USER_AGENT = 'user-agent'
    OPEN = 'open'
    CLOSED = 'closed'


class CompatibilityMode(str, Enum):
    """Document compatibility mode.

    Used as the type of ``Node.compatibilityMode``; values are PascalCase strings.
    """

    QUIRKS_MODE = 'QuirksMode'
    LIMITED_QUIRKS_MODE = 'LimitedQuirksMode'
    NO_QUIRKS_MODE = 'NoQuirksMode'


class PhysicalAxes(str, Enum):
    """ContainerSelector physical axes.

    Values are capitalized strings (unlike ``ScrollOrientation``, which is lowercase).
    """

    HORIZONTAL = 'Horizontal'
    VERTICAL = 'Vertical'
    BOTH = 'Both'


class LogicalAxes(str, Enum):
    """ContainerSelector logical axes.

    Values are capitalized strings; members are ``str`` instances.
    """

    INLINE = 'Inline'
    BLOCK = 'Block'
    BOTH = 'Both'


class ScrollOrientation(str, Enum):
    """Physical scroll orientation.

    Values are lowercase strings; members are ``str`` instances.
    """

    HORIZONTAL = 'horizontal'
    VERTICAL = 'vertical'


class IncludeWhitespace(str, Enum):
    """Include whitespace options.

    Members are ``str`` instances with lowercase values.
    """

    NONE = 'none'
    ALL = 'all'


class RelationType(str, Enum):
    """Element relation types.

    Members are ``str`` instances with PascalCase values.
    """

    POPOVER_TARGET = 'PopoverTarget'
    INTEREST_TARGET = 'InterestTarget'
    COMMAND_FOR = 'CommandFor'


class BackendNode(TypedDict):
    """Backend node with a friendly name.

    All keys are required (the TypedDict is total).
    """

    nodeType: int  # numeric node type code
    nodeName: str
    backendNodeId: BackendNodeId


class Node(TypedDict, total=False):
    """DOM interaction is implemented in terms of mirror objects that represent the actual DOM
    nodes.

    Declared with ``total=False``, so every key is optional to the type checker
    and consumers should guard key access. The structure is recursive: several
    keys hold nested ``Node`` values (written as string forward references).
    """

    nodeId: NodeId
    parentId: NodeId
    backendNodeId: BackendNodeId
    nodeType: int
    nodeName: str
    localName: str
    nodeValue: str
    childNodeCount: int
    children: list['Node']
    # NOTE(review): presumably a flat, interleaved name/value list — confirm in CDP docs.
    attributes: list[str]
    documentURL: str
    baseURL: str
    publicId: str
    systemId: str
    internalSubset: str
    xmlVersion: str
    name: str
    value: str
    pseudoType: PseudoType
    pseudoIdentifier: str
    shadowRootType: ShadowRootType
    frameId: str  # typed as plain str here (methods.py uses page.types.FrameId)
    contentDocument: 'Node'
    shadowRoots: list['Node']
    templateContent: 'Node'
    pseudoElements: list['Node']
    importedDocument: 'Node'  # deprecated
    distributedNodes: list[BackendNode]
    isSVG: bool
    compatibilityMode: CompatibilityMode
    assignedSlot: BackendNode
    isScrollable: bool


class DetachedElementInfo(TypedDict):
    """A structure to hold the top-level node of a detached tree and an array of its retained
    descendants.

    Both keys are required (the TypedDict is total).
    """

    treeNode: Node  # top-level node of the detached tree
    retainedNodeIds: list[NodeId]  # ids of the retained descendants


class RGBA(TypedDict, total=False):
    """A structure holding an RGBA color.

    Declared with ``total=False``, so the type checker treats every channel,
    not just ``a``, as optional.
    """

    r: int  # The red component, in the [0-255] range.
    g: int  # The green component, in the [0-255] range.
    b: int  # The blue component, in the [0-255] range.
    a: float  # The alpha component, in the [0-1] range (default: 1).


class BoxModel(TypedDict, total=False):
    """Box model.

    Declared with ``total=False``, so every key is optional to the type checker.
    The four box keys are ``Quad`` values (flat lists of floats).
    """

    content: Quad
    padding: Quad
    border: Quad
    margin: Quad
    width: int
    height: int
    shapeOutside: 'ShapeOutsideInfo'  # forward reference: the class is defined below


class ShapeOutsideInfo(TypedDict):
    """CSS Shape Outside details.

    All keys are required (the TypedDict is total).
    """

    bounds: Quad
    shape: list[Any]  # element types are left unconstrained here
    marginShape: list[Any]  # element types are left unconstrained here


class Rect(TypedDict):
    """Rectangle.

    All four keys are required floats (the TypedDict is total).
    """

    x: float
    y: float
    width: float
    height: float


class CSSComputedStyleProperty(TypedDict):
    """CSS computed style property.

    Both keys are required (the TypedDict is total).
    """

    name: str  # property name
    value: str  # property value


================================================
FILE: pydoll/protocol/emulation/__init__.py
================================================
"""Emulation domain implementation."""


================================================
FILE: pydoll/protocol/emulation/methods.py
================================================
from enum import Enum

from typing_extensions import NotRequired, TypedDict

from pydoll.protocol.base import Command, EmptyResponse, Response
from pydoll.protocol.emulation.types import UserAgentMetadata


class EmulationMethod(str, Enum):
    """Emulation domain method names.

    Only ``setUserAgentOverride`` is declared here. Members are ``str`` instances.
    """

    SET_USER_AGENT_OVERRIDE = 'Emulation.setUserAgentOverride'


class SetUserAgentOverrideParams(TypedDict):
    """Parameters for overriding user agent string.

    ``userAgent`` is required; the remaining keys are marked ``NotRequired``
    and may be omitted.

    See https://chromedevtools.github.io/devtools-protocol/tot/Emulation/#method-setUserAgentOverride
    """

    userAgent: str
    acceptLanguage: NotRequired[str]
    platform: NotRequired[str]
    userAgentMetadata: NotRequired[UserAgentMetadata]


# Command typed with the override params; the response carries no result (EmptyResponse).
SetUserAgentOverrideCommand = Command[SetUserAgentOverrideParams, Response[EmptyResponse]]


================================================
FILE: pydoll/protocol/emulation/types.py
================================================
from enum import Enum

from typing_extensions import NotRequired, TypedDict


class ScreenOrientationType(str, Enum):
    """Orientation type.

    Used as the type of ``ScreenOrientation.type``; values are camelCase strings.
    """

    PORTRAIT_PRIMARY = 'portraitPrimary'
    PORTRAIT_SECONDARY = 'portraitSecondary'
    LANDSCAPE_PRIMARY = 'landscapePrimary'
    LANDSCAPE_SECONDARY = 'landscapeSecondary'


class DisplayFeatureOrientation(str, Enum):
    """Orientation of a display feature in relation to screen.

    Used as the type of ``DisplayFeature.orientation``.
    """

    VERTICAL = 'vertical'
    HORIZONTAL = 'horizontal'


class DevicePostureType(str, Enum):
    """Current posture of the device.

    Used as the type of ``DevicePosture.type``.
    """

    CONTINUOUS = 'continuous'
    FOLDED = 'folded'


class VirtualTimePolicy(str, Enum):
    """Policy controlling how the virtual time base advances.

    - ``advance``: if the scheduler runs out of immediate work, the virtual time
      base may fast forward to allow the next delayed task (if any) to run.
    - ``pause``: the virtual time base may not advance.
    - ``pauseIfNetworkFetchesPending``: the virtual time base may not advance if
      there are any pending resource fetches.
    """

    ADVANCE = 'advance'
    PAUSE = 'pause'
    PAUSE_IF_NETWORK_FETCHES_PENDING = 'pauseIfNetworkFetchesPending'


class SensorType(str, Enum):
    """Used to specify sensor types to emulate.

    See https://w3c.github.io/sensors/#automation for more information.
    Members are ``str`` instances with hyphenated values.
    """

    ABSOLUTE_ORIENTATION = 'absolute-orientation'
    ACCELEROMETER = 'accelerometer'
    AMBIENT_LIGHT = 'ambient-light'
    GRAVITY = 'gravity'
    GYROSCOPE = 'gyroscope'
    LINEAR_ACCELERATION = 'linear-acceleration'
    MAGNETOMETER = 'magnetometer'
    RELATIVE_ORIENTATION = 'relative-orientation'


class PressureSource(str, Enum):
    """Pressure source type.

    Only the ``cpu`` source is declared here.
    """

    CPU = 'cpu'


class PressureState(str, Enum):
    """Pressure state.

    Members are ``str`` instances with lowercase values.
    """

    NOMINAL = 'nominal'
    FAIR = 'fair'
    SERIOUS = 'serious'
    CRITICAL = 'critical'


class DisabledImageType(str, Enum):
    """Enum of image types that can be disabled.

    Members are ``str`` instances with lowercase values.
    """

    AVIF = 'avif'
    WEBP = 'webp'


class SafeAreaInsets(TypedDict, total=False):
    """Safe area insets configuration.

    Declared with ``total=False``, so any subset of the overrides may be given.
    """

    top: int  # Overrides safe-area-inset-top
    topMax: int  # Overrides safe-area-max-inset-top
    left: int  # Overrides safe-area-inset-left
    leftMax: int  # Overrides safe-area-max-inset-left
    bottom: int  # Overrides safe-area-inset-bottom
    bottomMax: int  # Overrides safe-area-max-inset-bottom
    right: int  # Overrides safe-area-inset-right
    rightMax: int  # Overrides safe-area-max-inset-right


class ScreenOrientation(TypedDict):
    """Orientation of the screen: a type plus an angle."""

    # Orientation type
    type: ScreenOrientationType
    # Orientation angle
    angle: int


class DisplayFeature(TypedDict):
    """Description of a display feature: orientation, offset and mask length."""

    # How the display feature is oriented in relation to the screen.
    orientation: DisplayFeatureOrientation
    # Offset from the screen origin, in either the x or y direction.
    offset: int
    # Together with the offset, this length describes the area where a display feature
    # masks content so that it is not physically displayed. A display feature that only
    # splits content has a mask length of 0.
    maskLength: int


class DevicePosture(TypedDict):
    """Wrapper holding the current posture of the device."""

    # Current posture of the device
    type: DevicePostureType


class MediaFeature(TypedDict):
    """A media feature expressed as a name/value pair of strings."""

    name: str
    value: str


class UserAgentBrandVersion(TypedDict):
    """A brand/version pair used when emulating User Agent Client Hints.

    Reference: https://wicg.github.io/ua-client-hints
    """

    brand: str
    version: str


class UserAgentMetadata(TypedDict):
    """User Agent Client Hints values to emulate.

    Reference: https://wicg.github.io/ua-client-hints
    Optional values that are left out will be filled in by the target with what it
    would normally use.
    """

    # Required keys
    platform: str
    platformVersion: str
    architecture: str
    model: str
    mobile: bool

    # Optional keys
    # Brands appearing in Sec-CH-UA
    brands: NotRequired[list[UserAgentBrandVersion]]
    # Brands appearing in Sec-CH-UA-Full-Version-List
    fullVersionList: NotRequired[list[UserAgentBrandVersion]]
    # deprecated
    fullVersion: NotRequired[str]
    bitness: NotRequired[str]
    wow64: NotRequired[bool]
    # Used to specify User Agent form-factor values.
    # See https://wicg.github.io/ua-client-hints/#sec-ch-ua-form-factors
    formFactors: NotRequired[list[str]]


class SensorMetadata(TypedDict, total=False):
    """Metadata describing a sensor; every key is optional."""

    available: bool
    # Frequency bounds, as floats.
    minimumFrequency: float
    maximumFrequency: float


class SensorReadingSingle(TypedDict):
    """Sensor reading made of a single float value."""

    value: float


class SensorReadingXYZ(TypedDict):
    """Sensor reading made of three float components: x, y and z."""

    x: float
    y: float
    z: float


class SensorReadingQuaternion(TypedDict):
    """Sensor reading made of four float components: x, y, z and w."""

    x: float
    y: float
    z: float
    w: float


class SensorReading(TypedDict, total=False):
    """Container for a sensor reading in one of three shapes; every key is optional."""

    # One float value.
    single: 'SensorReadingSingle'
    # Three float components.
    xyz: 'SensorReadingXYZ'
    # Four float components.
    quaternion: 'SensorReadingQuaternion'


class PressureMetadata(TypedDict, total=False):
    """Metadata describing a pressure source; the single key is optional."""

    available: bool


================================================
FILE: pydoll/protocol/fetch/__init__.py
================================================
"""Fetch domain implementation."""


================================================
FILE: pydoll/protocol/fetch/events.py
================================================
from enum import Enum

from typing_extensions import NotRequired, TypedDict

from pydoll.protocol.base import CDPEvent
from pydoll.protocol.fetch.types import AuthChallenge, HeaderEntry
from pydoll.protocol.network.types import ErrorReason, Request, ResourceType


class FetchEvent(str, Enum):
    """
    Event names of the Chrome DevTools Protocol Fetch domain.

    Each member holds the name of a Fetch event as sent by the protocol. These
    events describe network requests that the client can intercept, modify, or
    respond to. The string following each member documents that event's payload.
    """

    AUTH_REQUIRED = 'Fetch.authRequired'
    """
    Issued when the domain is enabled with handleAuthRequests set to true.
    The request is paused until client responds with continueWithAuth.

    Args:
        requestId (RequestId): Each request the page makes will have a unique id.
        request (Network.Request): The details of the request.
        frameId (Page.FrameId): The id of the frame that initiated the request.
        resourceType (Network.ResourceType): How the requested resource will be used.
        authChallenge (AuthChallenge): Details of the Authorization Challenge encountered.
            If this is set, client should respond with continueRequest that contains
            AuthChallengeResponse.
    """

    REQUEST_PAUSED = 'Fetch.requestPaused'
    """
    Issued when the domain is enabled and the request URL matches the specified filter.

    The request is paused until the client responds with one of continueRequest,
    failRequest or fulfillRequest. The stage of the request can be determined by
    presence of responseErrorReason and responseStatusCode -- the request is at the
    response stage if either of these fields is present and in the request stage otherwise.

    Redirect responses and subsequent requests are reported similarly to regular responses
    and requests. Redirect responses may be distinguished by the value of responseStatusCode
    (which is one of 301, 302, 303, 307, 308) along with presence of the location header.
    Requests resulting from a redirect will have redirectedRequestId field set.

    Args:
        requestId (RequestId): Each request the page makes will have a unique id.
        request (Network.Request): The details of the request.
        frameId (Page.FrameId): The id of the frame that initiated the request.
        resourceType (Network.ResourceType): How the requested resource will be used.
        responseErrorReason (Network.ErrorReason): Response error if intercepted at response stage.
        responseStatusCode (int): Response code if intercepted at response stage.
        responseStatusText (str): Response status text if intercepted at response stage.
        responseHeaders (array[HeaderEntry]): Response headers if intercepted at the response stage.
        networkId (Network.RequestId): If the intercepted request had a corresponding
            Network.requestWillBeSent event fired for it, then this networkId will be
            the same as the requestId present in the requestWillBeSent event.
        redirectedRequestId (RequestId): If the request is due to a redirect response
            from the server, the id of the request that has caused the redirect.
    """


class AuthRequiredEventParams(TypedDict):
    """Payload carried by the Fetch.authRequired event; every key is required."""

    # Unique id of the request.
    requestId: str
    # The details of the request.
    request: Request
    # Id of the frame that initiated the request.
    frameId: str
    # How the requested resource will be used.
    resourceType: ResourceType
    # Details of the authorization challenge encountered.
    authChallenge: AuthChallenge


class RequestPausedEventParams(TypedDict):
    """Parameters for the RequestPaused event.

    The first four keys are always declared as required. The remaining keys are only
    present in some situations (interception at the response stage, a matching
    Network.requestWillBeSent event, or a redirect), so they are ``NotRequired``.
    """

    requestId: str  # Each request the page makes has a unique id
    request: Request  # The details of the request
    frameId: str  # The id of the frame that initiated the request
    resourceType: ResourceType  # How the requested resource will be used

    # Response-stage keys: the request is at the response stage if either
    # responseErrorReason or responseStatusCode is present, and at the request
    # stage otherwise.
    responseErrorReason: NotRequired[ErrorReason]
    responseStatusCode: NotRequired[int]
    responseStatusText: NotRequired[str]
    responseHeaders: NotRequired[list[HeaderEntry]]

    # Same value as the requestId of the corresponding Network.requestWillBeSent
    # event, when such an event was fired for the intercepted request.
    networkId: NotRequired[str]
    # Id of the request that caused the redirect, when this request is due to a
    # redirect response from the server.
    redirectedRequestId: NotRequired[str]


# Event envelope types: CDPEvent parameterized with each event's params TypedDict.
AuthRequiredEvent = CDPEvent[AuthRequiredEventParams]
RequestPausedEvent = CDPEvent[RequestPausedEventParams]


================================================
FILE: pydoll/protocol/fetch/methods.py
================================================
from enum import Enum

from typing_extensions import TypedDict

from pydoll.protocol.base import Command, EmptyParams, EmptyResponse, Response
from pydoll.protocol.fetch.types import (
    AuthChallengeResponse,
    HeaderEntry,
    RequestPattern,
)
from pydoll.protocol.io.types import StreamHandle
from pydoll.protocol.network.types import ErrorReason


class FetchMethod(str, Enum):
    """Method names of the Fetch domain, stored as 'Fetch.<method>' strings."""

    CONTINUE_REQUEST = 'Fetch.continueRequest'
    CONTINUE_RESPONSE = 'Fetch.continueResponse'
    CONTINUE_WITH_AUTH = 'Fetch.continueWithAuth'
    DISABLE = 'Fetch.disable'
    ENABLE = 'Fetch.enable'
    FAIL_REQUEST = 'Fetch.failRequest'
    FULFILL_REQUEST = 'Fetch.fulfillRequest'
    GET_RESPONSE_BODY = 'Fetch.getResponseBody'
    TAKE_RESPONSE_BODY_AS_STREAM = 'Fetch.takeResponseBodyAsStream'


RequestId = str  # Alias: request identifiers in this module are plain strings.


# Parameter types
class EnableParams(TypedDict, total=False):
    """Arguments for enabling the Fetch domain; every key is optional."""

    # Request patterns to apply.
    patterns: list[RequestPattern]
    # Flag controlling handling of auth requests.
    handleAuthRequests: bool


class FailRequestParams(TypedDict):
    """Arguments for failing a request; both keys are required."""

    # Id of the request to fail.
    requestId: RequestId
    # Reason reported for the failure.
    errorReason: ErrorReason


class FulfillRequestParams(TypedDict, total=False):
    """Arguments for fulfilling a request (declared with ``total=False``)."""

    requestId: RequestId
    responseCode: int
    responseHeaders: list[HeaderEntry]
    # \0-separated name:value pairs (base64)
    binaryResponseHeaders: str
    # base64 encoded
    body: str
    responsePhrase: str


class ContinueRequestParams(TypedDict, total=False):
    """Arguments for continuing a request (declared with ``total=False``)."""

    requestId: RequestId
    url: str
    method: str
    # base64 encoded
    postData: str
    headers: list[HeaderEntry]
    interceptResponse: bool


class ContinueWithAuthParams(TypedDict):
    """Arguments for continuing a request with authentication; both keys are required."""

    # Id of the request to continue.
    requestId: RequestId
    # Response to the authorization challenge.
    authChallengeResponse: AuthChallengeResponse


class ContinueResponseParams(TypedDict, total=False):
    """Arguments for continuing a response (declared with ``total=False``)."""

    requestId: RequestId
    responseCode: int
    responsePhrase: str
    responseHeaders: list[HeaderEntry]
    # \0-separated name:value pairs (base64)
    binaryResponseHeaders: str


class GetResponseBodyParams(TypedDict):
    """Arguments for fetching a response body: just the request id."""

    requestId: RequestId


class TakeResponseBodyAsStreamParams(TypedDict):
    """Arguments for taking a response body as a stream: just the request id."""

    requestId: RequestId


# Result types
class GetResponseBodyResult(TypedDict):
    """Result payload of the getResponseBody command."""

    # Body content as a string.
    body: str
    # Flag indicating base64 encoding of the body.
    base64Encoded: bool


class TakeResponseBodyAsStreamResult(TypedDict):
    """Result payload of the takeResponseBodyAsStream command."""

    # Handle of the stream holding the body.
    stream: StreamHandle


# Response types
# Response envelopes for the two commands that return a result payload.
TakeResponseBodyAsStreamResponse = Response[TakeResponseBodyAsStreamResult]
GetResponseBodyResponse = Response[GetResponseBodyResult]


# Command types
# Shared response type for commands that return no result payload.
_NoResultResponse = Response[EmptyResponse]

# Commands without a result payload.
ContinueRequestCommand = Command[ContinueRequestParams, _NoResultResponse]
ContinueResponseCommand = Command[ContinueResponseParams, _NoResultResponse]
ContinueWithAuthCommand = Command[ContinueWithAuthParams, _NoResultResponse]
DisableCommand = Command[EmptyParams, _NoResultResponse]
EnableCommand = Command[EnableParams, _NoResultResponse]
FailRequestCommand = Command[FailRequestParams, _NoResultResponse]
FulfillRequestCommand = Command[FulfillRequestParams, _NoResultResponse]

# Commands that return a result payload.
GetResponseBodyCommand = Command[GetResponseBodyParams, GetResponseBodyResponse]
TakeResponseBodyAsStreamCommand = Command[
    TakeResponseBodyAsStreamParams, TakeResponseBodyAsStreamResponse
]


================================================
FILE: pydoll/protocol/fetch/types.py
================================================
from enum import Enum

from typing_extensions import NotRequired, TypedDict

from pydoll.protocol.network.types import ResourceType


class RequestStage(str, Enum):
    """Stage of a request at which it should be handled."""

    REQUEST = 'Request'
    RESPONSE = 'Response'


class AuthChallengeSource(str, Enum):
    """Where an authentication challenge comes from."""

    SERVER = 'Server'
    PROXY = 'Proxy'


class AuthChallengeResponseType(str, Enum):
    """Decision on how to react to an authorization challenge."""

    DEFAULT = 'Default'
    CANCEL_AUTH = 'CancelAuth'
    PROVIDE_CREDENTIALS = 'ProvideCredentials'


class RequestPattern(TypedDict, total=False):
    """Pattern selecting which requests are intercepted; every key is optional."""

    # Wildcards allowed. Omitting is equivalent to "*".
    urlPattern: str
    resourceType: ResourceType
    requestStage: RequestStage


class HeaderEntry(TypedDict):
    """One response HTTP header as a name/value pair of strings."""

    name: str
    value: str


class AuthChallenge(TypedDict):
    """Authorization challenge issued for HTTP status code 401 or 407."""

    # Optional key: source of the challenge.
    source: NotRequired[AuthChallengeSource]
    # Required keys.
    origin: str
    # e.g. basic, digest
    scheme: str
    realm: str


class AuthChallengeResponse(TypedDict):
    """Answer given to an AuthChallenge."""

    # Required: the decision taken.
    response: AuthChallengeResponseType
    # Optional credentials.
    username: NotRequired[str]
    password: NotRequired[str]


================================================
FILE: pydoll/protocol/input/__init__.py
================================================
"""Input domain implementation."""


================================================
FILE: pydoll/protocol/input/events.py
================================================
from enum import Enum

from typing_extensions import TypedDict

from pydoll.protocol.base import CDPEvent
from pydoll.protocol.input.types import DragData


class InputEvent(str, Enum):
    """
    Event names of the Chrome DevTools Protocol Input domain.

    Each member holds the name of an Input event as sent by the protocol. These
    events describe user input interactions that can be intercepted or simulated.
    The string following each member documents that event's payload.
    """

    DRAG_INTERCEPTED = 'Input.dragIntercepted'
    """
    Emitted only when Input.setInterceptDrags is enabled. Use this data with
    Input.dispatchDragEvent to restore normal drag and drop behavior.

    Args:
        data (DragData): Contains information about the dragged data.
    """


class DragInterceptedEventParams(TypedDict):
    """Payload carried by the dragIntercepted event."""

    # Information about the dragged data.
    data: DragData


# Event envelope type: CDPEvent parameterized with the dragIntercepted params.
DragInterceptedEvent = CDPEvent[DragInterceptedEventParams]


================================================
FILE: pydoll/protocol/input/methods.py
================================================
from enum import Enum

from typing_extensions import NotRequired, TypedDict

from pydoll.protocol.base import Command, EmptyParams, EmptyResponse, Response
from pydoll.protocol.input.types import (
    DragData,
    DragEventType,
    GestureSourceType,
    KeyEventType,
    MouseButton,
    MouseEventType,
    PointerType,
    TimeSinceEpoch,
    TouchEventType,
    TouchPoint,
)


class InputMethod(str, Enum):
    """Method names of the Input domain, stored as 'Input.<method>' strings."""

    CANCEL_DRAGGING = 'Input.cancelDragging'
    DISPATCH_KEY_EVENT = 'Input.dispatchKeyEvent'
    DISPATCH_MOUSE_EVENT = 'Input.dispatchMouseEvent'
    DISPATCH_TOUCH_EVENT = 'Input.dispatchTouchEvent'
    SET_IGNORE_INPUT_EVENTS = 'Input.setIgnoreInputEvents'
    DISPATCH_DRAG_EVENT = 'Input.dispatchDragEvent'
    EMULATE_TOUCH_FROM_MOUSE_EVENT = 'Input.emulateTouchFromMouseEvent'
    IME_SET_COMPOSITION = 'Input.imeSetComposition'
    INSERT_TEXT = 'Input.insertText'
    SET_INTERCEPT_DRAGS = 'Input.setInterceptDrags'
    SYNTHESIZE_PINCH_GESTURE = 'Input.synthesizePinchGesture'
    SYNTHESIZE_SCROLL_GESTURE = 'Input.synthesizeScrollGesture'
    SYNTHESIZE_TAP_GESTURE = 'Input.synthesizeTapGesture'


class CancelDraggingParams(TypedDict):
    """Arguments for the cancelDragging command: it declares no keys."""


class DispatchDragEventParams(TypedDict):
    """Arguments for the dispatchDragEvent command."""

    # Required keys
    type: DragEventType
    x: float
    y: float
    data: DragData

    # Optional keys
    modifiers: NotRequired[int]


class DispatchKeyEventParams(TypedDict):
    """Arguments for the dispatchKeyEvent command."""

    # Required keys
    type: KeyEventType

    # Optional keys
    modifiers: NotRequired[int]
    timestamp: NotRequired[TimeSinceEpoch]
    text: NotRequired[str]
    unmodifiedText: NotRequired[str]
    keyIdentifier: NotRequired[str]
    code: NotRequired[str]
    key: NotRequired[str]
    windowsVirtualKeyCode: NotRequired[int]
    nativeVirtualKeyCode: NotRequired[int]
    autoRepeat: NotRequired[bool]
    isKeypad: NotRequired[bool]
    isSystemKey: NotRequired[bool]
    location: NotRequired[int]
    commands: NotRequired[list[str]]


class DispatchMouseEventParams(TypedDict):
    """Arguments for the dispatchMouseEvent command."""

    # Required keys
    type: MouseEventType
    x: float
    y: float

    # Optional keys
    modifiers: NotRequired[int]
    timestamp: NotRequired[TimeSinceEpoch]
    button: NotRequired[MouseButton]
    buttons: NotRequired[int]
    clickCount: NotRequired[int]
    force: NotRequired[float]
    tangentialPressure: NotRequired[float]
    tiltX: NotRequired[float]
    tiltY: NotRequired[float]
    twist: NotRequired[int]
    deltaX: NotRequired[float]
    deltaY: NotRequired[float]
    pointerType: NotRequired[PointerType]


class DispatchTouchEventParams(TypedDict):
    """Arguments for the dispatchTouchEvent command."""

    # Required keys
    type: TouchEventType
    touchPoints: list[TouchPoint]

    # Optional keys
    modifiers: NotRequired[int]
    timestamp: NotRequired[TimeSinceEpoch]


class EmulateTouchFromMouseEventParams(TypedDict):
    """Arguments for the emulateTouchFromMouseEvent command."""

    # Required keys (note that x and y are integers here)
    type: MouseEventType
    x: int
    y: int
    button: MouseButton

    # Optional keys
    timestamp: NotRequired[TimeSinceEpoch]
    deltaX: NotRequired[float]
    deltaY: NotRequired[float]
    modifiers: NotRequired[int]
    clickCount: NotRequired[int]


class ImeSetCompositionParams(TypedDict):
    """Parameters for imeSetComposition command."""

    text: str
    selectionStart: int
    selectionEnd: int
    replacementStart: NotRequired[int]
    replacementEnd: NotRequired[int]


class InsertTextParams(TypedDict):
    """Arguments for the insertText command: the text to insert."""

    text: str


class SetIgnoreInputEventsParams(TypedDict):
    """Arguments for the setIgnoreInputEvents command: a single boolean flag."""

    ignore: bool


class SetInterceptDragsParams(TypedDict):
    """Arguments for the setInterceptDrags command: a single boolean flag."""

    enabled: bool


class SynthesizePinchGestureParams(TypedDict):
    """Arguments for the synthesizePinchGesture command."""

    # Required keys
    x: float
    y: float
    scaleFactor: float

    # Optional keys
    relativeSpeed: NotRequired[int]
    gestureSourceType: NotRequired[GestureSourceType]


class SynthesizeScrollGestureParams(TypedDict):
    """Arguments for the synthesizeScrollGesture command."""

    # Required keys
    x: float
    y: float

    # Optional keys
    xDistance: NotRequired[float]
    yDistance: NotRequired[float]
    xOverscroll: NotRequired[float]
    yOverscroll: NotRequired[float]
    preventFling: NotRequired[bool]
    speed: NotRequired[int]
    gestureSourceType: NotRequired[GestureSourceType]
    repeatCount: NotRequired[int]
    repeatDelayMs: NotRequired[int]
    interactionMarkerName: NotRequired[str]


class SynthesizeTapGestureParams(TypedDict):
    """Arguments for the synthesizeTapGesture command."""

    # Required keys
    x: float
    y: float

    # Optional keys
    duration: NotRequired[int]
    tapCount: NotRequired[int]
    gestureSourceType: NotRequired[GestureSourceType]


# Command types
# Every Input command declared here returns no result payload, so they all share
# this response type.
_NoResultResponse = Response[EmptyResponse]

CancelDraggingCommand = Command[EmptyParams, _NoResultResponse]
DispatchDragEventCommand = Command[DispatchDragEventParams, _NoResultResponse]
DispatchKeyEventCommand = Command[DispatchKeyEventParams, _NoResultResponse]
DispatchMouseEventCommand = Command[DispatchMouseEventParams, _NoResultResponse]
DispatchTouchEventCommand = Command[DispatchTouchEventParams, _NoResultResponse]
EmulateTouchFromMouseEventCommand = Command[EmulateTouchFromMouseEventParams, _NoResultResponse]
ImeSetCompositionCommand = Command[ImeSetCompositionParams, _NoResultResponse]
InsertTextCommand = Command[InsertTextParams, _NoResultResponse]
SetIgnoreInputEventsCommand = Command[SetIgnoreInputEventsParams, _NoResultResponse]
SetInterceptDragsCommand = Command[SetInterceptDragsParams, _NoResultResponse]
SynthesizePinchGestureCommand = Command[SynthesizePinchGestureParams, _NoResultResponse]
SynthesizeScrollGestureCommand = Command[SynthesizeScrollGestureParams, _NoResultResponse]
SynthesizeTapGestureCommand = Command[SynthesizeTapGestureParams, _NoResultResponse]


================================================
FILE: pydoll/protocol/input/types.py
================================================
from enum import Enum

from typing_extensions import NotRequired, TypedDict

TimeSinceEpoch = float  # Alias: timestamps of this kind are plain floats.


class GestureSourceType(str, Enum):
    """Kinds of input source a gesture can be attributed to."""

    DEFAULT = 'default'
    TOUCH = 'touch'
    MOUSE = 'mouse'


class MouseButton(str, Enum):
    """Mouse buttons, including the 'none' value."""

    NONE = 'none'
    LEFT = 'left'
    MIDDLE = 'middle'
    RIGHT = 'right'
    BACK = 'back'
    FORWARD = 'forward'


class DragEventType(str, Enum):
    """Kinds of drag event."""

    DRAG_ENTER = 'dragEnter'
    DRAG_OVER = 'dragOver'
    DROP = 'drop'
    DRAG_CANCEL = 'dragCancel'


class KeyEventType(str, Enum):
    """Kinds of key event."""

    KEY_DOWN = 'keyDown'
    KEY_UP = 'keyUp'
    RAW_KEY_DOWN = 'rawKeyDown'
    CHAR = 'char'


class MouseEventType(str, Enum):
    """Kinds of mouse event."""

    MOUSE_PRESSED = 'mousePressed'
    MOUSE_RELEASED = 'mouseReleased'
    MOUSE_MOVED = 'mouseMoved'
    MOUSE_WHEEL = 'mouseWheel'


class TouchEventType(str, Enum):
    """Kinds of touch event."""

    TOUCH_START = 'touchStart'
    TOUCH_END = 'touchEnd'
    TOUCH_MOVE = 'touchMove'
    TOUCH_CANCEL = 'touchCancel'


class KeyModifier(int, Enum):
    """Integer values for the keyboard modifier keys.

    Each value is a distinct power of two.
    NOTE(review): presumably these are OR-ed together into the integer ``modifiers``
    field of the input event params -- confirm against callers.
    """

    ALT = 1
    CTRL = 2
    META = 4
    SHIFT = 8


class KeyLocation(int, Enum):
    """Integer values distinguishing left from right.

    NOTE(review): presumably meant for the integer ``location`` field of the key event
    params -- confirm against callers.
    """

    LEFT = 1
    RIGHT = 2


class PointerType(str, Enum):
    """Kinds of pointer device."""

    MOUSE = 'mouse'
    PEN = 'pen'


class TouchPoint(TypedDict):
    """Touch point data."""

    x: float
    y: float
    radiusX: NotRequired[float]
    radiusY: NotRequired[float]
    rotationAngle: NotRequired[float]
    force: NotRequired[float]
    tangentialPressure: NotRequired[float]
    tiltX: NotRequired[float]
    tiltY: NotRequired[float]
    twist: NotRequired[int]
    id: NotRequired[float]


class DragDataItem(TypedDict):
    """Drag data item."""

    mimeType: str
    data: str
    title: NotRequired[str]
    baseURL: NotRequired[str]


class DragData(TypedDict):
    """Data carried by a drag operation."""

    # Required keys
    items: list[DragDataItem]
    dragOperationsMask: int

    # Optional keys
    files: NotRequired[list[str]]


================================================
FILE: pydoll/protocol/io/types.py
================================================
StreamHandle = str  # Alias: stream handles are plain strings.


================================================
FILE: pydoll/protocol/network/__init__.py
================================================
"""Network domain implementation."""


================================================
FILE: pydoll/protocol/network/events.py
================================================
from enum import Enum

from typing_extensions import NotRequired, TypedDict

from pydoll.protocol.base import CDPEvent
from pydoll.protocol.network.types import (
    AssociatedCookie,
    AuthChallenge,
    BlockedReason,
    BlockedSetCookieWithReason,
    ClientSecurityState,
    ConnectTiming,
    CookiePartitionKey,
    CorsErrorStatus,
    DirectTCPSocketOptions,
    DirectUDPMessage,
    DirectUDPSocketOptions,
    ErrorReason,
    ExemptedSetCookieWithReason,
    Headers,
    Initiator,
    InterceptionId,
    IPAddressSpace,
    LoaderId,
    MonotonicTime,
    ReportingApiEndpoint,
    ReportingApiReport,
    Request,
    RequestId,
    ResourcePriority,
    ResourceType,
    Response,
    SignedExchangeInfo,
    TimeSinceEpoch,
    TrustTokenOperationType,
    WebSocketFrame,
    WebSocketRequest,
    WebSocketResponse,
)


class NetworkEvent(str, Enum):
    """
    Events from the Network domain of the Chrome DevTools Protocol.

    This enumeration contains the names of Network-related events that can be
    received from the Chrome DevTools Protocol. These events provide information
    about network activities, such as requests, responses, and WebSocket communications.
    """

    DATA_RECEIVED = 'Network.dataReceived'
    """
    Fired when data chunk was received over the network.

    Args:
        requestId (RequestId): Request identifier.
        timestamp (MonotonicTime): Timestamp.
        dataLength (int): Data chunk length.
        encodedDataLength (int): Actual bytes received (might be less than dataLength
            for compressed encodings).
        data (str): Data that was received. (Encoded as a base64 string when passed over JSON)
    """

    EVENT_SOURCE_MESSAGE_RECEIVED = 'Network.eventSourceMessageReceived'
    """
    Fired when EventSource message is received.

    Args:
        requestId (RequestId): Request identifier.
        timestamp (MonotonicTime): Timestamp.
        eventName (str): Message type.
        eventId (str): Message identifier.
        data (str): Message content.
    """

    LOADING_FAILED = 'Network.loadingFailed'
    """
    Fired when HTTP request has failed to load.

    Args:
        requestId (RequestId): Request identifier.
        timestamp (MonotonicTime): Timestamp.
        type (ResourceType): Resource type.
        errorText (str): Error message. List of network errors: https://cs.chromium.org/chromium/src/net/base/net_error_list.h
        canceled (bool): True if loading was canceled.
        blockedReason (BlockedReason): The reason why loading was blocked, if any.
        corsErrorStatus (CorsErrorStatus): The reason why loading was blocked by CORS, if any.
    """

    LOADING_FINISHED = 'Network.loadingFinished'
    """
    Fired when HTTP request has finished loading.

    Args:
        requestId (RequestId): Request identifier.
        timestamp (MonotonicTime): Timestamp.
        encodedDataLength (number): Total number of bytes received for this request.
    """

    REQUEST_SERVED_FROM_CACHE = 'Network.requestServedFromCache'
    """
    Fired if request ended up loading from cache.

    Args:
        requestId (RequestId): Request identifier.
    """

    REQUEST_WILL_BE_SENT = 'Network.requestWillBeSent'
    """
    Fired when page is about to send HTTP request.

    Args:
        requestId (RequestId): Request identifier.
        loaderId (LoaderId): Loader identifier. Empty string if the request is fetched from worker.
        documentURL (str): URL of the document this request is loaded for.
        request (Request): Request data.
        timestamp (MonotonicTime): Timestamp.
        wallTime (TimeSinceEpoch): Timestamp.
        initiator (Initiator): Request initiator.
        redirectHasExtraInfo (bool): In the case that redirectResponse is populated, this flag
            indicates whether requestWillBeSentExtraInfo and responseReceivedExtraInfo events
            will be or were emitted for the request which was just redirected.
        redirectResponse (Response): Redirect response data.
        type (ResourceType): Type of this resource.
        frameId (Page.FrameId): Frame identifier.
        hasUserGesture (bool): Whether the request is initiated by a user gesture.
            Defaults to false.
    """

    RESPONSE_RECEIVED = 'Network.responseReceived'
    """
    Fired when HTTP response is available.

    Args:
        requestId (RequestId): Request identifier.
        loaderId (LoaderId): Loader identifier. Empty string if the request is fetched from worker.
        timestamp (MonotonicTime): Timestamp.
        type (ResourceType): Resource type.
        response (Response): Response data.
        hasExtraInfo (bool): Indicates whether requestWillBeSentExtraInfo and
            responseReceivedExtraInfo events will be or were emitted for this request.
        frameId (Page.FrameId): Frame identifier.
    """

    WEBSOCKET_CLOSED = 'Network.webSocketClosed'
    """
    Fired when WebSocket is closed.

    Args:
        requestId (RequestId): Request identifier.
        timestamp (MonotonicTime): Timestamp.
    """

    WEBSOCKET_CREATED = 'Network.webSocketCreated'
    """
    Fired upon WebSocket creation.

    Args:
        requestId (RequestId): Request identifier.
        url (str): WebSocket request URL.
        initiator (Initiator): Request initiator.
    """

    WEBSOCKET_FRAME_ERROR = 'Network.webSocketFrameError'
    """
    Fired when WebSocket message error occurs.

    Args:
        requestId (RequestId): Request identifier.
        timestamp (MonotonicTime): Timestamp.
        errorMessage (str): WebSocket error message.
    """

    WEBSOCKET_FRAME_RECEIVED = 'Network.webSocketFrameReceived'
    """
    Fired when WebSocket message is received.

    Args:
        requestId (RequestId): Request identifier.
        timestamp (MonotonicTime): Timestamp.
        response (WebSocketFrame): WebSocket response data.
    """

    WEBSOCKET_FRAME_SENT = 'Network.webSocketFrameSent'
    """
    Fired when WebSocket message is sent.

    Args:
        requestId (RequestId): Request identifier.
        timestamp (MonotonicTime): Timestamp.
        response (WebSocketFrame): WebSocket response data.
    """

    WEBSOCKET_HANDSHAKE_RESPONSE_RECEIVED = 'Network.webSocketHandshakeResponseReceived'
    """
    Fired when WebSocket handshake response becomes available.

    Args:
        requestId (RequestId): Request identifier.
        timestamp (MonotonicTime): Timestamp.
        response (WebSocketResponse): WebSocket response data.
    """

    WEBSOCKET_WILL_SEND_HANDSHAKE_REQUEST = 'Network.webSocketWillSendHandshakeRequest'
    """
    Fired when WebSocket is about to initiate handshake.

    Args:
        requestId (RequestId): Request identifier.
        timestamp (MonotonicTime): Timestamp.
        wallTime (TimeSinceEpoch): UTC Timestamp.
        request (WebSocketRequest): WebSocket request data.
    """

    WEBTRANSPORT_CLOSED = 'Network.webTransportClosed'
    """
    Fired when WebTransport is disposed.

    Args:
        transportId (RequestId): WebTransport identifier.
        timestamp (MonotonicTime): Timestamp.
    """

    WEBTRANSPORT_CONNECTION_ESTABLISHED = 'Network.webTransportConnectionEstablished'
    """
    Fired when WebTransport handshake is finished.

    Args:
        transportId (RequestId): WebTransport identifier.
        timestamp (MonotonicTime): Timestamp.
    """

    WEBTRANSPORT_CREATED = 'Network.webTransportCreated'
    """
    Fired upon WebTransport creation.

    Args:
        transportId (RequestId): WebTransport identifier.
        url (str): WebTransport request URL.
        timestamp (MonotonicTime): Timestamp.
        initiator (Initiator): Request initiator.
    """

    DIRECT_TCP_SOCKET_ABORTED = 'Network.directTCPSocketAborted'
    """
    Fired when direct_socket.TCPSocket is aborted.

    Args:
        identifier (RequestId): Request identifier.
        errorMessage (str): Error message.
        timestamp (MonotonicTime): Timestamp.
    """

    DIRECT_TCP_SOCKET_CHUNK_RECEIVED = 'Network.directTCPSocketChunkReceived'
    """
    Fired when data is received from tcp direct socket stream.

    Args:
        identifier (RequestId): Request identifier.
        data (str): Data received.
        timestamp (MonotonicTime): Timestamp.
    """

    DIRECT_TCP_SOCKET_CHUNK_SENT = 'Network.directTCPSocketChunkSent'
    """
    Fired when data is sent to tcp direct socket stream.

    Args:
        identifier (RequestId): Request identifier.
        data (str): Data sent.
        timestamp (MonotonicTime): Timestamp.
    """

    DIRECT_TCP_SOCKET_CLOSED = 'Network.directTCPSocketClosed'
    """
    Fired when direct_socket.TCPSocket is closed.

    Args:
        identifier (RequestId): Request identifier.
        timestamp (MonotonicTime): Timestamp.
    """

    DIRECT_TCP_SOCKET_CREATED = 'Network.directTCPSocketCreated'
    """
    Fired upon direct_socket.TCPSocket creation.

    Args:
        identifier (RequestId): Request identifier.
        remoteAddr (str): Remote address.
        remotePort (int): Remote port. Unsigned int 16.
        options (DirectTCPSocketOptions): Socket options.
        timestamp (MonotonicTime): Timestamp.
        initiator (Initiator): Request initiator.
    """

    DIRECT_TCP_SOCKET_OPENED = 'Network.directTCPSocketOpened'
    """
    Fired when direct_socket.TCPSocket connection is opened.

    Args:
        identifier (RequestId): Request identifier.
        remoteAddr (str): Remote address.
        remotePort (int): Remote port. Expected to be unsigned integer.
        timestamp (MonotonicTime): Timestamp.
        localAddr (str): Local address.
        localPort (int): Local port. Expected to be unsigned integer.
    """

    DIRECT_UDP_SOCKET_ABORTED = 'Network.directUDPSocketAborted'
    """
    Fired when direct_socket.UDPSocket is aborted.

    Args:
        identifier (RequestId): Request identifier.
        errorMessage (str): Error message.
        timestamp (MonotonicTime): Timestamp.
    """

    DIRECT_UDP_SOCKET_CHUNK_RECEIVED = 'Network.directUDPSocketChunkReceived'
    """
    Fired when message is received from udp direct socket stream.

    Args:
        identifier (RequestId): Request identifier.
        message (DirectUDPMessage): Message data.
        timestamp (MonotonicTime): Timestamp.
    """

    DIRECT_UDP_SOCKET_CHUNK_SENT = 'Network.directUDPSocketChunkSent'
    """
    Fired when message is sent to udp direct socket stream.

    Args:
        identifier (RequestId): Request identifier.
        message (DirectUDPMessage): Message data.
        timestamp (MonotonicTime): Timestamp.
    """

    DIRECT_UDP_SOCKET_CLOSED = 'Network.directUDPSocketClosed'
    """
    Fired when direct_socket.UDPSocket is closed.

    Args:
        identifier (RequestId): Request identifier.
        timestamp (MonotonicTime): Timestamp.
    """

    DIRECT_UDP_SOCKET_CREATED = 'Network.directUDPSocketCreated'
    """
    Fired upon direct_socket.UDPSocket creation.

    Args:
        identifier (RequestId): Request identifier.
        options (DirectUDPSocketOptions): Socket options.
        timestamp (MonotonicTime): Timestamp.
        initiator (Initiator): Request initiator.
    """

    DIRECT_UDP_SOCKET_OPENED = 'Network.directUDPSocketOpened'
    """
    Fired when direct_socket.UDPSocket connection is opened.

    Args:
        identifier (RequestId): Request identifier.
        localAddr (str): Local address.
        localPort (int): Local port. Expected to be unsigned integer.
        timestamp (MonotonicTime): Timestamp.
        remoteAddr (str): Remote address.
        remotePort (int): Remote port. Expected to be unsigned integer.
    """

    POLICY_UPDATED = 'Network.policyUpdated'
    """
    Fired once security policy has been updated.
    """

    REPORTING_API_ENDPOINTS_CHANGED_FOR_ORIGIN = 'Network.reportingApiEndpointsChangedForOrigin'
    """
    Fired when Reporting API endpoints change for an origin.

    Args:
        origin (str): Origin of the document(s) which configured the endpoints.
        endpoints (array[ReportingApiEndpoint]): The endpoints configured for the origin.
    """

    REPORTING_API_REPORT_ADDED = 'Network.reportingApiReportAdded'
    """
    Is sent whenever a new report is added. And after 'enableReportingApi' for all existing reports.

    Args:
        report (ReportingApiReport): The report that was added.
    """

    REPORTING_API_REPORT_UPDATED = 'Network.reportingApiReportUpdated'
    """
    Fired when a report is updated.

    Args:
        report (ReportingApiReport): The report that was updated.
    """

    REQUEST_WILL_BE_SENT_EXTRA_INFO = 'Network.requestWillBeSentExtraInfo'
    """
    Fired when additional information about a requestWillBeSent event is available from the network
    stack.
    Not every requestWillBeSent event will have an additional requestWillBeSentExtraInfo fired for
    it, and there is no guarantee whether requestWillBeSent or requestWillBeSentExtraInfo will be
    fired first for the same request.

    Args:
        requestId (RequestId): Request identifier. Used to match this information to an existing
            requestWillBeSent event.
        associatedCookies (array[AssociatedCookie]): A list of cookies potentially associated to
            the requested URL. This includes both cookies sent with the request and the ones
            not sent; the latter are distinguished by having blockedReasons field set.
        headers (Headers): Raw request headers as they will be sent over the wire.
        connectTiming (ConnectTiming): Connection timing information for the request.
        clientSecurityState (ClientSecurityState): The client security state set for the request.
        siteHasCookieInOtherPartition (bool): Whether the site has partitioned cookies stored
            in a partition different than the current one.
    """

    RESOURCE_CHANGED_PRIORITY = 'Network.resourceChangedPriority'
    """
    Fired when resource loading priority is changed.

    Args:
        requestId (RequestId): Request identifier.
        newPriority (ResourcePriority): New priority.
        timestamp (MonotonicTime): Timestamp.
    """

    RESPONSE_RECEIVED_EARLY_HINTS = 'Network.responseReceivedEarlyHints'
    """
    Fired when 103 Early Hints headers are received in addition to the common response.
    Not every responseReceived event will have a responseReceivedEarlyHints fired.
    Only one responseReceivedEarlyHints may be fired for each responseReceived event.

    Args:
        requestId (RequestId): Request identifier. Used to match this information to another
            responseReceived event.
        headers (Headers): Raw response headers as they were received over the wire. Duplicate
            headers in the response are represented as a single key with their values
            concatenated using \\n as the separator. See also headersText that contains
            verbatim text for HTTP/1.*.
    """

    RESPONSE_RECEIVED_EXTRA_INFO = 'Network.responseReceivedExtraInfo'
    """
    Fired when additional information about a responseReceived event is available from the
    network stack.
    Not every responseReceived event will have an additional responseReceivedExtraInfo for it,
    and responseReceivedExtraInfo may be fired before or after responseReceived.

    Args:
        requestId (RequestId): Request identifier. Used to match this information to another
            responseReceived event.
        blockedCookies (array[BlockedSetCookieWithReason]): A list of cookies which were
            not stored from the response along with the corresponding reasons for blocking.
            The cookies here may not be valid due to syntax errors, which are represented by
            the invalid cookie line string instead of a proper cookie.
        headers (Headers): Raw response headers as they were received over the wire. Duplicate
            headers in the response are represented as a single key with their values concatenated
            using \\n as the separator. See also headersText that contains verbatim
            text for HTTP/1.*.
        resourceIPAddressSpace (IPAddressSpace): The IP address space of the resource. The address
            space can only be determined once the transport established the connection, so we
            can't send it in requestWillBeSentExtraInfo.
        statusCode (int): The status code of the response. This is useful in cases the request
            failed and no responseReceived event is triggered, which is the case for, e.g.,
            CORS errors. This is also the correct status code for cached requests, where the
            status in responseReceived is a 200 and this will be 304.
        headersText (str): Raw response header text as it was received over the wire. The raw text
            may not always be available, such as in the case of HTTP/2 or QUIC.
        cookiePartitionKey (CookiePartitionKey): The cookie partition key that will be used to
            store partitioned cookies set in this response. Only sent when partitioned
            cookies are enabled.
        cookiePartitionKeyOpaque (bool): True if partitioned cookies are enabled, but the
            partition key is not serializable to string.
        exemptedCookies (array[ExemptedSetCookieWithReason]): A list of cookies which should have
            been blocked by 3PCD but are exempted and stored from the response with the
            corresponding reason.
    """

    SIGNED_EXCHANGE_RECEIVED = 'Network.signedExchangeReceived'
    """
    Fired when a signed exchange was received over the network.

    Args:
        requestId (RequestId): Request identifier.
        info (SignedExchangeInfo): Information about the signed exchange response.
    """

    SUBRESOURCE_WEB_BUNDLE_INNER_RESPONSE_ERROR = 'Network.subresourceWebBundleInnerResponseError'
    """
    Fired when request for resources within a .wbn file failed.

    Args:
        innerRequestId (RequestId): Request identifier of the subresource request.
        innerRequestURL (str): URL of the subresource resource.
        errorMessage (str): Error message.
        bundleRequestId (RequestId): Bundle request identifier. Used to match this information
            to another event. This may be absent in case when the instrumentation was enabled
            only after webbundle was parsed.
    """

    SUBRESOURCE_WEB_BUNDLE_INNER_RESPONSE_PARSED = 'Network.subresourceWebBundleInnerResponseParsed'
    """
    Fired when handling requests for resources within a .wbn file.
    Note: this will only be fired for resources that are requested by the webpage.

    Args:
        innerRequestId (RequestId): Request identifier of the subresource request.
        innerRequestURL (str): URL of the subresource resource.
        bundleRequestId (RequestId): Bundle request identifier. Used to match this information
            to another event. This may be absent in case when the instrumentation was enabled
            only after webbundle was parsed.
    """

    SUBRESOURCE_WEB_BUNDLE_METADATA_ERROR = 'Network.subresourceWebBundleMetadataError'
    """
    Fired once when parsing the .wbn file has failed.

    Args:
        requestId (RequestId): Request identifier. Used to match this information to another event.
        errorMessage (str): Error message.
    """

    SUBRESOURCE_WEB_BUNDLE_METADATA_RECEIVED = 'Network.subresourceWebBundleMetadataReceived'
    """
    Fired once when parsing the .wbn file has succeeded. The event contains the information
    about the web bundle contents.

    Args:
        requestId (RequestId): Request identifier. Used to match this information to another event.
        urls (array[str]): A list of URLs of resources in the subresource Web Bundle.
    """

    TRUST_TOKEN_OPERATION_DONE = 'Network.trustTokenOperationDone'
    """
    Fired exactly once for each Trust Token operation. Depending on the type of the operation
    and whether the operation succeeded or failed, the event is fired before the corresponding
    request was sent or after the response was received.

    Args:
        status (str): Detailed success or error status of the operation.
            Allowed Values: Ok, InvalidArgument, MissingIssuerKeys, FailedPrecondition,
            ResourceExhausted, AlreadyExists, ResourceLimited, Unauthorized, BadResponse,
            InternalError, UnknownError, FulfilledLocally, SiteIssuerLimit
        type (TrustTokenOperationType): Type of Trust Token operation.
        requestId (RequestId): Request identifier.
        topLevelOrigin (str): Top level origin. The context in which the operation was attempted.
        issuerOrigin (str): Origin of the issuer in case of a "Issuance" or "Redemption" operation.
        issuedTokenCount (int): The number of obtained Trust Tokens on a successful
            "Issuance" operation.
    """


class DataReceivedEventParams(TypedDict):
    """Params payload wrapped by ``DataReceivedEvent``.

    Every key is required except ``data``.
    """

    # Required keys.
    requestId: RequestId
    timestamp: MonotonicTime
    dataLength: int
    encodedDataLength: int
    # Optional key.
    data: NotRequired[str]


class EventSourceMessageReceivedEventParams(TypedDict):
    """Params payload wrapped by ``EventSourceMessageReceivedEvent``.

    All keys are required.
    """

    requestId: RequestId
    timestamp: MonotonicTime
    # Message fields, all plain strings.
    eventName: str
    eventId: str
    data: str


class LoadingFailedEventParams(TypedDict):
    """Params payload wrapped by ``LoadingFailedEvent``.

    ``canceled``, ``blockedReason`` and ``corsErrorStatus`` may be omitted.
    """

    # Required keys.
    requestId: RequestId
    timestamp: MonotonicTime
    type: ResourceType
    errorText: str
    # Optional keys.
    canceled: NotRequired[bool]
    blockedReason: NotRequired[BlockedReason]
    corsErrorStatus: NotRequired[CorsErrorStatus]


class LoadingFinishedEventParams(TypedDict):
    """Params payload wrapped by ``LoadingFinishedEvent``.

    All keys are required.
    """

    requestId: RequestId
    timestamp: MonotonicTime
    # Declared as float here, unlike the int lengths on DataReceivedEventParams.
    encodedDataLength: float


class RequestInterceptedEventParams(TypedDict):
    """Params payload wrapped by ``RequestInterceptedEvent``.

    The first five keys are required; everything from ``isDownload`` onward
    may be omitted.
    """

    # Required keys.
    interceptionId: InterceptionId
    request: Request
    frameId: str
    resourceType: ResourceType
    isNavigationRequest: bool
    # Optional keys.
    isDownload: NotRequired[bool]
    redirectUrl: NotRequired[str]
    authChallenge: NotRequired[AuthChallenge]
    responseErrorReason: NotRequired[ErrorReason]
    responseStatusCode: NotRequired[int]
    responseHeaders: NotRequired[Headers]
    requestId: NotRequired[RequestId]


class RequestServedFromCacheEventParams(TypedDict):
    """Params payload wrapped by ``RequestServedFromCacheEvent``."""

    # The only key carried by this payload.
    requestId: RequestId


class RequestWillBeSentEventParams(TypedDict):
    """Params payload wrapped by ``RequestWillBeSentEvent``.

    Keys up to ``redirectHasExtraInfo`` are required; the remaining four may
    be omitted.
    """

    # Required keys.
    requestId: RequestId
    loaderId: LoaderId
    documentURL: str
    request: Request
    timestamp: MonotonicTime
    wallTime: TimeSinceEpoch
    initiator: Initiator
    redirectHasExtraInfo: bool
    # Optional keys.
    redirectResponse: NotRequired[Response]
    type: NotRequired[ResourceType]
    frameId: NotRequired[str]
    hasUserGesture: NotRequired[bool]


class ResourceChangedPriorityEventParams(TypedDict):
    """Params of the event fired when resource loading priority is changed.

    Attributes:
        requestId: Request identifier.
        newPriority: New priority.
        timestamp: Timestamp.
    """

    requestId: RequestId
    newPriority: ResourcePriority
    timestamp: MonotonicTime


class SignedExchangeReceivedEventParams(TypedDict):
    """Params of the event fired when a signed exchange was received over the network.

    Attributes:
        requestId: Request identifier.
        info: Information about the signed exchange response.
    """

    requestId: RequestId
    info: SignedExchangeInfo


class ResponseReceivedEventParams(TypedDict):
    """Params payload wrapped by ``ResponseReceivedEvent``.

    Only ``frameId`` may be omitted.
    """

    # Required keys.
    requestId: RequestId
    loaderId: LoaderId
    timestamp: MonotonicTime
    type: ResourceType
    response: Response
    hasExtraInfo: bool
    # Optional key.
    frameId: NotRequired[str]


class WebSocketClosedEventParams(TypedDict):
    """Params payload wrapped by ``WebSocketClosedEvent``.

    Both keys are required.
    """

    requestId: RequestId
    timestamp: MonotonicTime


class WebSocketCreatedEventParams(TypedDict):
    """Params payload wrapped by ``WebSocketCreatedEvent``.

    ``initiator`` may be omitted.
    """

    # Required keys.
    requestId: RequestId
    url: str
    # Optional key.
    initiator: NotRequired[Initiator]


class WebSocketFrameErrorEventParams(TypedDict):
    """Params payload wrapped by ``WebSocketFrameErrorEvent``.

    All keys are required.
    """

    requestId: RequestId
    timestamp: MonotonicTime
    errorMessage: str


class WebSocketFrameReceivedEventParams(TypedDict):
    """Params payload wrapped by ``WebSocketFrameReceivedEvent``.

    All keys are required.
    """

    requestId: RequestId
    timestamp: MonotonicTime
    # The frame is carried under the key ``response``.
    response: WebSocketFrame


class WebSocketFrameSentEventParams(TypedDict):
    """Params payload wrapped by ``WebSocketFrameSentEvent``.

    All keys are required.
    """

    requestId: RequestId
    timestamp: MonotonicTime
    # The frame is carried under the key ``response``, same as the received variant.
    response: WebSocketFrame


class WebSocketHandshakeResponseReceivedEventParams(TypedDict):
    """Params payload wrapped by ``WebSocketHandshakeResponseReceivedEvent``.

    All keys are required.
    """

    requestId: RequestId
    timestamp: MonotonicTime
    response: WebSocketResponse


class WebSocketWillSendHandshakeRequestEventParams(TypedDict):
    """Params payload wrapped by ``WebSocketWillSendHandshakeRequestEvent``.

    All keys are required.
    """

    requestId: RequestId
    # Two time values with distinct types: monotonic and since-epoch.
    timestamp: MonotonicTime
    wallTime: TimeSinceEpoch
    request: WebSocketRequest


class WebTransportCreatedEventParams(TypedDict):
    """Params payload wrapped by ``WebTransportCreatedEvent``.

    ``initiator`` may be omitted.
    """

    # Required keys; note the identifier key is ``transportId``, typed as RequestId.
    transportId: RequestId
    url: str
    timestamp: MonotonicTime
    # Optional key.
    initiator: NotRequired[Initiator]


class WebTransportConnectionEstablishedEventParams(TypedDict):
    """Params payload wrapped by ``WebTransportConnectionEstablishedEvent``.

    Both keys are required.
    """

    transportId: RequestId
    timestamp: MonotonicTime


class WebTransportClosedEventParams(TypedDict):
    """Params payload wrapped by ``WebTransportClosedEvent``.

    Both keys are required.
    """

    transportId: RequestId
    timestamp: MonotonicTime


class DirectTCPSocketCreatedEventParams(TypedDict):
    """Params of the event fired upon direct_socket.TCPSocket creation.

    Attributes:
        identifier: Request identifier.
        remoteAddr: Remote address.
        remotePort: Remote port. Unsigned int 16.
        options: Socket options.
        timestamp: Timestamp.
        initiator: Request initiator (optional key).
    """

    identifier: RequestId
    remoteAddr: str
    remotePort: int
    options: DirectTCPSocketOptions
    timestamp: MonotonicTime
    initiator: NotRequired[Initiator]


class DirectTCPSocketOpenedEventParams(TypedDict):
    """Params of the event fired when a direct_socket.TCPSocket connection is opened.

    Attributes:
        identifier: Request identifier.
        remoteAddr: Remote address.
        remotePort: Remote port. Expected to be unsigned integer.
        timestamp: Timestamp.
        localAddr: Local address (optional key).
        localPort: Local port. Expected to be unsigned integer (optional key).
    """

    # Required keys.
    identifier: RequestId
    remoteAddr: str
    remotePort: int
    timestamp: MonotonicTime
    # Optional keys: for TCP it is the local endpoint that may be missing.
    localAddr: NotRequired[str]
    localPort: NotRequired[int]


class DirectTCPSocketAbortedEventParams(TypedDict):
    """Params of the event fired when direct_socket.TCPSocket is aborted.

    Attributes:
        identifier: Request identifier.
        errorMessage: Error message.
        timestamp: Timestamp.
    """

    identifier: RequestId
    errorMessage: str
    timestamp: MonotonicTime


class DirectTCPSocketClosedEventParams(TypedDict):
    """Params of the event fired when direct_socket.TCPSocket is closed.

    Attributes:
        identifier: Request identifier.
        timestamp: Timestamp.
    """

    identifier: RequestId
    timestamp: MonotonicTime


class DirectTCPSocketChunkSentEventParams(TypedDict):
    """Params of the event fired when data is sent to a tcp direct socket stream.

    Attributes:
        identifier: Request identifier.
        data: Data sent.
        timestamp: Timestamp.
    """

    identifier: RequestId
    data: str
    timestamp: MonotonicTime


class DirectTCPSocketChunkReceivedEventParams(TypedDict):
    """Params of the event fired when data is received from a tcp direct socket stream.

    Attributes:
        identifier: Request identifier.
        data: Data received.
        timestamp: Timestamp.
    """

    identifier: RequestId
    data: str
    timestamp: MonotonicTime


class DirectUDPSocketCreatedEventParams(TypedDict):
    """Params of the event fired upon direct_socket.UDPSocket creation.

    Attributes:
        identifier: Request identifier.
        options: Socket options.
        timestamp: Timestamp.
        initiator: Request initiator (optional key).
    """

    identifier: RequestId
    options: DirectUDPSocketOptions
    timestamp: MonotonicTime
    initiator: NotRequired[Initiator]


class DirectUDPSocketOpenedEventParams(TypedDict):
    """Params of the event fired when a direct_socket.UDPSocket connection is opened.

    Attributes:
        identifier: Request identifier.
        localAddr: Local address.
        localPort: Local port. Expected to be unsigned integer.
        timestamp: Timestamp.
        remoteAddr: Remote address (optional key).
        remotePort: Remote port. Expected to be unsigned integer (optional key).
    """

    # Required keys.
    identifier: RequestId
    localAddr: str
    localPort: int
    timestamp: MonotonicTime
    # Optional keys: for UDP it is the remote endpoint that may be missing.
    remoteAddr: NotRequired[str]
    remotePort: NotRequired[int]


class DirectUDPSocketAbortedEventParams(TypedDict):
    """Params of the event fired when direct_socket.UDPSocket is aborted.

    Attributes:
        identifier: Request identifier.
        errorMessage: Error message.
        timestamp: Timestamp.
    """

    identifier: RequestId
    errorMessage: str
    timestamp: MonotonicTime


class DirectUDPSocketClosedEventParams(TypedDict):
    """Params of the event fired when direct_socket.UDPSocket is closed.

    Attributes:
        identifier: Request identifier.
        timestamp: Timestamp.
    """

    identifier: RequestId
    timestamp: MonotonicTime


class DirectUDPSocketChunkSentEventParams(TypedDict):
    """Params of the event fired when a message is sent to a udp direct socket stream.

    Attributes:
        identifier: Request identifier.
        message: Message data.
        timestamp: Timestamp.
    """

    identifier: RequestId
    message: DirectUDPMessage
    timestamp: MonotonicTime


class DirectUDPSocketChunkReceivedEventParams(TypedDict):
    """Params of the event fired when a message is received from a udp direct socket stream.

    Attributes:
        identifier: Request identifier.
        message: Message data.
        timestamp: Timestamp.
    """

    identifier: RequestId
    message: DirectUDPMessage
    timestamp: MonotonicTime


class RequestWillBeSentExtraInfoEventParams(TypedDict):
    """Additional network-stack information about a requestWillBeSent event.

    Attributes:
        requestId: Request identifier. Used to match this information to an
            existing requestWillBeSent event.
        associatedCookies: Cookies potentially associated to the requested URL,
            both sent and not sent; the latter have blockedReasons set.
        headers: Raw request headers as they will be sent over the wire.
        connectTiming: Connection timing information for the request.
        clientSecurityState: The client security state set for the request
            (optional key).
        siteHasCookieInOtherPartition: Whether the site has partitioned cookies
            stored in a partition different than the current one (optional key).
    """

    # Required keys.
    requestId: RequestId
    associatedCookies: list[AssociatedCookie]
    headers: Headers
    connectTiming: ConnectTiming
    # Optional keys.
    clientSecurityState: NotRequired[ClientSecurityState]
    siteHasCookieInOtherPartition: NotRequired[bool]


class ResponseReceivedExtraInfoEventParams(TypedDict):
    """Additional network-stack information about a responseReceived event.

    Attributes:
        requestId: Request identifier. Used to match this information to
            another responseReceived event.
        blockedCookies: Cookies which were not stored from the response, with
            the corresponding reasons for blocking.
        headers: Raw response headers as they were received over the wire.
        resourceIPAddressSpace: The IP address space of the resource.
        statusCode: The status code of the response.
        headersText: Raw response header text as received over the wire; may
            not always be available (optional key).
        cookiePartitionKey: The cookie partition key used to store partitioned
            cookies set in this response (optional key).
        cookiePartitionKeyOpaque: True if partitioned cookies are enabled but
            the partition key is not serializable to string (optional key).
        exemptedCookies: Cookies which should have been blocked by 3PCD but are
            exempted and stored, with the corresponding reason (optional key).
    """

    # Required keys.
    requestId: RequestId
    blockedCookies: list[BlockedSetCookieWithReason]
    headers: Headers
    resourceIPAddressSpace: IPAddressSpace
    statusCode: int
    # Optional keys.
    headersText: NotRequired[str]
    cookiePartitionKey: NotRequired[CookiePartitionKey]
    cookiePartitionKeyOpaque: NotRequired[bool]
    exemptedCookies: NotRequired[list[ExemptedSetCookieWithReason]]


class ResponseReceivedEarlyHintsEventParams(TypedDict):
    """Params of the event fired when 103 Early Hints headers are received.

    Attributes:
        requestId: Request identifier. Used to match this information to
            another responseReceived event.
        headers: Raw response headers as they were received over the wire.
    """

    requestId: RequestId
    headers: Headers


class TrustTokenOperationDoneEventParams(TypedDict):
    """Params of the event fired exactly once for each Trust Token operation.

    Attributes:
        status: Detailed success or error status of the operation.
        type: Type of Trust Token operation.
        requestId: Request identifier.
        topLevelOrigin: Top level origin; the context in which the operation
            was attempted (optional key).
        issuerOrigin: Origin of the issuer in case of an "Issuance" or
            "Redemption" operation (optional key).
        issuedTokenCount: The number of obtained Trust Tokens on a successful
            "Issuance" operation (optional key).
    """

    # Typed as a plain str; the allowed values (Ok, InvalidArgument, ...) are
    # not enforced by the annotation.
    status: str
    type: TrustTokenOperationType
    requestId: RequestId
    # Optional keys.
    topLevelOrigin: NotRequired[str]
    issuerOrigin: NotRequired[str]
    issuedTokenCount: NotRequired[int]


class PolicyUpdatedEventParams(TypedDict):
    """Empty params of the event fired once security policy has been updated."""


class SubresourceWebBundleMetadataReceivedEventParams(TypedDict):
    """Params of the event fired once when parsing the .wbn file has succeeded.

    Attributes:
        requestId: Request identifier. Used to match this information to
            another event.
        urls: A list of URLs of resources in the subresource Web Bundle.
    """

    requestId: RequestId
    urls: list[str]


class SubresourceWebBundleMetadataErrorEventParams(TypedDict):
    """Params of the event fired once when parsing the .wbn file has failed.

    Attributes:
        requestId: Request identifier. Used to match this information to
            another event.
        errorMessage: Error message.
    """

    requestId: RequestId
    errorMessage: str


class SubresourceWebBundleInnerResponseParsedEventParams(TypedDict):
    """Params of the event fired when handling requests for resources within a .wbn file.

    Attributes:
        innerRequestId: Request identifier of the subresource request.
        innerRequestURL: URL of the subresource resource.
        bundleRequestId: Bundle request identifier, used to match this
            information to another event (optional key).
    """

    innerRequestId: RequestId
    innerRequestURL: str
    bundleRequestId: NotRequired[RequestId]


class SubresourceWebBundleInnerResponseErrorEventParams(TypedDict):
    """Params of the event fired when a request for resources within a .wbn file failed.

    Attributes:
        innerRequestId: Request identifier of the subresource request.
        innerRequestURL: URL of the subresource resource.
        errorMessage: Error message.
        bundleRequestId: Bundle request identifier, used to match this
            information to another event (optional key).
    """

    innerRequestId: RequestId
    innerRequestURL: str
    errorMessage: str
    bundleRequestId: NotRequired[RequestId]


class ReportingApiReportAddedEventParams(TypedDict):
    """Params of the event sent whenever a new report is added.

    Attributes:
        report: The report that was added.
    """

    report: ReportingApiReport


class ReportingApiReportUpdatedEventParams(TypedDict):
    """Params of the event fired when a report is updated.

    Attributes:
        report: The report that was updated.
    """

    report: ReportingApiReport


class ReportingApiEndpointsChangedForOriginEventParams(TypedDict):
    """Params of the event fired when Reporting API endpoints change for an origin.

    Attributes:
        origin: Origin of the document(s) which configured the endpoints.
        endpoints: The endpoints configured for the origin.
    """

    origin: str
    endpoints: list[ReportingApiEndpoint]


# Concrete event aliases: each one parameterizes the generic CDPEvent wrapper
# with the matching *EventParams TypedDict declared above.

# Request / response lifecycle.
DataReceivedEvent = CDPEvent[DataReceivedEventParams]
EventSourceMessageReceivedEvent = CDPEvent[EventSourceMessageReceivedEventParams]
LoadingFailedEvent = CDPEvent[LoadingFailedEventParams]
LoadingFinishedEvent = CDPEvent[LoadingFinishedEventParams]
RequestInterceptedEvent = CDPEvent[RequestInterceptedEventParams]
RequestServedFromCacheEvent = CDPEvent[RequestServedFromCacheEventParams]
RequestWillBeSentEvent = CDPEvent[RequestWillBeSentEventParams]
ResourceChangedPriorityEvent = CDPEvent[ResourceChangedPriorityEventParams]
SignedExchangeReceivedEvent = CDPEvent[SignedExchangeReceivedEventParams]
ResponseReceivedEvent = CDPEvent[ResponseReceivedEventParams]
# WebSocket.
WebSocketClosedEvent = CDPEvent[WebSocketClosedEventParams]
WebSocketCreatedEvent = CDPEvent[WebSocketCreatedEventParams]
WebSocketFrameErrorEvent = CDPEvent[WebSocketFrameErrorEventParams]
WebSocketFrameReceivedEvent = CDPEvent[WebSocketFrameReceivedEventParams]
WebSocketFrameSentEvent = CDPEvent[WebSocketFrameSentEventParams]
WebSocketHandshakeResponseReceivedEvent = CDPEvent[WebSocketHandshakeResponseReceivedEventParams]
WebSocketWillSendHandshakeRequestEvent = CDPEvent[WebSocketWillSendHandshakeRequestEventParams]
# WebTransport.
WebTransportCreatedEvent = CDPEvent[WebTransportCreatedEventParams]
WebTransportConnectionEstablishedEvent = CDPEvent[WebTransportConnectionEstablishedEventParams]
WebTransportClosedEvent = CDPEvent[WebTransportClosedEventParams]
# Direct TCP sockets.
DirectTCPSocketCreatedEvent = CDPEvent[DirectTCPSocketCreatedEventParams]
DirectTCPSocketOpenedEvent = CDPEvent[DirectTCPSocketOpenedEventParams]
DirectTCPSocketAbortedEvent = CDPEvent[DirectTCPSocketAbortedEventParams]
DirectTCPSocketClosedEvent = CDPEvent[DirectTCPSocketClosedEventParams]
DirectTCPSocketChunkSentEvent = CDPEvent[DirectTCPSocketChunkSentEventParams]
DirectTCPSocketChunkReceivedEvent = CDPEvent[DirectTCPSocketChunkReceivedEventParams]
# Direct UDP sockets.
DirectUDPSocketCreatedEvent = CDPEvent[DirectUDPSocketCreatedEventParams]
DirectUDPSocketOpenedEvent = CDPEvent[DirectUDPSocketOpenedEventParams]
DirectUDPSocketAbortedEvent = CDPEvent[DirectUDPSocketAbortedEventParams]
DirectUDPSocketClosedEvent = CDPEvent[DirectUDPSocketClosedEventParams]
DirectUDPSocketChunkSentEvent = CDPEvent[DirectUDPSocketChunkSentEventParams]
DirectUDPSocketChunkReceivedEvent = CDPEvent[DirectUDPSocketChunkReceivedEventParams]
# Extra-info, trust token and policy events.
RequestWillBeSentExtraInfoEvent = CDPEvent[RequestWillBeSentExtraInfoEventParams]
ResponseReceivedExtraInfoEvent = CDPEvent[ResponseReceivedExtraInfoEventParams]
ResponseReceivedEarlyHintsEvent = CDPEvent[ResponseReceivedEarlyHintsEventParams]
TrustTokenOperationDoneEvent = CDPEvent[TrustTokenOperationDoneEventParams]
PolicyUpdatedEvent = CDPEvent[PolicyUpdatedEventParams]
# Subresource web bundles (subscripts wrapped only to stay within the line limit).
SubresourceWebBundleMetadataReceivedEvent = CDPEvent[
    SubresourceWebBundleMetadataReceivedEventParams
]
SubresourceWebBundleMetadataErrorEvent = CDPEvent[SubresourceWebBundleMetadataErrorEventParams]
SubresourceWebBundleInnerResponseParsedEvent = CDPEvent[
    SubresourceWebBundleInnerResponseParsedEventParams
]
SubresourceWebBundleInnerResponseErrorEvent = CDPEvent[
    SubresourceWebBundleInnerResponseErrorEventParams
]
# Reporting API.
ReportingApiReportAddedEvent = CDPEvent[ReportingApiReportAddedEventParams]
ReportingApiReportUpdatedEvent = CDPEvent[ReportingApiReportUpdatedEventParams]
ReportingApiEndpointsChangedForOriginEvent = CDPEvent[
    ReportingApiEndpointsChangedForOriginEventParams
]


================================================
FILE: pydoll/protocol/network/har_types.py
================================================
"""HAR 1.2 format type definitions.

Based on the HAR 1.2 specification: http://www.softwareishard.com/blog/har-12-spec/
These TypedDicts define the structure of HAR (HTTP Archive) files used for
recording and replaying network traffic.
"""

from __future__ import annotations

from typing_extensions import NotRequired, TypedDict


class HarTimings(TypedDict):
    """Per-phase timing breakdown of one request/response round trip.

    All seven phases are required keys typed as ``float``.
    """

    # Phases before the request is written.
    blocked: float
    dns: float
    connect: float
    ssl: float
    # Phases of the exchange itself.
    send: float
    wait: float
    receive: float


class HarCookie(TypedDict):
    """Cookie used in a request or response."""

    name: str
    value: str
    path: NotRequired[str]
    domain: NotRequired[str]
    expires: NotRequired[str]
    httpOnly: NotRequired[bool]
    secure: NotRequired[bool]


class HarHeader(TypedDict):
    """One HTTP header, stored as a name/value pair of strings."""

    # Both keys are required.
    name: str
    value: str


class HarQueryParam(TypedDict):
    """One parameter of a URL query string, stored as a name/value pair."""

    # Both keys are required.
    name: str
    value: str


class HarPostData(TypedDict):
    """Posted data info."""

    mimeType: str
    text: str
    params: NotRequired[list[dict]]


class HarRequest(TypedDict):
    """The request half of a HAR entry.

    Every key is required except ``postData``.
    """

    # Request line.
    method: str
    url: str
    httpVersion: str
    # Structured collections.
    cookies: list[HarCookie]
    headers: list[HarHeader]
    queryString: list[HarQueryParam]
    # Sizes.
    headersSize: int
    bodySize: int
    # Optional key.
    postData: NotRequired[HarPostData]


class HarContent(TypedDict):
    """Response content body info."""

    size: int
    mimeType: str
    text: NotRequired[str]
    encoding: NotRequired[str]


class HarResponse(TypedDict):
    """The response half of a HAR entry.

    All keys are required.
    """

    # Status line.
    status: int
    statusText: str
    httpVersion: str
    # Structured collections and body.
    cookies: list[HarCookie]
    headers: list[HarHeader]
    content: HarContent
    redirectURL: str
    # Sizes.
    headersSize: int
    bodySize: int


class HarCache(TypedDict, total=False):
    """Cache state recorded for a request/response pair.

    Declared with ``total=False``, so both keys may be omitted.
    """

    beforeRequest: dict
    afterRequest: dict


class HarEntry(TypedDict):
    """One exported HTTP request together with its response.

    The first six keys are required; the last three may be omitted.
    """

    # Required keys.
    startedDateTime: str
    time: float
    request: HarRequest
    response: HarResponse
    cache: HarCache
    timings: HarTimings
    # Optional keys.
    serverIPAddress: NotRequired[str]
    connection: NotRequired[str]
    # NOTE(review): underscore prefix presumably marks a custom, non-standard
    # HAR field - confirm against the HAR 1.2 specification.
    _resourceType: NotRequired[str]


class HarPage(TypedDict):
    """One exported page.

    All three keys are required strings.
    """

    startedDateTime: str
    id: str
    title: str


class HarCreator(TypedDict):
    """Identifies what created the HAR file, by name and version."""

    # Both keys are required.
    name: str
    version: str


class HarLog(TypedDict):
    """Root container of the HAR data.

    All keys are required.
    """

    # File metadata.
    version: str
    creator: HarCreator
    # Recorded content.
    pages: list[HarPage]
    entries: list[HarEntry]


class Har(TypedDict):
    """Outermost HAR object; it holds everything under the single key ``log``."""

    log: HarLog


================================================
FILE: pydoll/protocol/network/methods.py
================================================
from enum import Enum

from typing_extensions import NotRequired, TypedDict

from pydoll.protocol.base import Command, EmptyParams, EmptyResponse, Response
from pydoll.protocol.debugger.types import SearchMatch
from pydoll.protocol.emulation.types import UserAgentMetadata
from pydoll.protocol.fetch.types import HeaderEntry, RequestPattern
from pydoll.protocol.network.types import (
    ConnectionType,
    ContentEncoding,
    Cookie,
    CookiePartitionKey,
    CookiePriority,
    CookieSameSite,
    CookieSourceScheme,
    LoadNetworkResourceOptions,
    SecurityIsolationStatus,
)


class NetworkMethod(str, Enum):
    """Command names of the ``Network`` domain.

    Members are ``str`` subclasses, so each compares equal to its
    ``'Network.<command>'`` value. Definition order is preserved on iteration.
    """

    # First alphabetically sorted group.
    CLEAR_BROWSER_CACHE = 'Network.clearBrowserCache'
    CLEAR_BROWSER_COOKIES = 'Network.clearBrowserCookies'
    DELETE_COOKIES = 'Network.deleteCookies'
    DISABLE = 'Network.disable'
    EMULATE_NETWORK_CONDITIONS = 'Network.emulateNetworkConditions'
    ENABLE = 'Network.enable'
    GET_COOKIES = 'Network.getCookies'
    GET_REQUEST_POST_DATA = 'Network.getRequestPostData'
    GET_RESPONSE_BODY = 'Network.getResponseBody'
    SET_BYPASS_SERVICE_WORKER = 'Network.setBypassServiceWorker'
    SET_CACHE_DISABLED = 'Network.setCacheDisabled'
    SET_COOKIE = 'Network.setCookie'
    SET_COOKIES = 'Network.setCookies'
    SET_EXTRA_HTTP_HEADERS = 'Network.setExtraHTTPHeaders'
    SET_USER_AGENT_OVERRIDE = 'Network.setUserAgentOverride'

    # Second alphabetically sorted group.
    CLEAR_ACCEPTED_ENCODINGS_OVERRIDE = 'Network.clearAcceptedEncodingsOverride'
    ENABLE_REPORTING_API = 'Network.enableReportingApi'
    GET_CERTIFICATE = 'Network.getCertificate'
    GET_RESPONSE_BODY_FOR_INTERCEPTION = 'Network.getResponseBodyForInterception'
    GET_SECURITY_ISOLATION_STATUS = 'Network.getSecurityIsolationStatus'
    LOAD_NETWORK_RESOURCE = 'Network.loadNetworkResource'
    REPLAY_XHR = 'Network.replayXHR'
    SEARCH_IN_RESPONSE_BODY = 'Network.searchInResponseBody'
    SET_ACCEPTED_ENCODINGS = 'Network.setAcceptedEncodings'
    SET_ATTACH_DEBUG_STACK = 'Network.setAttachDebugStack'
    SET_BLOCKED_URLS = 'Network.setBlockedURLs'
    SET_COOKIE_CONTROLS = 'Network.setCookieControls'
    STREAM_RESOURCE_CONTENT = 'Network.streamResourceContent'
    # Wrapped in parentheses only to stay within the line-length limit.
    TAKE_RESPONSE_BODY_FOR_INTERCEPTION_AS_STREAM = (
        'Network.takeResponseBodyForInterceptionAsStream'
    )


class DeleteCookiesParams(TypedDict):
    """Arguments for deleting browser cookies.

    Only ``name`` is required; the remaining keys may be omitted.
    """

    # Required key.
    name: str
    # Optional keys.
    url: NotRequired[str]
    domain: NotRequired[str]
    path: NotRequired[str]
    partitionKey: NotRequired[CookiePartitionKey]


class EmulateNetworkConditionsParams(TypedDict):
    """Arguments for emulating network conditions.

    The first four keys are required; the connection type and the packet
    settings may be omitted.
    """

    # Required keys.
    offline: bool
    latency: float
    downloadThroughput: float
    uploadThroughput: float
    # Optional keys.
    connectionType: NotRequired[ConnectionType]
    packetLoss: NotRequired[float]
    packetQueueLength: NotRequired[int]
    packetReordering: NotRequired[bool]


class NetworkEnableParams(TypedDict):
    """Parameters for enabling network tracking."""

    maxTotalBufferSize: NotRequired[int]
    maxResourceBufferSize: NotRequired[int]
    maxPostDataSize: NotRequired[int]


class GetCookiesParams(TypedDict):
    """Parameters for retrieving browser cookies."""

    urls: NotRequired[list[str]]


class GetRequestPostDataParams(TypedDict):
    """Arguments for retrieving the POST data of a request."""

    # Required key; typed as a plain string here.
    requestId: str


class GetResponseBodyParams(TypedDict):
    """Arguments for retrieving a response body."""

    # Required key; typed as a plain string here.
    requestId: str


class GetCertificateParams(TypedDict):
    """Arguments for retrieving a DER-encoded certificate."""

    # Required key.
    origin: str


class GetResponseBodyForInterceptionParams(TypedDict):
    """Arguments for retrieving the response body of an intercepted request."""

    # Required key; typed as a plain string here.
    interceptionId: str


class SearchInResponseBodyParams(TypedDict):
    """Parameters for searching in response content."""

    requestId: str
    query: str
    caseSensitive: NotRequired[bool]
    isRegex: NotRequired[bool]


class SetBypassServiceWorkerParams(TypedDict):
    """Arguments for toggling the service worker bypass."""

    # Required flag.
    bypass: bool


class SetCacheDisabledParams(TypedDict):
    """Arguments for toggling the cache for requests."""

    # Required flag.
    cacheDisabled: bool


class SetCookieParams(TypedDict):
    """Arguments for setting a single cookie.

    ``name`` and ``value`` are required; every other key may be omitted.
    """

    # Required keys.
    name: str
    value: str
    # Optional scope.
    url: NotRequired[str]
    domain: NotRequired[str]
    path: NotRequired[str]
    # Optional attributes.
    secure: NotRequired[bool]
    httpOnly: NotRequired[bool]
    sameSite: NotRequired[CookieSameSite]
    expires: NotRequired[float]
    priority: NotRequired[CookiePriority]
    sameParty: NotRequired[bool]
    # Optional source and partition information.
    sourceScheme: NotRequired[CookieSourceScheme]
    sourcePort: NotRequired[int]
    partitionKey: NotRequired[CookiePartitionKey]


class SetCookiesParams(TypedDict):
    """Arguments for setting several cookies at once."""

    # Required key: one SetCookieParams dict per cookie.
    cookies: list[SetCookieParams]


class SetExtraHTTPHeadersParams(TypedDict):
    """Arguments for setting extra HTTP headers."""

    # Required key.
    # NOTE(review): the CDP Network domain appears to define ``headers`` as a
    # name-to-value object rather than a list of entries - confirm against the
    # protocol reference before relying on this shape.
    headers: list[HeaderEntry]


class SetUserAgentOverrideParams(TypedDict):
    """Arguments for overriding the user agent string.

    Only ``userAgent`` is required.
    """

    # Required key.
    userAgent: str
    # Optional keys.
    acceptLanguage: NotRequired[str]
    platform: NotRequired[str]
    userAgentMetadata: NotRequired[UserAgentMetadata]


class SetBlockedURLsParams(TypedDict):
    """Arguments for blocking URLs from loading."""

    # Required key: a list of strings.
    urls: list[str]


class SetAcceptedEncodingsParams(TypedDict):
    """Arguments for setting the accepted content encodings."""

    # Required key.
    encodings: list[ContentEncoding]


class SetAttachDebugStackParams(TypedDict):
    """Arguments for attaching a page script stack in requests."""

    # Required flag.
    enabled: bool


class SetCookieControlsParams(TypedDict):
    """Parameters for setting controls for third-party cookie access."""

    enableThirdPartyCookieRestriction: bool
    disableThirdPartyCookieMetadata: NotRequired[bool]
    disableThirdPartyCookieHeuristics: NotRequired[bool]


class StreamResourceContentParams(TypedDict):
    """Arguments for enabling streaming of a response."""

    # Required key; typed as a plain string here.
    requestId: str


class TakeResponseBodyForInterceptionAsStreamParams(TypedDict):
    """Arguments for taking an intercepted response body as a stream."""

    # Required key; typed as a plain string here.
    interceptionId: str


class SetRequestInterceptionParams(TypedDict):
    """Arguments for setting the request interception patterns."""

    # Required key.
    patterns: list[RequestPattern]


class AuthChallengeResponseParams(TypedDict):
    """Parameters for responding to an auth challenge."""

    response: str
    username: NotRequired[str]
    password: NotRequired[str]


class EnableReportingApiParams(TypedDict):
    """Arguments for enabling the Reporting API."""

    # Required flag.
    # NOTE(review): the CDP parameter for Network.enableReportingApi appears to
    # be named ``enable`` rather than ``enabled`` - confirm against the protocol
    # reference; the key is left unchanged so existing callers keep working.
    enabled: bool


class GetSecurityIsolationStatusParams(TypedDict):
    frameId: NotRequired[str]


class LoadNetworkResourceParams(TypedDict):
    """Arguments for loading a network resource.

    ``url`` and ``options`` are required; ``frameId`` may be omitted.
    """

    # Required keys.
    url: str
    options: LoadNetworkResourceOptions
    # Optional key.
    frameId: NotRequired[str]


class ReplayXHRParams(TypedDict):
    """Parameters for replaying an XMLHttpRequest."""

    # Identifier of the XHR request to replay.
    requestId: str


class GetCookiesResult(TypedDict):
    """Response result for getCookies command."""

    # Cookie objects returned by the browser.
    cookies: list[Cookie]


class GetRequestPostDataResult(TypedDict):
    """Response result for getRequestPostData command."""

    # Post data that was sent with the request.
    postData: str


class GetResponseBodyResult(TypedDict):
    """Response result for getResponseBody command."""

    # Response body, as text or as a base64 string (see base64Encoded).
    body: str
    # True when ``body`` is base64-encoded and must be decoded by the caller.
    base64Encoded: bool


class GetResponseBodyForInterceptionResult(TypedDict):
    """Response result for getResponseBodyForInterception command."""

    # Response body, as text or as a base64 string (see base64Encoded).
    body: str
    # True when ``body`` is base64-encoded and must be decoded by the caller.
    base64Encoded: bool


class GetCertificateResult(TypedDict):
    """Response result for getCertificate command."""

    # List of strings returned under the protocol's ``tableNames`` key
    # (the key name is dictated by the CDP wire format).
    tableNames: list[str]


class SearchInResponseBodyResult(TypedDict):
    """Response result for searchInResponseBody command."""

    # Matches found in the response body, one SearchMatch per hit.
    result: list[SearchMatch]


class SetCookieResult(TypedDict):
    """Response result for setCookie command."""

    # Success flag reported by the browser for the setCookie call.
    success: bool


class StreamResourceContentResult(TypedDict):
    """Response result for streamResourceContent command."""

    # Data that was already buffered when streaming was enabled
    # (CDP: base64-encoded when passed over JSON).
    bufferedData: str


class TakeResponseBodyForInterceptionAsStreamResult(TypedDict):
    """Response result for takeResponseBodyForInterceptionAsStream command."""

    # Handle of the stream from which the response body can be read.
    stream: str


class CanClearBrowserCacheResult(TypedDict):
    """Response result for canClearBrowserCache command."""

    # True if the browser cache can be cleared.
    result: bool


class CanClearBrowserCookiesResult(TypedDict):
    """Response result for canClearBrowserCookies command."""

    # True if browser cookies can be cleared.
    result: bool


class CanEmulateNetworkConditionsResult(TypedDict):
    """Response result for canEmulateNetworkConditions command."""

    # True if emulation of network conditions is supported.
    result: bool


class GetSecurityIsolationStatusResult(TypedDict):
    """Response result for getSecurityIsolationStatus command."""

    # Isolation status (COOP / COEP / CSP details) of the queried frame or target.
    status: SecurityIsolationStatus


class LoadNetworkResourceResult(TypedDict):
    """Response result for loadNetworkResource command.

    Only ``success`` is required; all other keys are optional.
    """

    # NOTE(review): the CDP specification documents Network.loadNetworkResource
    # as returning a single ``resource`` key holding a
    # LoadNetworkResourcePageResult, whose ``headers`` is a Headers mapping.
    # This flattened shape (and ``list[HeaderEntry]``) may not match the wire
    # payload - confirm against the protocol before relying on these keys.

    # Whether the load succeeded.
    success: bool
    # Optional numeric network error, used for error reporting.
    netError: NotRequired[float]
    # Optional symbolic name of the network error.
    netErrorName: NotRequired[str]
    # Optional HTTP status code of the response.
    httpStatusCode: NotRequired[float]
    # Optional handle of the stream holding the loaded resource.
    stream: NotRequired[str]
    # Optional response headers.
    headers: NotRequired[list[HeaderEntry]]


# Response envelope aliases: each binds the generic ``Response`` wrapper to the
# result TypedDict of one Network command that returns data.
GetCookiesResponse = Response[GetCookiesResult]
SetCookieResponse = Response[SetCookieResult]
GetRequestPostDataResponse = Response[GetRequestPostDataResult]
GetResponseBodyResponse = Response[GetResponseBodyResult]
GetResponseBodyForInterceptionResponse = Response[GetResponseBodyForInterceptionResult]
SearchInResponseBodyResponse = Response[SearchInResponseBodyResult]
StreamResourceContentResponse = Response[StreamResourceContentResult]
TakeResponseBodyForInterceptionAsStreamResponse = Response[
    TakeResponseBodyForInterceptionAsStreamResult
]
GetCertificateResponse = Response[GetCertificateResult]
CanClearBrowserCacheResponse = Response[CanClearBrowserCacheResult]
CanClearBrowserCookiesResponse = Response[CanClearBrowserCookiesResult]
CanEmulateNetworkConditionsResponse = Response[CanEmulateNetworkConditionsResult]
GetSecurityIsolationStatusResponse = Response[GetSecurityIsolationStatusResult]
LoadNetworkResourceResponse = Response[LoadNetworkResourceResult]


# Command aliases: each pairs the parameter TypedDict of a Network command with
# the response type it yields. Commands that return no data use
# ``Response[EmptyResponse]``; commands without parameters use ``EmptyParams``.
ClearBrowserCacheCommand = Command[EmptyParams, Response[EmptyResponse]]
ClearBrowserCookiesCommand = Command[EmptyParams, Response[EmptyResponse]]
# NOTE(review): this alias is parameterized with DeleteCookiesParams, so it
# presumably models Network.deleteCookies - confirm the alias name is intended.
ClearCookiesCommand = Command[DeleteCookiesParams, Response[EmptyResponse]]
DisableCommand = Command[EmptyParams, Response[EmptyResponse]]
EmulateNetworkConditionsCommand = Command[EmulateNetworkConditionsParams, Response[EmptyResponse]]
EnableCommand = Command[NetworkEnableParams, Response[EmptyResponse]]
GetCookiesCommand = Command[GetCookiesParams, GetCookiesResponse]
GetRequestPostDataCommand = Command[GetRequestPostDataParams, GetRequestPostDataResponse]
GetResponseBodyCommand = Command[GetResponseBodyParams, GetResponseBodyResponse]
SetCacheDisabledCommand = Command[SetCacheDisabledParams, Response[EmptyResponse]]
SetCookieCommand = Command[SetCookieParams, SetCookieResponse]
SetCookiesCommand = Command[SetCookiesParams, Response[EmptyResponse]]
SetExtraHTTPHeadersCommand = Command[SetExtraHTTPHeadersParams, Response[EmptyResponse]]
SetUserAgentOverrideCommand = Command[SetUserAgentOverrideParams, Response[EmptyResponse]]
ClearAcceptedEncodingsOverrideCommand = Command[EmptyParams, Response[EmptyResponse]]
EnableReportingApiCommand = Command[EnableReportingApiParams, Response[EmptyResponse]]
SearchInResponseBodyCommand = Command[SearchInResponseBodyParams, SearchInResponseBodyResponse]
SetBlockedURLsCommand = Command[SetBlockedURLsParams, Response[EmptyResponse]]
SetBypassServiceWorkerCommand = Command[SetBypassServiceWorkerParams, Response[EmptyResponse]]
GetCertificateCommand = Command[GetCertificateParams, GetCertificateResponse]
GetResponseBodyForInterceptionCommand = Command[
    GetResponseBodyForInterceptionParams, GetResponseBodyForInterceptionResponse
]
SetAcceptedEncodingsCommand = Command[SetAcceptedEncodingsParams, Response[EmptyResponse]]
SetAttachDebugStackCommand = Command[SetAttachDebugStackParams, Response[EmptyResponse]]
SetCookieControlsCommand = Command[SetCookieControlsParams, Response[EmptyResponse]]
StreamResourceContentCommand = Command[StreamResourceContentParams, StreamResourceContentResponse]
TakeResponseBodyForInterceptionAsStreamCommand = Command[
    TakeResponseBodyForInterceptionAsStreamParams, TakeResponseBodyForInterceptionAsStreamResponse
]
GetSecurityIsolationStatusCommand = Command[
    GetSecurityIsolationStatusParams, GetSecurityIsolationStatusResponse
]
LoadNetworkResourceCommand = Command[LoadNetworkResourceParams, LoadNetworkResourceResponse]
ReplayXHRCommand = Command[ReplayXHRParams, Response[EmptyResponse]]


================================================
FILE: pydoll/protocol/network/types.py
================================================
from enum import Enum

from typing_extensions import NotRequired, TypedDict

from pydoll.protocol.runtime.types import StackTrace
from pydoll.protocol.security.types import MixedContentType, SecurityState


class ResourceType(str, Enum):
    """Resource type as it was perceived by the rendering engine.

    Members subclass ``str``, so each one compares equal to the raw protocol
    string it wraps (e.g. ``ResourceType.XHR == 'XHR'``).
    """

    DOCUMENT = 'Document'
    STYLESHEET = 'Stylesheet'
    IMAGE = 'Image'
    MEDIA = 'Media'
    FONT = 'Font'
    SCRIPT = 'Script'
    TEXT_TRACK = 'TextTrack'
    XHR = 'XHR'
    FETCH = 'Fetch'
    PREFETCH = 'Prefetch'
    EVENT_SOURCE = 'EventSource'
    WEB_SOCKET = 'WebSocket'
    MANIFEST = 'Manifest'
    SIGNED_EXCHANGE = 'SignedExchange'
    PING = 'Ping'
    CSP_VIOLATION_REPORT = 'CSPViolationReport'
    PREFLIGHT = 'Preflight'
    FED_CM = 'FedCM'
    # Catch-all for resources that fit none of the categories above.
    OTHER = 'Other'


# Protocol identifiers are plain strings on the wire; these aliases only name
# their role for readers and type checkers.
# Unique loader identifier.
LoaderId = str
# Unique request identifier.
RequestId = str
# Unique intercepted-request identifier.
InterceptionId = str


class ErrorReason(str, Enum):
    """Network level fetch failure reason.

    Members subclass ``str`` and carry the exact PascalCase protocol value.
    """

    # Generic / unspecified outcomes.
    FAILED = 'Failed'
    ABORTED = 'Aborted'
    TIMED_OUT = 'TimedOut'
    ACCESS_DENIED = 'AccessDenied'
    # Connection-level failures.
    CONNECTION_CLOSED = 'ConnectionClosed'
    CONNECTION_RESET = 'ConnectionReset'
    CONNECTION_REFUSED = 'ConnectionRefused'
    CONNECTION_ABORTED = 'ConnectionAborted'
    CONNECTION_FAILED = 'ConnectionFailed'
    # Name resolution / reachability failures.
    NAME_NOT_RESOLVED = 'NameNotResolved'
    INTERNET_DISCONNECTED = 'InternetDisconnected'
    ADDRESS_UNREACHABLE = 'AddressUnreachable'
    # Request was blocked rather than failed.
    BLOCKED_BY_CLIENT = 'BlockedByClient'
    BLOCKED_BY_RESPONSE = 'BlockedByResponse'


# UTC time in seconds, counted from January 1, 1970 (per the CDP spec).
TimeSinceEpoch = float
# Monotonically increasing time in seconds since an arbitrary point in the past
# (per the CDP spec).
MonotonicTime = float
# Request / response headers as a name -> value mapping.
Headers = dict[str, str]


class RequestMethod(str, Enum):
    """HTTP request method.

    Members subclass ``str``, so each one compares equal to the upper-case
    method token it wraps (e.g. ``RequestMethod.GET == 'GET'``).

    The original five members keep their position at the front of the
    iteration order; the remaining standard HTTP methods are appended so
    that HEAD / OPTIONS / CONNECT / TRACE requests can be expressed too.
    """

    GET = 'GET'
    POST = 'POST'
    PUT = 'PUT'
    DELETE = 'DELETE'
    PATCH = 'PATCH'
    # Standard methods that were previously missing from the enum.
    HEAD = 'HEAD'
    OPTIONS = 'OPTIONS'
    CONNECT = 'CONNECT'
    TRACE = 'TRACE'


class ConnectionType(str, Enum):
    """The underlying connection technology that the browser is supposedly using.

    Unlike most enums in this module the protocol values are all lower-case.
    """

    NONE = 'none'
    CELLULAR2G = 'cellular2g'
    CELLULAR3G = 'cellular3g'
    CELLULAR4G = 'cellular4g'
    BLUETOOTH = 'bluetooth'
    ETHERNET = 'ethernet'
    WIFI = 'wifi'
    WIMAX = 'wimax'
    OTHER = 'other'


class CookieSameSite(str, Enum):
    """Represents the cookie's 'SameSite' status."""

    STRICT = 'Strict'
    LAX = 'Lax'
    # The literal string 'None' (an explicit SameSite=None), not Python's None.
    NONE = 'None'


class CookiePriority(str, Enum):
    """Represents the cookie's 'Priority' status."""

    # Members are listed from lowest to highest priority.
    LOW = 'Low'
    MEDIUM = 'Medium'
    HIGH = 'High'


class CookieSourceScheme(str, Enum):
    """
    Represents the source scheme of the origin that originally set the cookie.

    A value of "Unset" allows protocol clients to emulate legacy cookie scope for the scheme.
    This is a temporary ability and it will be removed in the future.
    """

    UNSET = 'Unset'
    NON_SECURE = 'NonSecure'
    SECURE = 'Secure'


class ResourceTiming(TypedDict):
    """Timing information for the request.

    Per the CDP spec ``requestTime`` is a baseline in seconds, while every
    other number is a tick in milliseconds relative to that baseline.
    Only the two ``workerRouter*`` / ``workerCache*`` keys are optional.
    """

    # Baseline timestamp in seconds.
    requestTime: float
    # Proxy resolution started / finished.
    proxyStart: float
    proxyEnd: float
    # DNS address resolution started / finished.
    dnsStart: float
    dnsEnd: float
    # Connecting to the remote host started / finished.
    connectStart: float
    connectEnd: float
    # SSL handshake started / finished.
    sslStart: float
    sslEnd: float
    # Service worker: started running / finished starting.
    workerStart: float
    workerReady: float
    # Service worker: fetch event started / respondWith promise settled.
    workerFetchStart: float
    workerRespondWithSettled: float
    # Optional: service worker static routing source evaluation started.
    workerRouterEvaluationStart: NotRequired[float]
    # Optional: cache lookup started (when the router source resolved to cache).
    workerCacheLookupStart: NotRequired[float]
    # Sending the request started / finished.
    sendStart: float
    sendEnd: float
    # Server push of the request started / finished.
    pushStart: float
    pushEnd: float
    # Receiving response headers started / finished.
    receiveHeadersStart: float
    receiveHeadersEnd: float


class ResourcePriority(str, Enum):
    """Loading priority of a resource request."""

    # Members are listed from lowest to highest priority.
    VERY_LOW = 'VeryLow'
    LOW = 'Low'
    MEDIUM = 'Medium'
    HIGH = 'High'
    VERY_HIGH = 'VeryHigh'


class PostDataEntry(TypedDict):
    """Post data entry for HTTP request."""

    # Optional payload chunk. The key is named ``bytes`` because that is the
    # protocol's wire name; per the CDP spec the value is a base64 string.
    bytes: NotRequired[str]


class Request(TypedDict):
    """HTTP request data.

    Required keys: ``url``, ``method``, ``headers``, ``initialPriority`` and
    ``referrerPolicy``. Everything else is optional.
    """

    # Request URL (per CDP, without the fragment).
    url: str
    # Optional fragment of the requested URL, starting with '#'.
    urlFragment: NotRequired[str]
    # HTTP request method, kept as a raw string.
    method: str
    # HTTP request headers.
    headers: 'Headers'
    # Optional HTTP POST request data.
    postData: NotRequired[str]
    # Optional flag: True when the request has POST data.
    hasPostData: NotRequired[bool]
    # Optional request body elements.
    postDataEntries: NotRequired[list['PostDataEntry']]
    # Optional mixed content type of the request.
    mixedContentType: NotRequired['MixedContentType']
    # Priority of the resource request at the time the request data was sent.
    initialPriority: 'ResourcePriority'
    # Referrer policy of the request, kept as a raw string.
    referrerPolicy: str
    # Optional flag: whether the request is loaded via link preload.
    isLinkPreload: NotRequired[bool]
    # Optional Trust Token parameters attached to the request.
    trustTokenParams: NotRequired['TrustTokenParams']
    # Optional flag: True if the request is considered same-site.
    isSameSite: NotRequired[bool]


class SignedCertificateTimestamp(TypedDict):
    """Details of a signed certificate timestamp (SCT).

    All keys are required.
    """

    # Validation status.
    status: str
    # Origin of the SCT.
    origin: str
    # Log name / description.
    logDescription: str
    # Log identifier.
    logId: str
    # Issuance date of the SCT (CDP documents it as milliseconds since the epoch).
    timestamp: float
    # Hash algorithm.
    hashAlgorithm: str
    # Signature algorithm.
    signatureAlgorithm: str
    # Signature data.
    signatureData: str


class SecurityDetails(TypedDict):
    """Security details about a request.

    ``keyExchangeGroup``, ``mac`` and ``serverSignatureAlgorithm`` are the
    only optional keys.
    """

    # Protocol name (e.g. "TLS 1.2" or "QUIC").
    protocol: str
    # Key exchange used by the connection.
    keyExchange: str
    # Optional (EC)DH group used by the connection.
    keyExchangeGroup: NotRequired[str]
    # Cipher name.
    cipher: str
    # Optional TLS MAC (CDP notes AEAD ciphers have no separate MAC).
    mac: NotRequired[str]
    # Certificate identifier.
    certificateId: int
    # Certificate subject name.
    subjectName: str
    # Subject Alternative Name (SAN) entries: DNS names and IP addresses.
    sanList: list[str]
    # Name of the issuing CA.
    issuer: str
    # Start / end of the certificate validity period.
    validFrom: 'TimeSinceEpoch'
    validTo: 'TimeSinceEpoch'
    # Signed certificate timestamps (SCTs) attached to the connection.
    signedCertificateTimestampList: list['SignedCertificateTimestamp']
    # Whether the request complied with Certificate Transparency policy.
    certificateTransparencyCompliance: 'CertificateTransparencyCompliance'
    # Optional signature algorithm used by the server (CDP: a TLS
    # SignatureScheme code point).
    serverSignatureAlgorithm: NotRequired[int]
    # Whether the connection used Encrypted ClientHello.
    encryptedClientHello: bool


class CertificateTransparencyCompliance(str, Enum):
    """Whether the request complied with Certificate Transparency policy.

    Protocol values are lower-case and hyphenated.
    """

    UNKNOWN = 'unknown'
    NOT_COMPLIANT = 'not-compliant'
    COMPLIANT = 'compliant'


class BlockedReason(str, Enum):
    """The reason why request was blocked.

    Protocol values are lower-case and hyphenated; the longest ones are
    wrapped in parentheses purely to satisfy the line-length limit.
    """

    OTHER = 'other'
    CSP = 'csp'
    MIXED_CONTENT = 'mixed-content'
    ORIGIN = 'origin'
    INSPECTOR = 'inspector'
    INTEGRITY = 'integrity'
    SUBRESOURCE_FILTER = 'subresource-filter'
    CONTENT_TYPE = 'content-type'
    # Cross-origin isolation related reasons (COEP / COOP / CORP / DIP).
    COEP_FRAME_RESOURCE_NEEDS_COEP_HEADER = 'coep-frame-resource-needs-coep-header'
    COOP_SANDBOXED_IFRAME_CANNOT_NAVIGATE_TO_COOP_PAGE = (
        'coop-sandboxed-iframe-cannot-navigate-to-coop-page'
    )
    CORP_NOT_SAME_ORIGIN = 'corp-not-same-origin'
    CORP_NOT_SAME_ORIGIN_AFTER_DEFAULTED_TO_SAME_ORIGIN_BY_COEP = (
        'corp-not-same-origin-after-defaulted-to-same-origin-by-coep'
    )
    CORP_NOT_SAME_ORIGIN_AFTER_DEFAULTED_TO_SAME_ORIGIN_BY_DIP = (
        'corp-not-same-origin-after-defaulted-to-same-origin-by-dip'
    )
    CORP_NOT_SAME_ORIGIN_AFTER_DEFAULTED_TO_SAME_ORIGIN_BY_COEP_AND_DIP = (
        'corp-not-same-origin-after-defaulted-to-same-origin-by-coep-and-dip'
    )
    CORP_NOT_SAME_SITE = 'corp-not-same-site'
    SRI_MESSAGE_SIGNATURE_MISMATCH = 'sri-message-signature-mismatch'


class CorsError(str, Enum):
    """The reason why a request failed a CORS check.

    This is the type of ``CorsErrorStatus.corsError``. Members subclass ``str``
    and carry the exact PascalCase protocol value.
    """

    DISALLOWED_BY_MODE = 'DisallowedByMode'
    INVALID_RESPONSE = 'InvalidResponse'
    # Access-Control-Allow-Origin / Allow-Credentials problems on the response.
    WILDCARD_ORIGIN_NOT_ALLOWED = 'WildcardOriginNotAllowed'
    MISSING_ALLOW_ORIGIN_HEADER = 'MissingAllowOriginHeader'
    MULTIPLE_ALLOW_ORIGIN_VALUES = 'MultipleAllowOriginValues'
    INVALID_ALLOW_ORIGIN_VALUE = 'InvalidAllowOriginValue'
    ALLOW_ORIGIN_MISMATCH = 'AllowOriginMismatch'
    INVALID_ALLOW_CREDENTIALS = 'InvalidAllowCredentials'
    CORS_DISABLED_SCHEME = 'CorsDisabledScheme'
    # The same families of problems, detected on the preflight response.
    PREFLIGHT_INVALID_STATUS = 'PreflightInvalidStatus'
    PREFLIGHT_DISALLOWED_REDIRECT = 'PreflightDisallowedRedirect'
    PREFLIGHT_WILDCARD_ORIGIN_NOT_ALLOWED = 'PreflightWildcardOriginNotAllowed'
    PREFLIGHT_MISSING_ALLOW_ORIGIN_HEADER = 'PreflightMissingAllowOriginHeader'
    PREFLIGHT_MULTIPLE_ALLOW_ORIGIN_VALUES = 'PreflightMultipleAllowOriginValues'
    PREFLIGHT_INVALID_ALLOW_ORIGIN_VALUE = 'PreflightInvalidAllowOriginValue'
    PREFLIGHT_ALLOW_ORIGIN_MISMATCH = 'PreflightAllowOriginMismatch'
    PREFLIGHT_INVALID_ALLOW_CREDENTIALS = 'PreflightInvalidAllowCredentials'
    PREFLIGHT_MISSING_ALLOW_EXTERNAL = 'PreflightMissingAllowExternal'
    PREFLIGHT_INVALID_ALLOW_EXTERNAL = 'PreflightInvalidAllowExternal'
    PREFLIGHT_MISSING_ALLOW_PRIVATE_NETWORK = 'PreflightMissingAllowPrivateNetwork'
    PREFLIGHT_INVALID_ALLOW_PRIVATE_NETWORK = 'PreflightInvalidAllowPrivateNetwork'
    INVALID_ALLOW_METHODS_PREFLIGHT_RESPONSE = 'InvalidAllowMethodsPreflightResponse'
    INVALID_ALLOW_HEADERS_PREFLIGHT_RESPONSE = 'InvalidAllowHeadersPreflightResponse'
    METHOD_DISALLOWED_BY_PREFLIGHT_RESPONSE = 'MethodDisallowedByPreflightResponse'
    HEADER_DISALLOWED_BY_PREFLIGHT_RESPONSE = 'HeaderDisallowedByPreflightResponse'
    REDIRECT_CONTAINS_CREDENTIALS = 'RedirectContainsCredentials'
    # Private / local network access related reasons.
    INSECURE_PRIVATE_NETWORK = 'InsecurePrivateNetwork'
    INVALID_PRIVATE_NETWORK_ACCESS = 'InvalidPrivateNetworkAccess'
    UNEXPECTED_PRIVATE_NETWORK_ACCESS = 'UnexpectedPrivateNetworkAccess'
    NO_CORS_REDIRECT_MODE_NOT_FOLLOW = 'NoCorsRedirectModeNotFollow'
    PREFLIGHT_MISSING_PRIVATE_NETWORK_ACCESS_ID = 'PreflightMissingPrivateNetworkAccessId'
    PREFLIGHT_MISSING_PRIVATE_NETWORK_ACCESS_NAME = 'PreflightMissingPrivateNetworkAccessName'
    PRIVATE_NETWORK_ACCESS_PERMISSION_UNAVAILABLE = 'PrivateNetworkAccessPermissionUnavailable'
    PRIVATE_NETWORK_ACCESS_PERMISSION_DENIED = 'PrivateNetworkAccessPermissionDenied'
    LOCAL_NETWORK_ACCESS_PERMISSION_DENIED = 'LocalNetworkAccessPermissionDenied'


class CorsErrorStatus(TypedDict):
    """A CORS error together with the parameter that caused it."""

    # Which CORS check failed.
    corsError: CorsError
    # The parameter associated with the failure, as a raw string.
    failedParameter: str


class ServiceWorkerResponseSource(str, Enum):
    """Source of serviceworker response.

    Protocol values are lower-case and hyphenated.
    """

    CACHE_STORAGE = 'cache-storage'
    HTTP_CACHE = 'http-cache'
    FALLBACK_CODE = 'fallback-code'
    NETWORK = 'network'


class TrustTokenParams(TypedDict):
    """
    Determines what type of Trust Token operation is executed and depending on the type,
    some additional parameters. The values are specified in
    third_party/blink/renderer/core/fetch/trust_token.idl.

    ``operation`` and ``refreshPolicy`` are required; ``issuers`` is optional.
    """

    # Kind of Trust Token operation being executed.
    operation: 'TrustTokenOperationType'
    # Refresh policy, kept as a raw string (CDP values: UseCached, Refresh).
    refreshPolicy: str
    # Optional list of issuer origins.
    issuers: NotRequired[list[str]]


class TrustTokenOperationType(str, Enum):
    """Kind of Trust Token operation (type of ``TrustTokenParams.operation``)."""

    ISSUANCE = 'Issuance'
    REDEMPTION = 'Redemption'
    SIGNING = 'Signing'


class AlternateProtocolUsage(str, Enum):
    """The reason why Chrome uses a specific transport protocol for HTTP semantics.

    Protocol values are camelCase, unlike most enums in this module.
    """

    ALTERNATIVE_JOB_WON_WITHOUT_RACE = 'alternativeJobWonWithoutRace'
    ALTERNATIVE_JOB_WON_RACE = 'alternativeJobWonRace'
    MAIN_JOB_WON_RACE = 'mainJobWonRace'
    MAPPING_MISSING = 'mappingMissing'
    BROKEN = 'broken'
    DNS_ALPN_H3_JOB_WON_WITHOUT_RACE = 'dnsAlpnH3JobWonWithoutRace'
    DNS_ALPN_H3_JOB_WON_RACE = 'dnsAlpnH3JobWonRace'
    UNSPECIFIED_REASON = 'unspecifiedReason'


class ServiceWorkerRouterSource(str, Enum):
    """Source of service worker router.

    Used for both the matched and the actual source in ServiceWorkerRouterInfo.
    """

    NETWORK = 'network'
    CACHE = 'cache'
    FETCH_EVENT = 'fetch-event'
    RACE_NETWORK_AND_FETCH_HANDLER = 'race-network-and-fetch-handler'


class ServiceWorkerRouterInfo(TypedDict):
    """Service worker static-router details for a response. All keys are optional."""

    # Optional id of the router rule that matched.
    ruleIdMatched: NotRequired[int]
    # Optional router source of the matched rule.
    matchedSourceType: NotRequired['ServiceWorkerRouterSource']
    # Optional router source that was actually used.
    actualSourceType: NotRequired['ServiceWorkerRouterSource']


class Response(TypedDict):
    """HTTP response data.

    Required keys: ``url``, ``status``, ``statusText``, ``headers``,
    ``mimeType``, ``charset``, ``connectionReused``, ``connectionId``,
    ``encodedDataLength`` and ``securityState``. Everything else is optional.
    """

    # Response URL.
    url: str
    # HTTP response status code.
    status: int
    # HTTP response status text.
    statusText: str
    # HTTP response headers.
    headers: 'Headers'
    # Optional raw text of the response headers.
    headersText: NotRequired[str]
    # Resource MIME type.
    mimeType: str
    # Resource charset.
    charset: str
    # Optional request headers, refined with what was actually sent.
    requestHeaders: NotRequired['Headers']
    # Optional raw text of the request headers.
    requestHeadersText: NotRequired[str]
    # Whether a physical connection was reused for this request.
    connectionReused: bool
    # Id of the physical connection that was used.
    connectionId: float
    # Optional remote IP address and port.
    remoteIPAddress: NotRequired[str]
    remotePort: NotRequired[int]
    # Optional flags telling where the response was served from.
    fromDiskCache: NotRequired[bool]
    fromServiceWorker: NotRequired[bool]
    fromPrefetchCache: NotRequired[bool]
    fromEarlyHints: NotRequired[bool]
    # Optional service worker static-router details.
    serviceWorkerRouterInfo: NotRequired['ServiceWorkerRouterInfo']
    # Total number of bytes received for this request so far.
    encodedDataLength: float
    # Optional timing information for the request.
    timing: NotRequired['ResourceTiming']
    # Optional response source of a response served by a service worker.
    serviceWorkerResponseSource: NotRequired[ServiceWorkerResponseSource]
    # Optional time at which the returned response was generated.
    responseTime: NotRequired['TimeSinceEpoch']
    # Optional cache storage cache name.
    cacheStorageCacheName: NotRequired[str]
    # Optional protocol used to fetch the resource.
    protocol: NotRequired[str]
    # Optional reason why the transport protocol was chosen.
    alternateProtocolUsage: NotRequired[AlternateProtocolUsage]
    # Security state of the request resource.
    securityState: SecurityState
    # Optional security details for the request.
    securityDetails: NotRequired['SecurityDetails']
    # Optional flag: whether the request was sent via IP protection.
    isIpProtectionUsed: NotRequired[bool]


class WebSocketRequest(TypedDict):
    """WebSocket request data."""

    # HTTP request headers of the WebSocket handshake.
    headers: 'Headers'


class WebSocketResponse(TypedDict):
    """WebSocket response data.

    ``status``, ``statusText`` and ``headers`` are required; the raw-text and
    request-header keys are optional.
    """

    # HTTP response status code.
    status: int
    # HTTP response status text.
    statusText: str
    # HTTP response headers.
    headers: 'Headers'
    # Optional raw text of the response headers.
    headersText: NotRequired[str]
    # Optional HTTP request headers.
    requestHeaders: NotRequired['Headers']
    # Optional raw text of the request headers.
    requestHeadersText: NotRequired[str]


class WebSocketFrame(TypedDict):
    """
    WebSocket message data. This represents an entire WebSocket message,
    not just a fragmented frame as the name suggests.

    All keys are required.
    """

    # WebSocket message opcode.
    opcode: float
    # WebSocket message mask flag.
    mask: bool
    # Message payload (per CDP: UTF-8 text when opcode is 1, otherwise base64).
    payloadData: str


class CachedResource(TypedDict):
    """Information about the cached resource.

    ``response`` is the only optional key.
    """

    # Resource URL.
    url: str
    # Type of this resource.
    type: ResourceType
    # Optional cached response data.
    response: NotRequired['Response']
    # Size of the cached response body.
    bodySize: float


class Initiator(TypedDict):
    """Information about the request initiator.

    Only ``type`` is required; every other key is optional.
    """

    # Type of the initiator, kept as a raw string (CDP values: parser, script,
    # preload, SignedExchange, preflight, other).
    type: str
    # Optional JavaScript stack trace of the initiator.
    stack: NotRequired[StackTrace]
    # Optional initiator URL.
    url: NotRequired[str]
    # Optional line / column in the initiator source.
    lineNumber: NotRequired[float]
    columnNumber: NotRequired[float]
    # Optional id of the request that initiated this one.
    requestId: NotRequired[RequestId]


class CookiePartitionKey(TypedDict):
    """
    cookiePartitionKey object. The representation of the components of the key that are created
    by the cookiePartitionKey class contained in net/cookies/cookie_partition_key.h.

    Both keys are required.
    """

    # Site of the top-level URL the browser was visiting when the cookie was set.
    topLevelSite: str
    # Whether the cookie was set in a context with a cross-site ancestor.
    hasCrossSiteAncestor: bool


class Cookie(TypedDict):
    """Cookie object.

    ``sameSite``, ``priority``, ``sameParty``, ``sourceScheme`` and
    ``partitionKey`` are optional; all other keys are required.
    """

    # Cookie name and value.
    name: str
    value: str
    # Cookie domain and path.
    domain: str
    path: str
    # Expiration date (CDP: seconds since the UNIX epoch).
    expires: float
    # Cookie size.
    size: int
    # True if the cookie is http-only.
    httpOnly: bool
    # True if the cookie is secure.
    secure: bool
    # True for a session cookie.
    session: bool
    # Optional SameSite type.
    sameSite: NotRequired[CookieSameSite]
    # Optional cookie priority.
    priority: NotRequired[CookiePriority]
    # Optional SameParty flag.
    sameParty: NotRequired[bool]
    # Optional source scheme of the origin that set the cookie.
    sourceScheme: NotRequired[CookieSourceScheme]
    # Source port of the cookie.
    sourcePort: int
    # Optional partition key.
    partitionKey: NotRequired['CookiePartitionKey']


class SetCookieBlockedReason(str, Enum):
    """Types of reasons why a cookie may not be stored from a response.

    Shares several values with CookieBlockedReason, which covers the sending
    direction instead.
    """

    SECURE_ONLY = 'SecureOnly'
    SAME_SITE_STRICT = 'SameSiteStrict'
    SAME_SITE_LAX = 'SameSiteLax'
    SAME_SITE_UNSPECIFIED_TREATED_AS_LAX = 'SameSiteUnspecifiedTreatedAsLax'
    SAME_SITE_NONE_INSECURE = 'SameSiteNoneInsecure'
    USER_PREFERENCES = 'UserPreferences'
    THIRD_PARTY_PHASEOUT = 'ThirdPartyPhaseout'
    THIRD_PARTY_BLOCKED_IN_FIRST_PARTY_SET = 'ThirdPartyBlockedInFirstPartySet'
    SYNTAX_ERROR = 'SyntaxError'
    SCHEME_NOT_SUPPORTED = 'SchemeNotSupported'
    OVERWRITE_SECURE = 'OverwriteSecure'
    INVALID_DOMAIN = 'InvalidDomain'
    INVALID_PREFIX = 'InvalidPrefix'
    UNKNOWN_ERROR = 'UnknownError'
    SCHEMEFUL_SAME_SITE_STRICT = 'SchemefulSameSiteStrict'
    SCHEMEFUL_SAME_SITE_LAX = 'SchemefulSameSiteLax'
    SCHEMEFUL_SAME_SITE_UNSPECIFIED_TREATED_AS_LAX = 'SchemefulSameSiteUnspecifiedTreatedAsLax'
    SAME_PARTY_FROM_CROSS_PARTY_CONTEXT = 'SamePartyFromCrossPartyContext'
    SAME_PARTY_CONFLICTS_WITH_OTHER_ATTRIBUTES = 'SamePartyConflictsWithOtherAttributes'
    NAME_VALUE_PAIR_EXCEEDS_MAX_SIZE = 'NameValuePairExceedsMaxSize'
    DISALLOWED_CHARACTER = 'DisallowedCharacter'
    NO_COOKIE_CONTENT = 'NoCookieContent'


class CookieBlockedReason(str, Enum):
    """Types of reasons why a cookie may not be sent with a request.

    Shares several values with SetCookieBlockedReason, which covers the
    storing direction instead.
    """

    SECURE_ONLY = 'SecureOnly'
    NOT_ON_PATH = 'NotOnPath'
    DOMAIN_MISMATCH = 'DomainMismatch'
    SAME_SITE_STRICT = 'SameSiteStrict'
    SAME_SITE_LAX = 'SameSiteLax'
    SAME_SITE_UNSPECIFIED_TREATED_AS_LAX = 'SameSiteUnspecifiedTreatedAsLax'
    SAME_SITE_NONE_INSECURE = 'SameSiteNoneInsecure'
    USER_PREFERENCES = 'UserPreferences'
    THIRD_PARTY_PHASEOUT = 'ThirdPartyPhaseout'
    THIRD_PARTY_BLOCKED_IN_FIRST_PARTY_SET = 'ThirdPartyBlockedInFirstPartySet'
    UNKNOWN_ERROR = 'UnknownError'
    SCHEMEFUL_SAME_SITE_STRICT = 'SchemefulSameSiteStrict'
    SCHEMEFUL_SAME_SITE_LAX = 'SchemefulSameSiteLax'
    SCHEMEFUL_SAME_SITE_UNSPECIFIED_TREATED_AS_LAX = 'SchemefulSameSiteUnspecifiedTreatedAsLax'
    SAME_PARTY_FROM_CROSS_PARTY_CONTEXT = 'SamePartyFromCrossPartyContext'
    NAME_VALUE_PAIR_EXCEEDS_MAX_SIZE = 'NameValuePairExceedsMaxSize'
    PORT_MISMATCH = 'PortMismatch'
    SCHEME_MISMATCH = 'SchemeMismatch'
    ANONYMOUS_CONTEXT = 'AnonymousContext'


class CookieExemptionReason(str, Enum):
    """
    Types of reasons why a cookie should have been blocked by 3PCD but is exempted for the request.
    """

    # The literal string 'None' (no exemption), not Python's None.
    NONE = 'None'
    USER_SETTING = 'UserSetting'
    TPCD_METADATA = 'TPCDMetadata'
    TPCD_DEPRECATION_TRIAL = 'TPCDDeprecationTrial'
    TOP_LEVEL_TPCD_DEPRECATION_TRIAL = 'TopLevelTPCDDeprecationTrial'
    TPCD_HEURISTICS = 'TPCDHeuristics'
    ENTERPRISE_POLICY = 'EnterprisePolicy'
    STORAGE_ACCESS = 'StorageAccess'
    TOP_LEVEL_STORAGE_ACCESS = 'TopLevelStorageAccess'
    SCHEME = 'Scheme'
    SAME_SITE_NONE_COOKIES_IN_SANDBOX = 'SameSiteNoneCookiesInSandbox'


class BlockedSetCookieWithReason(TypedDict):
    """A cookie which was not stored from a response with the corresponding reason.

    ``cookie`` is optional; the other two keys are required.
    """

    # Reason(s) this cookie was blocked.
    blockedReasons: list[SetCookieBlockedReason]
    # Raw cookie line as received (the text of the Set-Cookie header per CDP).
    cookieLine: str
    # Optional parsed cookie object.
    cookie: NotRequired['Cookie']


class ExemptedSetCookieWithReason(TypedDict):
    """
    A cookie should have been blocked by 3PCD but is exempted and stored from a response with
    the corresponding reason. A cookie could only have at most one exemption reason.

    All keys are required.
    """

    # The single reason the cookie was exempted.
    exemptionReason: CookieExemptionReason
    # Raw cookie line as received.
    cookieLine: str
    # The parsed cookie object.
    cookie: 'Cookie'


class AssociatedCookie(TypedDict):
    """
    A cookie associated with the request which may or may not be sent with it.
    Includes the cookie itself and reasons for blocking or exemption.

    ``exemptionReason`` is the only optional key.
    """

    # The cookie object for the possibly blocked cookie.
    cookie: 'Cookie'
    # Reason(s) the cookie was blocked.
    blockedReasons: list[CookieBlockedReason]
    # Optional reason the cookie was exempted from blocking.
    exemptionReason: NotRequired[CookieExemptionReason]


class CookieParam(TypedDict):
    """Cookie parameter object.

    Only ``name`` and ``value`` are required; every other key is optional.
    """

    # Cookie name and value.
    name: str
    value: str
    # Optional request URI to associate with the cookie.
    url: NotRequired[str]
    # Optional cookie domain and path.
    domain: NotRequired[str]
    path: NotRequired[str]
    # Optional secure / http-only flags.
    secure: NotRequired[bool]
    httpOnly: NotRequired[bool]
    # Optional SameSite type.
    sameSite: NotRequired[CookieSameSite]
    # Optional expiration date.
    expires: NotRequired['TimeSinceEpoch']
    # Optional cookie priority.
    priority: NotRequired[CookiePriority]
    # Optional SameParty flag.
    sameParty: NotRequired[bool]
    # Optional source scheme and port.
    sourceScheme: NotRequired[CookieSourceScheme]
    sourcePort: NotRequired[int]
    # Optional partition key.
    partitionKey: NotRequired['CookiePartitionKey']


class AuthChallenge(TypedDict):
    """Authorization challenge for HTTP status code 401 or 407.

    ``source`` is the only optional key.
    """

    # Optional source of the challenge (CDP values: Server, Proxy).
    source: NotRequired[str]
    # Origin of the challenger.
    origin: str
    # Authentication scheme of the challenge.
    scheme: str
    # Realm of the challenge.
    realm: str


class AuthChallengeResponse(TypedDict):
    """Response to an AuthChallenge.

    Only ``response`` is required; the credentials are optional keys.
    """

    # Decision on what to do with the challenge (CDP values: Default, CancelAuth,
    # ProvideCredentials).
    response: str
    # Optional username (CDP: only meaningful with ProvideCredentials).
    username: NotRequired[str]
    # Optional password (CDP: only meaningful with ProvideCredentials).
    password: NotRequired[str]


class InterceptionStage(str, Enum):
    """
    Stages of the interception to begin intercepting. ``REQUEST`` intercepts before the
    request is sent; ``HEADERS_RECEIVED`` intercepts after the response is received.
    """

    REQUEST = 'Request'
    HEADERS_RECEIVED = 'HeadersReceived'


class RequestPattern(TypedDict):
    """Request pattern for interception. All keys are optional."""

    # Optional URL pattern (CDP allows '*' and '?' wildcards).
    urlPattern: NotRequired[str]
    # Optional resource type to restrict the pattern to.
    resourceType: NotRequired[ResourceType]
    # Optional stage at which to begin intercepting.
    interceptionStage: NotRequired[InterceptionStage]


class SignedExchangeSignature(TypedDict):
    """Information about a signed exchange signature.

    ``certUrl``, ``certSha256`` and ``certificates`` are optional; the other
    keys are required.
    """

    # Signed exchange signature label.
    label: str
    # The signature itself (a hex string per CDP).
    signature: str
    # Signed exchange signature integrity.
    integrity: str
    # Optional certificate URL.
    certUrl: NotRequired[str]
    # Optional SHA-256 of the certificate (a hex string per CDP).
    certSha256: NotRequired[str]
    # Signed exchange signature validity URL.
    validityUrl: str
    # Signature date and expiry.
    date: int
    expires: int
    # Optional encoded certificates.
    certificates: NotRequired[list[str]]


class SignedExchangeHeader(TypedDict):
    """Information about a signed exchange header.

    All keys are required.
    """

    # Signed exchange request URL.
    requestUrl: str
    # Signed exchange response code.
    responseCode: int
    # Signed exchange response headers.
    responseHeaders: 'Headers'
    # Signed exchange response signatures.
    signatures: list[SignedExchangeSignature]
    # Signed exchange header integrity hash.
    headerIntegrity: str


class SignedExchangeErrorField(str, Enum):
    """Field type for a signed exchange related error.

    Protocol values are camelCase.
    """

    SIGNATURE_SIG = 'signatureSig'
    SIGNATURE_INTEGRITY = 'signatureIntegrity'
    SIGNATURE_CERT_URL = 'signatureCertUrl'
    SIGNATURE_CERT_SHA256 = 'signatureCertSha256'
    SIGNATURE_VALIDITY_URL = 'signatureValidityUrl'
    SIGNATURE_TIMESTAMPS = 'signatureTimestamps'


class SignedExchangeError(TypedDict):
    """Information about a signed exchange related error.

    Only ``message`` is required.
    """

    # Error message.
    message: str
    # Optional index of the signature that caused the error.
    signatureIndex: NotRequired[int]
    # Optional field that caused the error.
    errorField: NotRequired[SignedExchangeErrorField]


class SignedExchangeInfo(TypedDict):
    """Information about a signed exchange response.

    ``outerResponse`` and ``hasExtraInfo`` are required; the rest is optional.
    """

    # The outer response of the signed HTTP exchange.
    outerResponse: 'Response'
    # Whether extra-info events are going to be emitted for the request
    # (per the CDP description of this field).
    hasExtraInfo: bool
    # Optional header of the signed exchange.
    header: NotRequired[SignedExchangeHeader]
    # Optional security details for the signed exchange header.
    securityDetails: NotRequired['SecurityDetails']
    # Optional errors that occurred while handling the signed exchange.
    errors: NotRequired[list[SignedExchangeError]]


class ContentEncoding(str, Enum):
    """List of content encodings supported by the backend.

    Protocol values are the lower-case encoding tokens.
    """

    DEFLATE = 'deflate'
    GZIP = 'gzip'
    BR = 'br'
    ZSTD = 'zstd'


class DirectSocketDnsQueryType(str, Enum):
    """DNS query type used by the direct TCP / UDP socket options."""

    IPV4 = 'ipv4'
    IPV6 = 'ipv6'


class DirectTCPSocketOptions(TypedDict):
    """Options of a direct TCP socket. Only ``noDelay`` is required."""

    # TCP_NODELAY option.
    noDelay: bool
    # Optional keep-alive delay.
    keepAliveDelay: NotRequired[float]
    # Optional send / receive buffer sizes.
    sendBufferSize: NotRequired[float]
    receiveBufferSize: NotRequired[float]
    # Optional DNS query type.
    dnsQueryType: NotRequired[DirectSocketDnsQueryType]


class DirectUDPSocketOptions(TypedDict):
    """Options of a direct UDP socket. All keys are optional."""

    # Optional remote address and port.
    remoteAddr: NotRequired[str]
    remotePort: NotRequired[int]
    # Optional local address and port.
    localAddr: NotRequired[str]
    localPort: NotRequired[int]
    # Optional DNS query type.
    dnsQueryType: NotRequired[DirectSocketDnsQueryType]
    # Optional send / receive buffer sizes.
    sendBufferSize: NotRequired[float]
    receiveBufferSize: NotRequired[float]


class DirectUDPMessage(TypedDict):
    """A message on a direct UDP socket. Only ``data`` is required."""

    # Message payload (CDP: base64-encoded when passed over JSON).
    data: str
    # Optional remote address and port.
    remoteAddr: NotRequired[str]
    remotePort: NotRequired[int]


class PrivateNetworkRequestPolicy(str, Enum):
    """Private network request policy (type of ``ClientSecurityState.privateNetworkRequestPolicy``)."""

    ALLOW = 'Allow'
    BLOCK_FROM_INSECURE_TO_MORE_PRIVATE = 'BlockFromInsecureToMorePrivate'
    WARN_FROM_INSECURE_TO_MORE_PRIVATE = 'WarnFromInsecureToMorePrivate'
    PREFLIGHT_BLOCK = 'PreflightBlock'
    PREFLIGHT_WARN = 'PreflightWarn'


class IPAddressSpace(str, Enum):
    """IP address space (type of ``ClientSecurityState.initiatorIPAddressSpace``)."""

    LOOPBACK = 'Loopback'
    LOCAL = 'Local'
    PUBLIC = 'Public'
    UNKNOWN = 'Unknown'


class ConnectTiming(TypedDict):
    """Connection timing information for a request."""

    # Baseline timestamp in seconds (same role as ResourceTiming.requestTime
    # per the CDP spec).
    requestTime: float


class ClientSecurityState(TypedDict):
    """Security state of the client that initiated a request. All keys are required."""

    # Whether the initiator is a secure context.
    initiatorIsSecureContext: bool
    # IP address space of the initiator.
    initiatorIPAddressSpace: IPAddressSpace
    # Private network request policy in effect.
    privateNetworkRequestPolicy: PrivateNetworkRequestPolicy


class CrossOriginOpenerPolicyValue(str, Enum):
    """Cross-Origin-Opener-Policy value (used by CrossOriginOpenerPolicyStatus)."""

    SAME_ORIGIN = 'SameOrigin'
    SAME_ORIGIN_ALLOW_POPUPS = 'SameOriginAllowPopups'
    RESTRICT_PROPERTIES = 'RestrictProperties'
    UNSAFE_NONE = 'UnsafeNone'
    SAME_ORIGIN_PLUS_COEP = 'SameOriginPlusCoep'
    RESTRICT_PROPERTIES_PLUS_COEP = 'RestrictPropertiesPlusCoep'
    # Note the protocol spelling: 'Noopener' with a lower-case 'o'.
    NO_OPENER_ALLOW_POPUPS = 'NoopenerAllowPopups'


class CrossOriginOpenerPolicyStatus(TypedDict):
    """Cross-Origin-Opener-Policy status: enforced and report-only values.

    The two reporting-endpoint keys are optional.
    """

    # Enforced policy value.
    value: CrossOriginOpenerPolicyValue
    # Report-only policy value.
    reportOnlyValue: CrossOriginOpenerPolicyValue
    # Optional reporting endpoint for the enforced policy.
    reportingEndpoint: NotRequired[str]
    # Optional reporting endpoint for the report-only policy.
    reportOnlyReportingEndpoint: NotRequired[str]


class CrossOriginEmbedderPolicyValue(str, Enum):
    """Cross-Origin-Embedder-Policy value (used by CrossOriginEmbedderPolicyStatus)."""

    # The literal string 'None', not Python's None.
    NONE = 'None'
    CREDENTIALLESS = 'Credentialless'
    REQUIRE_CORP = 'RequireCorp'


class CrossOriginEmbedderPolicyStatus(TypedDict):
    """Cross-Origin-Embedder-Policy status: enforced and report-only values.

    The two reporting-endpoint keys are optional.
    """

    # Enforced policy value.
    value: CrossOriginEmbedderPolicyValue
    # Report-only policy value.
    reportOnlyValue: CrossOriginEmbedderPolicyValue
    # Optional reporting endpoint for the enforced policy.
    reportingEndpoint: NotRequired[str]
    # Optional reporting endpoint for the report-only policy.
    reportOnlyReportingEndpoint: NotRequired[str]


class ContentSecurityPolicySource(str, Enum):
    """Where a Content Security Policy came from (used by ContentSecurityPolicyStatus)."""

    HTTP = 'HTTP'
    META = 'Meta'


class ContentSecurityPolicyStatus(TypedDict):
    """Status of one Content Security Policy. All keys are required."""

    # Effective directives of the policy, as a single string.
    effectiveDirectives: str
    # Whether the policy is enforced.
    isEnforced: bool
    # Where the policy came from.
    source: ContentSecurityPolicySource


class SecurityIsolationStatus(TypedDict):
    """Security isolation status (COOP, COEP and CSP). All keys are optional."""

    # Optional Cross-Origin-Opener-Policy status.
    coop: NotRequired[CrossOriginOpenerPolicyStatus]
    # Optional Cross-Origin-Embedder-Policy status.
    coep: NotRequired[CrossOriginEmbedderPolicyStatus]
    # Optional list of Content Security Policy statuses.
    csp: NotRequired[list[ContentSecurityPolicyStatus]]


class ReportStatus(str, Enum):
    """The status of a Reporting API report (type of ``ReportingApiReport.status``)."""

    QUEUED = 'Queued'
    PENDING = 'Pending'
    MARKED_FOR_REMOVAL = 'MarkedForRemoval'
    SUCCESS = 'Success'


# Identifier of a Reporting API report.
# Declared as a plain alias, like the other protocol identifiers in this module
# (LoaderId, RequestId, InterceptionId): identifiers arrive from CDP as ordinary
# JSON strings, and a dedicated ``str`` subclass would make those raw strings
# fail to type-check wherever a ReportId is expected.
ReportId = str


class ReportingApiReport(TypedDict):
    """An object representing a report generated by the Reporting API.

    All keys are required.
    """

    # Identifier of the report.
    id: ReportId
    # URL of the document that triggered the report.
    initiatorUrl: str
    # Name of the endpoint group the report should be delivered to.
    destination: str
    # Type of the report, kept as a raw string.
    type: str
    # When the report was generated.
    timestamp: TimeSinceEpoch
    # How many uploads deep the related request was.
    depth: int
    # Number of delivery attempts made so far.
    completedAttempts: int
    # Report body as an untyped mapping.
    body: dict
    # Delivery status of the report.
    status: ReportStatus


class ReportingApiEndpoint(TypedDict):
    """A Reporting API endpoint. Both keys are required."""

    # URL of the endpoint to which reports may be delivered.
    url: str
    # Name of the endpoint group.
    groupName: str


class LoadNetworkResourcePageResult(TypedDict):
    """An object providing the result of a network resource load.

    Only ``success`` is required; every other key is optional.
    """

    # Whether the load succeeded.
    success: bool
    # Optional numeric network error, used for error reporting.
    netError: NotRequired[float]
    # Optional symbolic name of the network error.
    netErrorName: NotRequired[str]
    # Optional HTTP status code of the response.
    httpStatusCode: NotRequired[float]
    # Optional handle of the stream holding the loaded resource.
    stream: NotRequired[str]
    # Optional response headers.
    headers: NotRequired['Headers']


class LoadNetworkResourceOptions(TypedDict):
    """An options object that may be extended later to better support CORS, CORB and streaming.

    Both keys are required.
    """

    # Whether the cache is disabled for this load.
    disableCache: bool
    # Whether credentials are included with the request.
    includeCredentials: bool


================================================
FILE: pydoll/protocol/page/__init__.py
================================================
"""Page domain implementation."""


================================================
FILE: pydoll/protocol/page/events.py
================================================
from enum import Enum

from typing_extensions import NotRequired, TypedDict

from pydoll.protocol.base import CDPEvent
from pydoll.protocol.dom.types import BackendNodeId
from pydoll.protocol.network.types import LoaderId, MonotonicTime
from pydoll.protocol.page.types import (
    BackForwardCacheNotRestoredExplanation,
    BackForwardCacheNotRestoredExplanationTree,
    ClientNavigationDisposition,
    ClientNavigationReason,
    DialogType,
    Frame,
    FrameId,
    NavigationType,
    ScreencastFrameMetadata,
)
from pydoll.protocol.runtime.types import StackTrace


class PageEvent(str, Enum):
    """
    Events from the Page domain of the Chrome DevTools Protocol.

    This enumeration contains the names of Page-related events that can be
    received from the Chrome DevTools Protocol. These events provide information
    about page lifecycle, frame navigation, JavaScript dialogs, and other
    page-related activities.
    """

    DOM_CONTENT_EVENT_FIRED = 'Page.domContentEventFired'
    """
    Fired when DOMContentLoaded event is fired.

    Args:
        timestamp (Network.MonotonicTime): Timestamp when the event occurred.
    """

    FILE_CHOOSER_OPENED = 'Page.fileChooserOpened'
    """
    Emitted only when page.interceptFileChooser is enabled.

    Args:
        frameId (FrameId): Id of the frame containing input node.
        mode (str): Input mode. Allowed Values: selectSingle, selectMultiple
        backendNodeId (DOM.BackendNodeId): Input node id. Only present for file choosers
            opened via an <input type="file"> element.
    """

    FRAME_ATTACHED = 'Page.frameAttached'
    """
    Fired when frame has been attached to its parent.

    Args:
        frameId (FrameId): Id of the frame that has been attached.
        parentFrameId (FrameId): Parent frame identifier.
        stack (Runtime.StackTrace): JavaScript stack trace of when frame was attached,
            only set if frame initiated from script.
    """

    FRAME_DETACHED = 'Page.frameDetached'
    """
    Fired when frame has been detached from its parent.

    Args:
        frameId (FrameId): Id of the frame that has been detached.
        reason (str): Reason why the frame was detached.
            Allowed Values: remove, swap
    """

    FRAME_NAVIGATED = 'Page.frameNavigated'
    """
    Fired once navigation of the frame has completed. Frame is now associated with the new loader.

    Args:
        frame (Frame): Frame object.
        type (NavigationType): Type of navigation.
    """

    INTERSTITIAL_HIDDEN = 'Page.interstitialHidden'
    """
    Fired when interstitial page was hidden.
    """

    INTERSTITIAL_SHOWN = 'Page.interstitialShown'
    """
    Fired when interstitial page was shown.
    """

    JAVASCRIPT_DIALOG_CLOSED = 'Page.javascriptDialogClosed'
    """
    Fired when a JavaScript initiated dialog (alert, confirm, prompt, or onbeforeunload)
    has been closed.

    Args:
        frameId (FrameId): Frame id.
        result (bool): Whether dialog was confirmed.
        userInput (str): User input in case of prompt.
    """

    JAVASCRIPT_DIALOG_OPENING = 'Page.javascriptDialogOpening'
    """
    Fired when a JavaScript initiated dialog (alert, confirm, prompt, or onbeforeunload)
    is about to open.

    Args:
        url (str): Frame url.
        frameId (FrameId): Frame id.
        message (str): Message that will be displayed by the dialog.
        type (DialogType): Dialog type.
        hasBrowserHandler (bool): True if browser is capable showing or acting on the given dialog.
            When browser has no dialog handler for given target, calling alert while Page domain
            is engaged will stall the page execution. Execution can be resumed via calling
            Page.handleJavaScriptDialog.
        defaultPrompt (str): Default dialog prompt.
    """

    LIFECYCLE_EVENT = 'Page.lifecycleEvent'
    """
    Fired for lifecycle events (navigation, load, paint, etc) in the current target
    (including local frames).

    Args:
        frameId (FrameId): Id of the frame.
        loaderId (Network.LoaderId): Loader identifier. Empty string if the request is
            fetched from worker.
        name (str): Lifecycle event name.
        timestamp (Network.MonotonicTime): Timestamp when the event occurred.
    """

    LOAD_EVENT_FIRED = 'Page.loadEventFired'
    """
    Fired when the page load event has fired.

    Args:
        timestamp (Network.MonotonicTime): Timestamp when the event occurred.
    """

    WINDOW_OPEN = 'Page.windowOpen'
    """
    Fired when a new window is going to be opened, via window.open(), link click,
    form submission, etc.

    Args:
        url (str): The URL for the new window.
        windowName (str): Window name.
        windowFeatures (array[str]): An array of enabled window features.
        userGesture (bool): Whether or not it was triggered by user gesture.
    """

    BACK_FORWARD_CACHE_NOT_USED = 'Page.backForwardCacheNotUsed'
    """
    Fired for failed bfcache history navigations if BackForwardCache feature is enabled.
    Do not assume any ordering with the Page.frameNavigated event. This event is fired
    only for main-frame history navigation where the document changes (non-same-document
    navigations), when bfcache navigation fails.

    Args:
        loaderId (Network.LoaderId): The loader id for the associated navigation.
        frameId (FrameId): The frame id of the associated frame.
        notRestoredExplanations (array[BackForwardCacheNotRestoredExplanation]): Array of reasons
            why the page could not be cached. This must not be empty.
        notRestoredExplanationsTree (BackForwardCacheNotRestoredExplanationTree): Tree structure
            of reasons why the page could not be cached for each frame.
    """

    COMPILATION_CACHE_PRODUCED = 'Page.compilationCacheProduced'
    """
    Issued for every compilation cache generated. Is only available if
    Page.setGenerateCompilationCache is enabled.

    Args:
        url (str): The URL of the document whose compilation cache was produced.
        data (str): Base64-encoded data (Encoded as a base64 string when passed over JSON).
    """

    DOCUMENT_OPENED = 'Page.documentOpened'
    """
    Fired when opening document to write to.

    Args:
        frame (Frame): Frame object.
    """

    FRAME_REQUESTED_NAVIGATION = 'Page.frameRequestedNavigation'
    """
    Fired when a renderer-initiated navigation is requested.
    Navigation may still be cancelled after the event is issued.

    Args:
        frameId (FrameId): Id of the frame that is being navigated.
        reason (ClientNavigationReason): The reason for the navigation.
        url (str): The destination URL for the requested navigation.
        disposition (ClientNavigationDisposition): The disposition for the navigation.
    """

    FRAME_RESIZED = 'Page.frameResized'
    """
    Fired when frame has been resized.
    """

    FRAME_STARTED_LOADING = 'Page.frameStartedLoading'
    """
    Fired when frame has started loading.

    Args:
        frameId (FrameId): Id of the frame that has started loading.
    """

    FRAME_STARTED_NAVIGATING = 'Page.frameStartedNavigating'
    """
    Fired when a navigation starts. This event is fired for both renderer-initiated
    and browser-initiated navigations. For renderer-initiated navigations, the event
    is fired after frameRequestedNavigation. Navigation may still be cancelled after
    the event is issued. Multiple events can be fired for a single navigation, for example,
    when a same-document navigation becomes a cross-document navigation (such as in the
    case of a frameset).

    Args:
        frameId (FrameId): ID of the frame that is being navigated.
        url (str): The URL the navigation started with. The final URL can be different.
        loaderId (Network.LoaderId): Loader identifier. Even though it is present in case
            of same-document navigation, the previously committed loaderId would not change
            unless the navigation changes from a same-document to a cross-document navigation.
        navigationType (str): Type of navigation.
            Allowed Values: reload, reloadBypassingCache, restore, restoreWithPost,
            historySameDocument, historyDifferentDocument, sameDocument, differentDocument
    """

    FRAME_STOPPED_LOADING = 'Page.frameStoppedLoading'
    """
    Fired when frame has stopped loading.

    Args:
        frameId (FrameId): Id of the frame that has stopped loading.
    """

    FRAME_SUBTREE_WILL_BE_DETACHED = 'Page.frameSubtreeWillBeDetached'
    """
    Fired before frame subtree is detached. Emitted before any frame of the subtree
    is actually detached.

    Args:
        frameId (FrameId): Id of the frame that is the root of the subtree that will be detached.
    """

    NAVIGATED_WITHIN_DOCUMENT = 'Page.navigatedWithinDocument'
    """
    Fired when same-document navigation happens, e.g. due to history API usage or anchor navigation.

    Args:
        frameId (FrameId): Id of the frame.
        url (str): Frame's new url.
        navigationType (str): Navigation type.
            Allowed Values: fragment, historyApi, other
    """

    SCREENCAST_FRAME = 'Page.screencastFrame'
    """
    Compressed image data requested by the startScreencast.

    Args:
        data (str): Base64-encoded compressed image.
        metadata (ScreencastFrameMetadata): Screencast frame metadata.
        sessionId (int): Frame number.
    """

    SCREENCAST_VISIBILITY_CHANGED = 'Page.screencastVisibilityChanged'
    """
    Fired when the page with currently enabled screencast was shown or hidden.

    Args:
        visible (bool): True if the page is visible.
    """
    DOWNLOAD_WILL_BEGIN = 'Page.downloadWillBegin'
    DOWNLOAD_PROGRESS = 'Page.downloadProgress'


class DomContentEventFiredEventParams(TypedDict):
    """Payload of ``PageEvent.DOM_CONTENT_EVENT_FIRED``."""

    # Timestamp when the event occurred.
    timestamp: MonotonicTime


class FileChooserOpenedEventParams(TypedDict):
    """Payload of ``PageEvent.FILE_CHOOSER_OPENED``."""

    # Id of the frame containing the input node.
    frameId: FrameId
    # Input mode; the event documentation lists selectSingle and selectMultiple.
    mode: str
    # Optional: only present for choosers opened via an <input type="file"> element.
    backendNodeId: NotRequired[BackendNodeId]


class FrameAttachedEventParams(TypedDict):
    """Payload of ``PageEvent.FRAME_ATTACHED``."""

    # Id of the frame that has been attached.
    frameId: FrameId
    # Parent frame identifier.
    parentFrameId: FrameId
    # Optional: JavaScript stack trace, only set if the frame was initiated from script.
    stack: NotRequired[StackTrace]


class FrameClearedScheduledNavigationEventParams(TypedDict):
    """Payload wrapped by ``FrameClearedScheduledNavigationEvent``; carries only the frame id."""

    frameId: FrameId


class FrameDetachedEventParams(TypedDict):
    """Payload of ``PageEvent.FRAME_DETACHED``."""

    # Id of the frame that has been detached.
    frameId: FrameId
    # Why the frame was detached; the event documentation lists remove and swap.
    reason: str


class FrameSubtreeWillBeDetachedEventParams(TypedDict):
    """Payload of ``PageEvent.FRAME_SUBTREE_WILL_BE_DETACHED``."""

    # Id of the frame that is the root of the subtree that will be detached.
    frameId: FrameId


class FrameNavigatedEventParams(TypedDict):
    """Payload of ``PageEvent.FRAME_NAVIGATED``."""

    # Frame object.
    frame: Frame
    # Type of navigation.
    type: NavigationType


class DocumentOpenedEventParams(TypedDict):
    """Payload of ``PageEvent.DOCUMENT_OPENED``."""

    # Frame object.
    frame: Frame


class FrameResizedEventParams(TypedDict):
    """Payload of ``PageEvent.FRAME_RESIZED``; declares no keys."""

    pass


class FrameStartedNavigatingEventParams(TypedDict):
    """Payload of ``PageEvent.FRAME_STARTED_NAVIGATING``."""

    # Id of the frame that is being navigated.
    frameId: FrameId
    # URL the navigation started with; the final URL can be different.
    url: str
    # Loader identifier.
    loaderId: LoaderId
    # Type of navigation, kept as a raw string (allowed values are listed on the enum member).
    navigationType: str


class FrameRequestedNavigationEventParams(TypedDict):
    """Payload of ``PageEvent.FRAME_REQUESTED_NAVIGATION``."""

    # Id of the frame that is being navigated.
    frameId: FrameId
    # The reason for the navigation.
    reason: ClientNavigationReason
    # The destination URL for the requested navigation.
    url: str
    # The disposition for the navigation.
    disposition: ClientNavigationDisposition


class FrameScheduledNavigationEventParams(TypedDict):
    """Payload wrapped by ``FrameScheduledNavigationEvent``; every key is required."""

    frameId: FrameId
    # NOTE(review): presumably a delay in seconds, per the CDP event of the same name; confirm.
    delay: float
    reason: ClientNavigationReason
    url: str


class FrameStartedLoadingEventParams(TypedDict):
    """Payload of ``PageEvent.FRAME_STARTED_LOADING``."""

    # Id of the frame that has started loading.
    frameId: FrameId


class FrameStoppedLoadingEventParams(TypedDict):
    """Payload of ``PageEvent.FRAME_STOPPED_LOADING``."""

    # Id of the frame that has stopped loading.
    frameId: FrameId


class DownloadWillBeginEventParams(TypedDict):
    """Payload of ``PageEvent.DOWNLOAD_WILL_BEGIN``; every key is required."""

    frameId: FrameId
    # Shares its name with ``DownloadProgressEventParams.guid``; presumably the same
    # download identifier -- confirm against the protocol.
    guid: str
    url: str
    suggestedFilename: str


class DownloadProgressEventParams(TypedDict):
    """Payload of ``PageEvent.DOWNLOAD_PROGRESS``; every key is required."""

    guid: str
    # Byte counters are typed as float rather than int.
    totalBytes: float
    receivedBytes: float
    # Kept as a raw string; the set of allowed values is not declared here.
    state: str


class InterstitialHiddenEventParams(TypedDict):
    """Payload of ``PageEvent.INTERSTITIAL_HIDDEN``; declares no keys."""

    pass


class InterstitialShownEventParams(TypedDict):
    """Payload of ``PageEvent.INTERSTITIAL_SHOWN``; declares no keys."""

    pass


class JavascriptDialogClosedEventParams(TypedDict):
    """Payload of ``PageEvent.JAVASCRIPT_DIALOG_CLOSED``."""

    # Frame id.
    frameId: FrameId
    # Whether the dialog was confirmed.
    result: bool
    # User input in case of prompt.
    userInput: str


class JavascriptDialogOpeningEventParams(TypedDict):
    """Payload of ``PageEvent.JAVASCRIPT_DIALOG_OPENING``."""

    # Frame url.
    url: str
    # Frame id.
    frameId: FrameId
    # Message that will be displayed by the dialog.
    message: str
    # Dialog type.
    type: DialogType
    # True if the browser is capable of showing or acting on the given dialog.
    hasBrowserHandler: bool
    # Optional: default dialog prompt.
    defaultPrompt: NotRequired[str]


class LifecycleEventEventParams(TypedDict):
    """Payload of ``PageEvent.LIFECYCLE_EVENT``."""

    # Id of the frame.
    frameId: FrameId
    # Loader identifier; empty string if the request is fetched from a worker.
    loaderId: LoaderId
    # Lifecycle event name.
    name: str
    # Timestamp when the event occurred.
    timestamp: MonotonicTime


class BackForwardCacheNotUsedEventParams(TypedDict):
    """Payload of ``PageEvent.BACK_FORWARD_CACHE_NOT_USED``."""

    # The loader id for the associated navigation.
    loaderId: LoaderId
    # The frame id of the associated frame.
    frameId: FrameId
    # Reasons why the page could not be cached; documented as never empty.
    notRestoredExplanations: list[BackForwardCacheNotRestoredExplanation]
    # Optional: per-frame tree of reasons why the page could not be cached.
    notRestoredExplanationsTree: NotRequired[BackForwardCacheNotRestoredExplanationTree]


class LoadEventFiredEventParams(TypedDict):
    """Payload of ``PageEvent.LOAD_EVENT_FIRED``."""

    # Timestamp when the event occurred.
    timestamp: MonotonicTime


class NavigatedWithinDocumentEventParams(TypedDict):
    """Payload of ``PageEvent.NAVIGATED_WITHIN_DOCUMENT``."""

    # Id of the frame.
    frameId: FrameId
    # Frame's new url.
    url: str
    # Navigation type; the event documentation lists fragment, historyApi and other.
    navigationType: str


class ScreencastFrameEventParams(TypedDict):
    """Payload of ``PageEvent.SCREENCAST_FRAME``."""

    # Base64-encoded compressed image.
    data: str
    # Screencast frame metadata.
    metadata: ScreencastFrameMetadata
    # Frame number; ``ScreencastFrameAckParams`` declares a key of the same name.
    sessionId: int


class ScreencastVisibilityChangedEventParams(TypedDict):
    """Payload of ``PageEvent.SCREENCAST_VISIBILITY_CHANGED``."""

    # True if the page is visible.
    visible: bool


class WindowOpenEventParams(TypedDict):
    """Payload of ``PageEvent.WINDOW_OPEN``."""

    # The URL for the new window.
    url: str
    # Window name.
    windowName: str
    # Enabled window features.
    windowFeatures: list[str]
    # Whether or not the open was triggered by a user gesture.
    userGesture: bool


class CompilationCacheProducedEventParams(TypedDict):
    """Payload of ``PageEvent.COMPILATION_CACHE_PRODUCED``."""

    # The URL of the document whose compilation cache was produced.
    url: str
    # Base64-encoded data.
    data: str


# Concrete event types for the Page domain: each alias is ``CDPEvent``
# parameterised with the payload TypedDict of the same name (minus the
# ``Params`` suffix) defined above.
DomContentEventFiredEvent = CDPEvent[DomContentEventFiredEventParams]
FileChooserOpenedEvent = CDPEvent[FileChooserOpenedEventParams]
FrameAttachedEvent = CDPEvent[FrameAttachedEventParams]
FrameClearedScheduledNavigationEvent = CDPEvent[FrameClearedScheduledNavigationEventParams]
FrameDetachedEvent = CDPEvent[FrameDetachedEventParams]
FrameSubtreeWillBeDetachedEvent = CDPEvent[FrameSubtreeWillBeDetachedEventParams]
FrameNavigatedEvent = CDPEvent[FrameNavigatedEventParams]
DocumentOpenedEvent = CDPEvent[DocumentOpenedEventParams]
FrameResizedEvent = CDPEvent[FrameResizedEventParams]
FrameStartedNavigatingEvent = CDPEvent[FrameStartedNavigatingEventParams]
FrameRequestedNavigationEvent = CDPEvent[FrameRequestedNavigationEventParams]
FrameScheduledNavigationEvent = CDPEvent[FrameScheduledNavigationEventParams]
FrameStartedLoadingEvent = CDPEvent[FrameStartedLoadingEventParams]
FrameStoppedLoadingEvent = CDPEvent[FrameStoppedLoadingEventParams]
DownloadWillBeginEvent = CDPEvent[DownloadWillBeginEventParams]
DownloadProgressEvent = CDPEvent[DownloadProgressEventParams]
InterstitialHiddenEvent = CDPEvent[InterstitialHiddenEventParams]
InterstitialShownEvent = CDPEvent[InterstitialShownEventParams]
JavascriptDialogClosedEvent = CDPEvent[JavascriptDialogClosedEventParams]
JavascriptDialogOpeningEvent = CDPEvent[JavascriptDialogOpeningEventParams]
LifecycleEventEvent = CDPEvent[LifecycleEventEventParams]
BackForwardCacheNotUsedEvent = CDPEvent[BackForwardCacheNotUsedEventParams]
LoadEventFiredEvent = CDPEvent[LoadEventFiredEventParams]
NavigatedWithinDocumentEvent = CDPEvent[NavigatedWithinDocumentEventParams]
ScreencastFrameEvent = CDPEvent[ScreencastFrameEventParams]
ScreencastVisibilityChangedEvent = CDPEvent[ScreencastVisibilityChangedEventParams]
WindowOpenEvent = CDPEvent[WindowOpenEventParams]
CompilationCacheProducedEvent = CDPEvent[CompilationCacheProducedEventParams]


================================================
FILE: pydoll/protocol/page/methods.py
================================================
from enum import Enum

from typing_extensions import NotRequired, TypedDict

from pydoll.protocol.base import Command, EmptyParams, EmptyResponse, Response
from pydoll.protocol.debugger.types import SearchMatch
from pydoll.protocol.dom.types import Rect
from pydoll.protocol.io.types import StreamHandle
from pydoll.protocol.network.types import LoaderId
from pydoll.protocol.page.types import (
    AdScriptAncestry,
    AppManifestError,
    AppManifestParsedProperties,
    AutoResponseMode,
    CompilationCacheParams,
    FontFamilies,
    FontSizes,
    FrameId,
    FrameResourceTree,
    FrameTree,
    InstallabilityError,
    LayoutViewport,
    NavigationEntry,
    OriginTrial,
    PermissionsPolicyFeatureState,
    ReferrerPolicy,
    ScreencastFormat,
    ScreenshotFormat,
    ScriptFontFamilies,
    ScriptIdentifier,
    TransferMode,
    TransitionType,
    Viewport,
    VisualViewport,
    WebAppManifest,
    WebLifecycleState,
)
from pydoll.protocol.runtime.types import ExecutionContextId


class PageMethod(str, Enum):
    """
    Method names of the Page domain of the Chrome DevTools Protocol.

    Each member's value is the wire name sent in the ``method`` field of a
    command. Members are ``str`` subclasses, so they compare equal to that
    wire name (for example ``PageMethod.NAVIGATE == 'Page.navigate'``).
    """

    ADD_SCRIPT_TO_EVALUATE_ON_LOAD = 'Page.addScriptToEvaluateOnLoad'
    ADD_SCRIPT_TO_EVALUATE_ON_NEW_DOCUMENT = 'Page.addScriptToEvaluateOnNewDocument'
    BRING_TO_FRONT = 'Page.bringToFront'
    CAPTURE_SCREENSHOT = 'Page.captureScreenshot'
    CAPTURE_SNAPSHOT = 'Page.captureSnapshot'
    CLEAR_COMPILATION_CACHE = 'Page.clearCompilationCache'
    CLOSE = 'Page.close'
    CRASH = 'Page.crash'
    CREATE_ISOLATED_WORLD = 'Page.createIsolatedWorld'
    DISABLE = 'Page.disable'
    ENABLE = 'Page.enable'
    GENERATE_TEST_REPORT = 'Page.generateTestReport'
    # Method name matching the GetAdScriptAncestry* params/result/command types
    # declared in this module; the ``...Ids`` variant below is kept for
    # backward compatibility.
    GET_AD_SCRIPT_ANCESTRY = 'Page.getAdScriptAncestry'
    GET_AD_SCRIPT_ANCESTRY_IDS = 'Page.getAdScriptAncestryIds'
    GET_APP_ID = 'Page.getAppId'
    GET_APP_MANIFEST = 'Page.getAppManifest'
    GET_FRAME_TREE = 'Page.getFrameTree'
    GET_INSTALLABILITY_ERRORS = 'Page.getInstallabilityErrors'
    GET_LAYOUT_METRICS = 'Page.getLayoutMetrics'
    GET_MANIFEST_ICONS = 'Page.getManifestIcons'
    GET_NAVIGATION_HISTORY = 'Page.getNavigationHistory'
    GET_ORIGIN_TRIALS = 'Page.getOriginTrials'
    GET_PERMISSIONS_POLICY_STATE = 'Page.getPermissionsPolicyState'
    GET_RESOURCE_CONTENT = 'Page.getResourceContent'
    GET_RESOURCE_TREE = 'Page.getResourceTree'
    HANDLE_JAVASCRIPT_DIALOG = 'Page.handleJavaScriptDialog'
    NAVIGATE = 'Page.navigate'
    NAVIGATE_TO_HISTORY_ENTRY = 'Page.navigateToHistoryEntry'
    PRINT_TO_PDF = 'Page.printToPDF'
    PRODUCE_COMPILATION_CACHE = 'Page.produceCompilationCache'
    RELOAD = 'Page.reload'
    REMOVE_SCRIPT_TO_EVALUATE_ON_LOAD = 'Page.removeScriptToEvaluateOnLoad'
    REMOVE_SCRIPT_TO_EVALUATE_ON_NEW_DOCUMENT = 'Page.removeScriptToEvaluateOnNewDocument'
    RESET_NAVIGATION_HISTORY = 'Page.resetNavigationHistory'
    SCREENCAST_FRAME_ACK = 'Page.screencastFrameAck'
    SEARCH_IN_RESOURCE = 'Page.searchInResource'
    SET_AD_BLOCKING_ENABLED = 'Page.setAdBlockingEnabled'
    SET_BYPASS_CSP = 'Page.setBypassCSP'
    SET_DOCUMENT_CONTENT = 'Page.setDocumentContent'
    SET_FONT_FAMILIES = 'Page.setFontFamilies'
    SET_FONT_SIZES = 'Page.setFontSizes'
    SET_INTERCEPT_FILE_CHOOSER_DIALOG = 'Page.setInterceptFileChooserDialog'
    SET_LIFECYCLE_EVENTS_ENABLED = 'Page.setLifecycleEventsEnabled'
    SET_PRERENDERING_ALLOWED = 'Page.setPrerenderingAllowed'
    SET_RPH_REGISTRATION_MODE = 'Page.setRPHRegistrationMode'
    SET_SPC_TRANSACTION_MODE = 'Page.setSPCTransactionMode'
    SET_WEB_LIFECYCLE_STATE = 'Page.setWebLifecycleState'
    START_SCREENCAST = 'Page.startScreencast'
    STOP_LOADING = 'Page.stopLoading'
    STOP_SCREENCAST = 'Page.stopScreencast'
    WAIT_FOR_DEBUGGER = 'Page.waitForDebugger'
    ADD_COMPILATION_CACHE = 'Page.addCompilationCache'


class AddScriptToEvaluateOnNewDocumentParams(TypedDict):
    """
    Parameters for addScriptToEvaluateOnNewDocument.

    Only ``source`` is required; the remaining keys are optional.
    """

    source: str
    worldName: NotRequired[str]
    includeCommandLineAPI: NotRequired[bool]
    runImmediately: NotRequired[bool]


class CaptureScreenshotParams(TypedDict, total=False):
    """
    Parameters for captureScreenshot.

    Declared with ``total=False``: every key is optional.
    """

    format: ScreenshotFormat
    quality: int
    clip: Viewport
    fromSurface: bool
    captureBeyondViewport: bool
    optimizeForSpeed: bool


class CaptureSnapshotParams(TypedDict, total=False):
    """
    Parameters for captureSnapshot.

    Declared with ``total=False``: the single key is optional.
    """

    # Kept as a raw string; no enum of snapshot formats is used here.
    format: str


class CreateIsolatedWorldParams(TypedDict):
    """
    Parameters for createIsolatedWorld.

    Only ``frameId`` is required.
    """

    frameId: FrameId
    worldName: NotRequired[str]
    # NOTE(review): the spelling "Univeral" presumably mirrors the protocol's own
    # key name; confirm against the CDP reference before "correcting" it.
    grantUniveralAccess: NotRequired[bool]


class GetAppManifestParams(TypedDict, total=False):
    """
    Parameters for getAppManifest.

    Declared with ``total=False``: ``manifestId`` is optional.
    """

    manifestId: str


class GetAdScriptAncestryParams(TypedDict):
    """
    Parameters for getAdScriptAncestry.

    Used by ``GetAdScriptAncestryCommand``; ``frameId`` is required.
    """

    frameId: FrameId


class GetPermissionsPolicyStateParams(TypedDict):
    """
    Parameters for getPermissionsPolicyState.

    ``frameId`` is required.
    """

    frameId: FrameId


class GetOriginTrialsParams(TypedDict):
    """
    Parameters for getOriginTrials.

    ``frameId`` is required.
    """

    frameId: FrameId


class GetResourceContentParams(TypedDict):
    """
    Parameters for getResourceContent.

    Both keys are required.
    """

    frameId: FrameId
    url: str


class HandleJavaScriptDialogParams(TypedDict):
    """
    Parameters for handleJavaScriptDialog.

    ``accept`` is required; ``promptText`` is optional.
    """

    accept: bool
    promptText: NotRequired[str]


class NavigateParams(TypedDict):
    """
    Parameters for navigate.

    Only ``url`` is required; the remaining keys are optional.
    """

    url: str
    referrer: NotRequired[str]
    transitionType: NotRequired[TransitionType]
    frameId: NotRequired[FrameId]
    referrerPolicy: NotRequired[ReferrerPolicy]


class NavigateToHistoryEntryParams(TypedDict):
    """
    Parameters for navigateToHistoryEntry.

    ``entryId`` is required.
    """

    entryId: int


class EnableParams(TypedDict):
    """Parameters used by ``EnableCommand``; the single key is optional."""

    enableFileChooserOpenedEvent: NotRequired[bool]


class PrintToPDFParams(TypedDict, total=False):
    """
    Parameters for printToPDF.

    Declared with ``total=False``: every key is optional.
    """

    landscape: bool
    displayHeaderFooter: bool
    printBackground: bool
    scale: float
    # Paper size and margins are floats; their unit is not stated in this module.
    paperWidth: float
    paperHeight: float
    marginTop: float
    marginBottom: float
    marginLeft: float
    marginRight: float
    pageRanges: str
    headerTemplate: str
    footerTemplate: str
    preferCSSPageSize: bool
    transferMode: TransferMode
    generateTaggedPDF: bool
    generateDocumentOutline: bool


class ReloadParams(TypedDict, total=False):
    """
    Parameters for reload.

    Declared with ``total=False``: every key is optional.
    """

    ignoreCache: bool
    scriptToEvaluateOnLoad: str
    loaderId: LoaderId


class RemoveScriptToEvaluateOnNewDocumentParams(TypedDict):
    """
    Parameters for removeScriptToEvaluateOnNewDocument.

    ``identifier`` is required; ``AddScriptToEvaluateOnNewDocumentResult`` declares a
    key of the same name and type.
    """

    identifier: ScriptIdentifier


class ScreencastFrameAckParams(TypedDict):
    """
    Parameters for screencastFrameAck.

    ``sessionId`` is required.
    """

    sessionId: int


class SearchInResourceParams(TypedDict):
    """
    Parameters for searchInResource.

    ``frameId``, ``url`` and ``query`` are required; the two flags are optional.
    """

    frameId: FrameId
    url: str
    query: str
    caseSensitive: NotRequired[bool]
    isRegex: NotRequired[bool]


class SetAdBlockingEnabledParams(TypedDict):
    """
    Parameters for setAdBlockingEnabled.

    ``enabled`` is required.
    """

    enabled: bool


class SetBypassCSPParams(TypedDict):
    """
    Parameters for setBypassCSP.

    ``enabled`` is required.
    """

    enabled: bool


class AddScriptToEvaluateOnLoadParams(TypedDict):
    """
    Parameters for addScriptToEvaluateOnLoad.

    ``scriptSource`` is required.
    """

    scriptSource: str


class SetDocumentContentParams(TypedDict):
    """
    Parameters for setDocumentContent.

    Both keys are required.
    """

    frameId: FrameId
    html: str


class SetInterceptFileChooserDialogParams(TypedDict):
    """
    Parameters for setInterceptFileChooserDialog.

    ``enabled`` is required; ``cancel`` is optional.
    """

    enabled: bool
    cancel: NotRequired[bool]


class SetLifecycleEventsEnabledParams(TypedDict):
    """
    Parameters for setLifecycleEventsEnabled.

    ``enabled`` is required.
    """

    enabled: bool


class AddCompilationCacheParams(TypedDict):
    """
    Parameters for addCompilationCache.

    Both keys are required.
    """

    url: str
    # NOTE(review): presumably base64-encoded, like the ``data`` of the
    # compilationCacheProduced event; confirm against the protocol.
    data: str


class GenerateTestReportParams(TypedDict):
    """
    Parameters for generateTestReport.

    ``message`` is required; ``group`` is optional.
    """

    message: str
    group: NotRequired[str]


class GetAdScriptAncestryIdsParams(TypedDict):
    """
    Parameters for getAdScriptAncestryIds.

    ``frameId`` is required. Declares the same single key as
    ``GetAdScriptAncestryParams``.
    """

    frameId: FrameId


class GetAppIdParams(TypedDict, total=False):
    """
    Parameters for getAppId.

    Declared with ``total=False``: both keys are optional.
    """

    # NOTE(review): these keys are identical to those of ``GetAppIdResult``;
    # confirm that Page.getAppId actually accepts parameters rather than only
    # returning these values.
    appId: str
    recommendedId: str


class GetManifestIconsParams(TypedDict):
    """
    Parameters for getManifestIcons.

    Declares no keys. Note that ``GetManifestIconsCommand`` is parameterised with
    ``EmptyParams`` rather than with this class.
    """

    pass


class RemoveScriptToEvaluateOnLoadParams(TypedDict):
    """
    Parameters for removeScriptToEvaluateOnLoad.

    ``identifier`` is required; ``AddScriptToEvaluateOnLoadResult`` declares a key of
    the same name and type.
    """

    identifier: ScriptIdentifier


class SetFontFamiliesParams(TypedDict):
    """
    Parameters for setFontFamilies.

    ``fontFamilies`` is required; ``forScripts`` is optional.
    """

    fontFamilies: FontFamilies
    forScripts: NotRequired[list[ScriptFontFamilies]]


class SetFontSizesParams(TypedDict):
    """
    Parameters for setFontSizes.

    ``fontSizes`` is required.
    """

    fontSizes: FontSizes


class SetPrerenderingAllowedParams(TypedDict):
    """
    Parameters for setPrerenderingAllowed.

    ``isAllowed`` is required.
    """

    isAllowed: bool


class SetRPHRegistrationModeParams(TypedDict):
    """
    Parameters for setRPHRegistrationMode.

    ``mode`` is required and shares its type with ``SetSPCTransactionModeParams.mode``.
    """

    mode: AutoResponseMode


class SetSPCTransactionModeParams(TypedDict):
    """
    Parameters for setSPCTransactionMode.

    ``mode`` is required and shares its type with ``SetRPHRegistrationModeParams.mode``.
    """

    mode: AutoResponseMode


class SetWebLifecycleStateParams(TypedDict):
    """
    Parameters for setWebLifecycleState.

    ``state`` is required.
    """

    state: WebLifecycleState


class StartScreencastParams(TypedDict, total=False):
    """
    Parameters for startScreencast.

    Declared with ``total=False``: every key is optional.
    """

    format: ScreencastFormat
    quality: int
    maxWidth: int
    maxHeight: int
    everyNthFrame: int


class ProduceCompilationCacheParams(TypedDict):
    """
    Parameters for produceCompilationCache.

    ``scripts`` is required.
    """

    scripts: list[CompilationCacheParams]


class AddScriptToEvaluateOnNewDocumentResult(TypedDict):
    """Result wrapped by ``AddScriptToEvaluateOnNewDocumentResponse``."""

    # Same key name and type as ``RemoveScriptToEvaluateOnNewDocumentParams.identifier``.
    identifier: ScriptIdentifier


class CaptureScreenshotResult(TypedDict):
    """Result wrapped by ``CaptureScreenshotResponse``."""

    # NOTE(review): presumably the base64-encoded image; the encoding is not stated here.
    data: str


class CaptureSnapshotResult(TypedDict):
    """Result wrapped by ``CaptureSnapshotResponse``; ``data`` is required."""

    data: str


class CreateIsolatedWorldResult(TypedDict):
    """Result wrapped by ``CreateIsolatedWorldResponse``."""

    executionContextId: ExecutionContextId


class GetAppManifestResult(TypedDict):
    """
    Result wrapped by ``GetAppManifestResponse``.

    ``url`` and ``errors`` are required; ``data``, ``parsed`` and ``manifest`` are optional.
    """

    url: str
    errors: list[AppManifestError]
    data: NotRequired[str]
    parsed: NotRequired[AppManifestParsedProperties]
    manifest: NotRequired[WebAppManifest]


class GetInstallabilityErrorsResult(TypedDict):
    """Result wrapped by ``GetInstallabilityErrorsResponse``."""

    installabilityErrors: list[InstallabilityError]


class GetAppIdResult(TypedDict, total=False):
    """
    Result for getAppId.

    Declared with ``total=False``: both keys may be absent.
    """

    appId: str
    recommendedId: str


class GetAdScriptAncestryResult(TypedDict, total=False):
    """
    Result wrapped by ``GetAdScriptAncestryResponse``.

    Declared with ``total=False``: ``adScriptAncestry`` may be absent.
    """

    adScriptAncestry: AdScriptAncestry


class GetFrameTreeResult(TypedDict):
    """Result wrapped by ``GetFrameTreeResponse``."""

    frameTree: FrameTree


class GetLayoutMetricsResult(TypedDict):
    """
    Result wrapped by ``GetLayoutMetricsResponse``; every key is required.

    Each metric appears twice, once plain and once with a ``css`` prefix, using the
    same types.
    """

    layoutViewport: LayoutViewport
    visualViewport: VisualViewport
    contentSize: Rect
    # NOTE(review): the ``css*`` variants presumably report CSS pixels; confirm.
    cssLayoutViewport: LayoutViewport
    cssVisualViewport: VisualViewport
    cssContentSize: Rect


class GetNavigationHistoryResult(TypedDict):
    """Result wrapped by ``GetNavigationHistoryResponse``; both keys are required."""

    # NOTE(review): presumably an index into ``entries``; confirm.
    currentIndex: int
    entries: list[NavigationEntry]


class GetPermissionsPolicyStateResult(TypedDict):
    """Result wrapped by ``GetPermissionsPolicyStateResponse``."""

    states: list[PermissionsPolicyFeatureState]


class GetOriginTrialsResult(TypedDict):
    """Result wrapped by ``GetOriginTrialsResponse``."""

    originTrials: list[OriginTrial]


class GetResourceContentResult(TypedDict):
    """Result wrapped by ``GetResourceContentResponse``; both keys are required."""

    content: str
    # Flag accompanying ``content``; by its name it tells whether ``content`` is base64.
    base64Encoded: bool


class GetResourceTreeResult(TypedDict):
    """Result wrapped by ``GetResourceTreeResponse``."""

    # Uses ``FrameResourceTree``, unlike ``GetFrameTreeResult.frameTree`` (``FrameTree``).
    frameTree: FrameResourceTree


class PrintToPDFResult(TypedDict):
    """Result wrapped by ``PrintToPDFResponse``."""

    data: str
    # Optional stream handle.
    # NOTE(review): presumably only returned for a stream ``transferMode``; confirm.
    stream: NotRequired[StreamHandle]


class SearchInResourceResult(TypedDict):
    """Result wrapped by ``SearchInResourceResponse``."""

    result: list[SearchMatch]


class NavigateResult(TypedDict):
    """
    Result for navigate.

    Only ``frameId`` is always present; the remaining keys are optional.
    """

    frameId: FrameId
    loaderId: NotRequired[LoaderId]
    errorText: NotRequired[str]
    isDownload: NotRequired[bool]


class AddScriptToEvaluateOnLoadResult(TypedDict):
    """
    Result for addScriptToEvaluateOnLoad.

    ``identifier`` has the same name and type as
    ``RemoveScriptToEvaluateOnLoadParams.identifier``.
    """

    identifier: ScriptIdentifier


class GetManifestIconsResult(TypedDict):
    """
    Result for getManifestIcons.

    ``primaryIcon`` is optional.
    """

    primaryIcon: NotRequired[str]


class GetAdScriptAncestryIdsResult(TypedDict):
    """
    Result for getAdScriptAncestryIds.

    ``adScriptAncestry`` is optional.
    """

    adScriptAncestry: NotRequired[AdScriptAncestry]


# Response types for Page commands that return data: each alias is ``Response``
# parameterised with the matching ``*Result`` TypedDict defined above. Commands
# without a result use ``Response[EmptyResponse]`` directly in their alias.
AddScriptToEvaluateOnLoadResponse = Response[AddScriptToEvaluateOnLoadResult]
AddScriptToEvaluateOnNewDocumentResponse = Response[AddScriptToEvaluateOnNewDocumentResult]
CaptureScreenshotResponse = Response[CaptureScreenshotResult]
CaptureSnapshotResponse = Response[CaptureSnapshotResult]
CreateIsolatedWorldResponse = Response[CreateIsolatedWorldResult]
GetAdScriptAncestryIdsResponse = Response[GetAdScriptAncestryIdsResult]
GetAdScriptAncestryResponse = Response[GetAdScriptAncestryResult]
GetAppIdResponse = Response[GetAppIdResult]
GetAppManifestResponse = Response[GetAppManifestResult]
GetFrameTreeResponse = Response[GetFrameTreeResult]
GetInstallabilityErrorsResponse = Response[GetInstallabilityErrorsResult]
GetLayoutMetricsResponse = Response[GetLayoutMetricsResult]
GetManifestIconsResponse = Response[GetManifestIconsResult]
GetNavigationHistoryResponse = Response[GetNavigationHistoryResult]
GetOriginTrialsResponse = Response[GetOriginTrialsResult]
GetPermissionsPolicyStateResponse = Response[GetPermissionsPolicyStateResult]
GetResourceContentResponse = Response[GetResourceContentResult]
GetResourceTreeResponse = Response[GetResourceTreeResult]
NavigateResponse = Response[NavigateResult]
PrintToPDFResponse = Response[PrintToPDFResult]
SearchInResourceResponse = Response[SearchInResourceResult]


# Command types for the Page domain: ``Command[<params>, <response>]``.
# Commands that take no arguments use ``EmptyParams``; commands that return
# nothing use ``Response[EmptyResponse]``.
AddCompilationCacheCommand = Command[AddCompilationCacheParams, Response[EmptyResponse]]
AddScriptToEvaluateOnLoadCommand = Command[
    AddScriptToEvaluateOnLoadParams, AddScriptToEvaluateOnLoadResponse
]
AddScriptToEvaluateOnNewDocumentCommand = Command[
    AddScriptToEvaluateOnNewDocumentParams, AddScriptToEvaluateOnNewDocumentResponse
]
BringToFrontCommand = Command[EmptyParams, Response[EmptyResponse]]
CaptureScreenshotCommand = Command[CaptureScreenshotParams, CaptureScreenshotResponse]
CaptureSnapshotCommand = Command[CaptureSnapshotParams, CaptureSnapshotResponse]
ClearCompilationCacheCommand = Command[EmptyParams, Response[EmptyResponse]]
CloseCommand = Command[EmptyParams, Response[EmptyResponse]]
CrashCommand = Command[EmptyParams, Response[EmptyResponse]]
CreateIsolatedWorldCommand = Command[CreateIsolatedWorldParams, CreateIsolatedWorldResponse]
DisableCommand = Command[EmptyParams, Response[EmptyResponse]]
EnableCommand = Command[EnableParams, Response[EmptyResponse]]
GenerateTestReportCommand = Command[GenerateTestReportParams, Response[EmptyResponse]]
GetAdScriptAncestryCommand = Command[GetAdScriptAncestryParams, GetAdScriptAncestryResponse]
GetAdScriptAncestryIdsCommand = Command[
    GetAdScriptAncestryIdsParams, GetAdScriptAncestryIdsResponse
]
GetAppIdCommand = Command[GetAppIdParams, GetAppIdResponse]
GetAppManifestCommand = Command[GetAppManifestParams, GetAppManifestResponse]
GetFrameTreeCommand = Command[EmptyParams, GetFrameTreeResponse]
GetInstallabilityErrorsCommand = Command[EmptyParams, GetInstallabilityErrorsResponse]
GetLayoutMetricsCommand = Command[EmptyParams, GetLayoutMetricsResponse]
# Uses ``EmptyParams`` even though a (key-less) ``GetManifestIconsParams`` is declared above.
GetManifestIconsCommand = Command[EmptyParams, GetManifestIconsResponse]
GetNavigationHistoryCommand = Command[EmptyParams, GetNavigationHistoryResponse]
GetOriginTrialsCommand = Command[GetOriginTrialsParams, GetOriginTrialsResponse]
GetPermissionsPolicyStateCommand = Command[
    GetPermissionsPolicyStateParams, GetPermissionsPolicyStateResponse
]
GetResourceContentCommand = Command[GetResourceContentParams, GetResourceContentResponse]
GetResourceTreeCommand = Command[EmptyParams, GetResourceTreeResponse]
HandleJavaScriptDialogCommand = Command[HandleJavaScriptDialogParams, Response[EmptyResponse]]
NavigateCommand = Command[NavigateParams, NavigateResponse]
NavigateToHistoryEntryCommand = Command[NavigateToHistoryEntryParams, Response[EmptyResponse]]
PrintToPDFCommand = Command[PrintToPDFParams, PrintToPDFResponse]
ProduceCompilationCacheCommand = Command[ProduceCompilationCacheParams, Response[EmptyResponse]]
ReloadCommand = Command[ReloadParams, Response[EmptyResponse]]
RemoveScriptToEvaluateOnLoadCommand = Command[
    RemoveScriptToEvaluateOnLoadParams, Response[EmptyResponse]
]
RemoveScriptToEvaluateOnNewDocumentCommand = Command[
    RemoveScriptToEvaluateOnNewDocumentParams, Response[EmptyResponse]
]
ResetNavigationHistoryCommand = Command[EmptyParams, Response[EmptyResponse]]
ScreencastFrameAckCommand = Command[ScreencastFrameAckParams, Response[EmptyResponse]]
SearchInResourceCommand = Command[SearchInResourceParams, SearchInResourceResponse]
SetAdBlockingEnabledCommand = Command[SetAdBlockingEnabledParams, Response[EmptyResponse]]
SetBypassCSPCommand = Command[SetBypassCSPParams, Response[EmptyResponse]]
SetDocumentContentCommand = Command[SetDocumentContentParams, Response[EmptyResponse]]
SetFontFamiliesCommand = Command[SetFontFamiliesParams, Response[EmptyResponse]]
SetFontSizesCommand = Command[SetFontSizesParams, Response[EmptyResponse]]
SetInterceptFileChooserDialogCommand = Command[
    SetInterceptFileChooserDialogParams, Response[EmptyResponse]
]
SetLifecycleEventsEnabledCommand = Command[SetLifecycleEventsEnabledParams, Response[EmptyResponse]]
SetPrerenderingAllowedCommand = Command[SetPrerenderingAllowedParams, Response[EmptyResponse]]
SetRPHRegistrationModeCommand = Command[SetRPHRegistrationModeParams, Response[EmptyResponse]]
SetSPCTransactionModeCommand = Command[SetSPCTransactionModeParams, Response[EmptyResponse]]
SetWebLifecycleStateCommand = Command[SetWebLifecycleStateParams, Response[EmptyResponse]]
StartScreencastCommand = Command[StartScreencastParams, Response[EmptyResponse]]
StopLoadingCommand = Command[EmptyParams, Response[EmptyResponse]]
StopScreencastCommand = Command[EmptyParams, Response[EmptyResponse]]
WaitForDebuggerCommand = Command[EmptyParams, Response[EmptyResponse]]


================================================
FILE: pydoll/protocol/page/types.py
================================================
from enum import Enum

from typing_extensions import NotRequired, TypedDict

from pydoll.protocol.network.types import LoaderId, ResourceType, TimeSinceEpoch
from pydoll.protocol.runtime.types import ScriptId, UniqueDebuggerId

# Plain aliases of ``str``: they make annotations self-describing but add no runtime distinction.
FrameId = str
ScriptIdentifier = str


class AdFrameType(str, Enum):
    """Ad frame types.

    Used as the ``adFrameType`` field of ``AdFrameStatus``. Members subclass ``str``,
    so each one compares equal to its raw string value.
    """

    NONE = 'none'
    CHILD = 'child'
    ROOT = 'root'


class AdFrameExplanation(str, Enum):
    """Ad frame explanation types.

    Listed in the optional ``explanations`` field of ``AdFrameStatus``.
    """

    PARENT_IS_AD = 'ParentIsAd'
    CREATED_BY_AD_SCRIPT = 'CreatedByAdScript'
    MATCHED_BLOCKING_RULE = 'MatchedBlockingRule'


class SecureContextType(str, Enum):
    """Secure context types.

    Used as the ``secureContextType`` field of ``Frame``.
    """

    SECURE = 'Secure'
    SECURE_LOCALHOST = 'SecureLocalhost'
    INSECURE_SCHEME = 'InsecureScheme'
    INSECURE_ANCESTOR = 'InsecureAncestor'


class CrossOriginIsolatedContextType(str, Enum):
    """Cross-origin isolated context types.

    Used as the ``crossOriginIsolatedContextType`` field of ``Frame``.
    """

    ISOLATED = 'Isolated'
    NOT_ISOLATED = 'NotIsolated'
    NOT_ISOLATED_FEATURE_DISABLED = 'NotIsolatedFeatureDisabled'


class GatedAPIFeatures(str, Enum):
    """Gated API features.

    ``Frame.gatedAPIFeatures`` holds a list of these members.
    """

    SHARED_ARRAY_BUFFERS = 'SharedArrayBuffers'
    SHARED_ARRAY_BUFFERS_TRANSFER_ALLOWED = 'SharedArrayBuffersTransferAllowed'
    PERFORMANCE_MEASURE_MEMORY = 'PerformanceMeasureMemory'
    PERFORMANCE_PROFILE = 'PerformanceProfile'


class PermissionsPolicyFeature(str, Enum):
    """Permissions policy features.

    Used as the ``feature`` field of ``PermissionsPolicyFeatureState``. Member names are
    the UPPER_SNAKE_CASE form of the hyphenated wire values; members subclass ``str``, so
    each one compares equal to its raw string value.
    """

    ACCELEROMETER = 'accelerometer'
    ALL_SCREENS_CAPTURE = 'all-screens-capture'
    AMBIENT_LIGHT_SENSOR = 'ambient-light-sensor'
    ARIA_NOTIFY = 'aria-notify'
    ATTRIBUTION_REPORTING = 'attribution-reporting'
    AUTOPLAY = 'autoplay'
    BLUETOOTH = 'bluetooth'
    BROWSING_TOPICS = 'browsing-topics'
    CAMERA = 'camera'
    CAPTURED_SURFACE_CONTROL = 'captured-surface-control'
    # 'ch-*' prefixed features (presumably client hints — confirm against the protocol docs).
    CH_DPR = 'ch-dpr'
    CH_DEVICE_MEMORY = 'ch-device-memory'
    CH_DOWNLINK = 'ch-downlink'
    CH_ECT = 'ch-ect'
    CH_PREFERS_COLOR_SCHEME = 'ch-prefers-color-scheme'
    CH_PREFERS_REDUCED_MOTION = 'ch-prefers-reduced-motion'
    CH_PREFERS_REDUCED_TRANSPARENCY = 'ch-prefers-reduced-transparency'
    CH_RTT = 'ch-rtt'
    CH_SAVE_DATA = 'ch-save-data'
    CH_UA = 'ch-ua'
    CH_UA_ARCH = 'ch-ua-arch'
    CH_UA_BITNESS = 'ch-ua-bitness'
    CH_UA_HIGH_ENTROPY_VALUES = 'ch-ua-high-entropy-values'
    CH_UA_PLATFORM = 'ch-ua-platform'
    CH_UA_MODEL = 'ch-ua-model'
    CH_UA_MOBILE = 'ch-ua-mobile'
    CH_UA_FORM_FACTORS = 'ch-ua-form-factors'
    CH_UA_FULL_VERSION = 'ch-ua-full-version'
    CH_UA_FULL_VERSION_LIST = 'ch-ua-full-version-list'
    CH_UA_PLATFORM_VERSION = 'ch-ua-platform-version'
    CH_UA_WOW64 = 'ch-ua-wow64'
    CH_VIEWPORT_HEIGHT = 'ch-viewport-height'
    CH_VIEWPORT_WIDTH = 'ch-viewport-width'
    CH_WIDTH = 'ch-width'
    CLIPBOARD_READ = 'clipboard-read'
    CLIPBOARD_WRITE = 'clipboard-write'
    COMPUTE_PRESSURE = 'compute-pressure'
    CONTROLLED_FRAME = 'controlled-frame'
    CROSS_ORIGIN_ISOLATED = 'cross-origin-isolated'
    DEFERRED_FETCH = 'deferred-fetch'
    DEFERRED_FETCH_MINIMAL = 'deferred-fetch-minimal'
    DEVICE_ATTRIBUTES = 'device-attributes'
    DIGITAL_CREDENTIALS_GET = 'digital-credentials-get'
    DIRECT_SOCKETS = 'direct-sockets'
    DIRECT_SOCKETS_PRIVATE = 'direct-sockets-private'
    DISPLAY_CAPTURE = 'display-capture'
    DOCUMENT_DOMAIN = 'document-domain'
    ENCRYPTED_MEDIA = 'encrypted-media'
    EXECUTION_WHILE_OUT_OF_VIEWPORT = 'execution-while-out-of-viewport'
    EXECUTION_WHILE_NOT_RENDERED = 'execution-while-not-rendered'
    FENCED_UNPARTITIONED_STORAGE_READ = 'fenced-unpartitioned-storage-read'
    FOCUS_WITHOUT_USER_ACTIVATION = 'focus-without-user-activation'
    FULLSCREEN = 'fullscreen'
    FROBULATE = 'frobulate'
    GAMEPAD = 'gamepad'
    GEOLOCATION = 'geolocation'
    GYROSCOPE = 'gyroscope'
    HID = 'hid'
    IDENTITY_CREDENTIALS_GET = 'identity-credentials-get'
    IDLE_DETECTION = 'idle-detection'
    INTEREST_COHORT = 'interest-cohort'
    JOIN_AD_INTEREST_GROUP = 'join-ad-interest-group'
    KEYBOARD_MAP = 'keyboard-map'
    LANGUAGE_DETECTOR = 'language-detector'
    LANGUAGE_MODEL = 'language-model'
    LOCAL_FONTS = 'local-fonts'
    LOCAL_NETWORK_ACCESS = 'local-network-access'
    MAGNETOMETER = 'magnetometer'
    MEDIA_PLAYBACK_WHILE_NOT_VISIBLE = 'media-playback-while-not-visible'
    MICROPHONE = 'microphone'
    MIDI = 'midi'
    ON_DEVICE_SPEECH_RECOGNITION = 'on-device-speech-recognition'
    OTP_CREDENTIALS = 'otp-credentials'
    PAYMENT = 'payment'
    PICTURE_IN_PICTURE = 'picture-in-picture'
    POPINS = 'popins'
    PRIVATE_AGGREGATION = 'private-aggregation'
    PRIVATE_STATE_TOKEN_ISSUANCE = 'private-state-token-issuance'
    PRIVATE_STATE_TOKEN_REDEMPTION = 'private-state-token-redemption'
    PUBLICKEY_CREDENTIALS_CREATE = 'publickey-credentials-create'
    PUBLICKEY_CREDENTIALS_GET = 'publickey-credentials-get'
    RECORD_AD_AUCTION_EVENTS = 'record-ad-auction-events'
    REWRITER = 'rewriter'
    RUN_AD_AUCTION = 'run-ad-auction'
    SCREEN_WAKE_LOCK = 'screen-wake-lock'
    SERIAL = 'serial'
    SHARED_AUTOFILL = 'shared-autofill'
    SHARED_STORAGE = 'shared-storage'
    SHARED_STORAGE_SELECT_URL = 'shared-storage-select-url'
    SMART_CARD = 'smart-card'
    SPEAKER_SELECTION = 'speaker-selection'
    STORAGE_ACCESS = 'storage-access'
    SUB_APPS = 'sub-apps'
    SUMMARIZER = 'summarizer'
    SYNC_XHR = 'sync-xhr'
    TRANSLATOR = 'translator'
    UNLOAD = 'unload'
    USB = 'usb'
    USB_UNRESTRICTED = 'usb-unrestricted'
    VERTICAL_SCROLL = 'vertical-scroll'
    WEB_APP_INSTALLATION = 'web-app-installation'
    WEB_PRINTING = 'web-printing'
    WEB_SHARE = 'web-share'
    WINDOW_MANAGEMENT = 'window-management'
    WRITER = 'writer'
    XR_SPATIAL_TRACKING = 'xr-spatial-tracking'


class PermissionsPolicyBlockReason(str, Enum):
    """Permissions policy block reasons.

    Used as the ``blockReason`` field of ``PermissionsPolicyBlockLocator``.
    """

    HEADER = 'Header'
    IFRAME_ATTRIBUTE = 'IframeAttribute'
    IN_FENCED_FRAME_TREE = 'InFencedFrameTree'
    IN_ISOLATED_APP = 'InIsolatedApp'


class BackForwardCacheNotRestoredReasonType(str, Enum):
    """Back/forward cache not restored explanation type.

    Used as the ``type`` field of ``BackForwardCacheNotRestoredExplanation``.
    """

    SUPPORT_PENDING = 'SupportPending'
    PAGE_SUPPORT_NEEDED = 'PageSupportNeeded'
    CIRCUMSTANTIAL = 'Circumstantial'


class BackForwardCacheNotRestoredReason(str, Enum):
    """Back/forward cache not restored reasons.

    Used as the ``reason`` field of ``BackForwardCacheNotRestoredExplanation``. Member
    names are the UPPER_SNAKE_CASE form of the wire values. Values written inside
    parentheses are ordinary string literals, wrapped only to keep lines short.
    """

    NOT_PRIMARY_MAIN_FRAME = 'NotPrimaryMainFrame'
    BACK_FORWARD_CACHE_DISABLED = 'BackForwardCacheDisabled'
    RELATED_ACTIVE_CONTENTS_EXIST = 'RelatedActiveContentsExist'
    HTTP_STATUS_NOT_OK = 'HTTPStatusNotOK'
    SCHEME_NOT_HTTP_OR_HTTPS = 'SchemeNotHTTPOrHTTPS'
    LOADING = 'Loading'
    WAS_GRANTED_MEDIA_ACCESS = 'WasGrantedMediaAccess'
    DISABLE_FOR_RENDER_FRAME_HOST_CALLED = 'DisableForRenderFrameHostCalled'
    DOMAIN_NOT_ALLOWED = 'DomainNotAllowed'
    HTTP_METHOD_NOT_GET = 'HTTPMethodNotGET'
    SUBFRAME_IS_NAVIGATING = 'SubframeIsNavigating'
    TIMEOUT = 'Timeout'
    CACHE_LIMIT = 'CacheLimit'
    JAVASCRIPT_EXECUTION = 'JavaScriptExecution'
    RENDERER_PROCESS_KILLED = 'RendererProcessKilled'
    RENDERER_PROCESS_CRASHED = 'RendererProcessCrashed'
    SCHEDULER_TRACKED_FEATURE_USED = 'SchedulerTrackedFeatureUsed'
    CONFLICTING_BROWSING_INSTANCE = 'ConflictingBrowsingInstance'
    CACHE_FLUSHED = 'CacheFlushed'
    SERVICE_WORKER_VERSION_ACTIVATION = 'ServiceWorkerVersionActivation'
    SESSION_RESTORED = 'SessionRestored'
    SERVICE_WORKER_POST_MESSAGE = 'ServiceWorkerPostMessage'
    ENTERED_BACK_FORWARD_CACHE_BEFORE_SERVICE_WORKER_HOST_ADDED = (
        'EnteredBackForwardCacheBeforeServiceWorkerHostAdded'
    )
    # These two wire values contain an underscore, unlike the rest of the enum.
    RENDER_FRAME_HOST_REUSED_SAME_SITE = 'RenderFrameHostReused_SameSite'
    RENDER_FRAME_HOST_REUSED_CROSS_SITE = 'RenderFrameHostReused_CrossSite'
    SERVICE_WORKER_CLAIM = 'ServiceWorkerClaim'
    IGNORE_EVENT_AND_EVICT = 'IgnoreEventAndEvict'
    HAVE_INNER_CONTENTS = 'HaveInnerContents'
    TIMEOUT_PUTTING_IN_CACHE = 'TimeoutPuttingInCache'
    BACK_FORWARD_CACHE_DISABLED_BY_LOW_MEMORY = 'BackForwardCacheDisabledByLowMemory'
    BACK_FORWARD_CACHE_DISABLED_BY_COMMAND_LINE = 'BackForwardCacheDisabledByCommandLine'
    NETWORK_REQUEST_DATAPIPE_DRAINED_AS_BYTES_CONSUMER = (
        'NetworkRequestDatapipeDrainedAsBytesConsumer'
    )
    NETWORK_REQUEST_REDIRECTED = 'NetworkRequestRedirected'
    NETWORK_REQUEST_TIMEOUT = 'NetworkRequestTimeout'
    NETWORK_EXCEEDS_BUFFER_LIMIT = 'NetworkExceedsBufferLimit'
    NAVIGATION_CANCELLED_WHILE_RESTORING = 'NavigationCancelledWhileRestoring'
    NOT_MOST_RECENT_NAVIGATION_ENTRY = 'NotMostRecentNavigationEntry'
    BACK_FORWARD_CACHE_DISABLED_FOR_PRERENDER = 'BackForwardCacheDisabledForPrerender'
    USER_AGENT_OVERRIDE_DIFFERS = 'UserAgentOverrideDiffers'
    FOREGROUND_CACHE_LIMIT = 'ForegroundCacheLimit'
    BROWSING_INSTANCE_NOT_SWAPPED = 'BrowsingInstanceNotSwapped'
    BACK_FORWARD_CACHE_DISABLED_FOR_DELEGATE = 'BackForwardCacheDisabledForDelegate'
    UNLOAD_HANDLER_EXISTS_IN_MAIN_FRAME = 'UnloadHandlerExistsInMainFrame'
    UNLOAD_HANDLER_EXISTS_IN_SUB_FRAME = 'UnloadHandlerExistsInSubFrame'
    SERVICE_WORKER_UNREGISTRATION = 'ServiceWorkerUnregistration'
    CACHE_CONTROL_NO_STORE = 'CacheControlNoStore'
    CACHE_CONTROL_NO_STORE_COOKIE_MODIFIED = 'CacheControlNoStoreCookieModified'
    CACHE_CONTROL_NO_STORE_HTTP_ONLY_COOKIE_MODIFIED = 'CacheControlNoStoreHTTPOnlyCookieModified'
    NO_RESPONSE_HEAD = 'NoResponseHead'
    UNKNOWN = 'Unknown'
    ACTIVATION_NAVIGATIONS_DISALLOWED_FOR_BUG_1234857 = (
        'ActivationNavigationsDisallowedForBug1234857'
    )
    ERROR_DOCUMENT = 'ErrorDocument'
    FENCED_FRAMES_EMBEDDER = 'FencedFramesEmbedder'
    COOKIE_DISABLED = 'CookieDisabled'
    HTTP_AUTH_REQUIRED = 'HTTPAuthRequired'
    COOKIE_FLUSHED = 'CookieFlushed'
    BROADCAST_CHANNEL_ON_MESSAGE = 'BroadcastChannelOnMessage'
    WEB_VIEW_SETTINGS_CHANGED = 'WebViewSettingsChanged'
    WEB_VIEW_JAVASCRIPT_OBJECT_CHANGED = 'WebViewJavaScriptObjectChanged'
    WEB_VIEW_MESSAGE_LISTENER_INJECTED = 'WebViewMessageListenerInjected'
    WEB_VIEW_SAFE_BROWSING_ALLOWLIST_CHANGED = 'WebViewSafeBrowsingAllowlistChanged'
    WEB_VIEW_DOCUMENT_START_JAVASCRIPT_CHANGED = 'WebViewDocumentStartJavascriptChanged'
    WEB_SOCKET = 'WebSocket'
    WEB_TRANSPORT = 'WebTransport'
    WEB_RTC = 'WebRTC'
    MAIN_RESOURCE_HAS_CACHE_CONTROL_NO_STORE = 'MainResourceHasCacheControlNoStore'
    MAIN_RESOURCE_HAS_CACHE_CONTROL_NO_CACHE = 'MainResourceHasCacheControlNoCache'
    SUBRESOURCE_HAS_CACHE_CONTROL_NO_STORE = 'SubresourceHasCacheControlNoStore'
    SUBRESOURCE_HAS_CACHE_CONTROL_NO_CACHE = 'SubresourceHasCacheControlNoCache'
    CONTAINS_PLUGINS = 'ContainsPlugins'
    DOCUMENT_LOADED = 'DocumentLoaded'
    OUTSTANDING_NETWORK_REQUEST_OTHERS = 'OutstandingNetworkRequestOthers'
    REQUESTED_MIDI_PERMISSION = 'RequestedMIDIPermission'
    REQUESTED_AUDIO_CAPTURE_PERMISSION = 'RequestedAudioCapturePermission'
    REQUESTED_VIDEO_CAPTURE_PERMISSION = 'RequestedVideoCapturePermission'
    REQUESTED_BACK_FORWARD_CACHE_BLOCKED_SENSORS = 'RequestedBackForwardCacheBlockedSensors'
    REQUESTED_BACKGROUND_WORK_PERMISSION = 'RequestedBackgroundWorkPermission'
    BROADCAST_CHANNEL = 'BroadcastChannel'
    WEB_XR = 'WebXR'
    SHARED_WORKER = 'SharedWorker'
    SHARED_WORKER_MESSAGE = 'SharedWorkerMessage'
    WEB_LOCKS = 'WebLocks'
    WEB_HID = 'WebHID'
    WEB_SHARE = 'WebShare'
    REQUESTED_STORAGE_ACCESS_GRANT = 'RequestedStorageAccessGrant'
    WEB_NFC = 'WebNfc'
    OUTSTANDING_NETWORK_REQUEST_FETCH = 'OutstandingNetworkRequestFetch'
    OUTSTANDING_NETWORK_REQUEST_XHR = 'OutstandingNetworkRequestXHR'
    APP_BANNER = 'AppBanner'
    PRINTING = 'Printing'
    WEB_DATABASE = 'WebDatabase'
    PICTURE_IN_PICTURE = 'PictureInPicture'
    SPEECH_RECOGNIZER = 'SpeechRecognizer'
    IDLE_MANAGER = 'IdleManager'
    PAYMENT_MANAGER = 'PaymentManager'
    SPEECH_SYNTHESIS = 'SpeechSynthesis'
    KEYBOARD_LOCK = 'KeyboardLock'
    WEB_OTP_SERVICE = 'WebOTPService'
    OUTSTANDING_NETWORK_REQUEST_DIRECT_SOCKET = 'OutstandingNetworkRequestDirectSocket'
    INJECTED_JAVASCRIPT = 'InjectedJavascript'
    INJECTED_STYLE_SHEET = 'InjectedStyleSheet'
    KEEPALIVE_REQUEST = 'KeepaliveRequest'
    INDEXED_DB_EVENT = 'IndexedDBEvent'
    DUMMY = 'Dummy'
    JS_NETWORK_REQUEST_RECEIVED_CACHE_CONTROL_NO_STORE_RESOURCE = (
        'JsNetworkRequestReceivedCacheControlNoStoreResource'
    )
    WEB_RTC_STICKY = 'WebRTCSticky'
    WEB_TRANSPORT_STICKY = 'WebTransportSticky'
    WEB_SOCKET_STICKY = 'WebSocketSticky'
    SMART_CARD = 'SmartCard'
    LIVE_MEDIA_STREAM_TRACK = 'LiveMediaStreamTrack'
    UNLOAD_HANDLER = 'UnloadHandler'
    PARSER_ABORTED = 'ParserAborted'
    # 'Content*' prefixed reasons.
    CONTENT_SECURITY_HANDLER = 'ContentSecurityHandler'
    CONTENT_WEB_AUTHENTICATION_API = 'ContentWebAuthenticationAPI'
    CONTENT_FILE_CHOOSER = 'ContentFileChooser'
    CONTENT_SERIAL = 'ContentSerial'
    CONTENT_FILE_SYSTEM_ACCESS = 'ContentFileSystemAccess'
    CONTENT_MEDIA_DEVICES_DISPATCHER_HOST = 'ContentMediaDevicesDispatcherHost'
    CONTENT_WEB_BLUETOOTH = 'ContentWebBluetooth'
    CONTENT_WEB_USB = 'ContentWebUSB'
    CONTENT_MEDIA_SESSION_SERVICE = 'ContentMediaSessionService'
    CONTENT_SCREEN_READER = 'ContentScreenReader'
    CONTENT_DISCARDED = 'ContentDiscarded'
    # 'Embedder*' prefixed reasons.
    EMBEDDER_POPUP_BLOCKER_TAB_HELPER = 'EmbedderPopupBlockerTabHelper'
    EMBEDDER_SAFE_BROWSING_TRIGGERED_POPUP_BLOCKER = 'EmbedderSafeBrowsingTriggeredPopupBlocker'
    EMBEDDER_SAFE_BROWSING_THREAT_DETAILS = 'EmbedderSafeBrowsingThreatDetails'
    EMBEDDER_APP_BANNER_MANAGER = 'EmbedderAppBannerManager'
    EMBEDDER_DOM_DISTILLER_VIEWER_SOURCE = 'EmbedderDomDistillerViewerSource'
    EMBEDDER_DOM_DISTILLER_SELF_DELETING_REQUEST_DELEGATE = (
        'EmbedderDomDistillerSelfDeletingRequestDelegate'
    )
    EMBEDDER_OOM_INTERVENTION_TAB_HELPER = 'EmbedderOomInterventionTabHelper'
    EMBEDDER_OFFLINE_PAGE = 'EmbedderOfflinePage'
    EMBEDDER_CHROME_PASSWORD_MANAGER_CLIENT_BIND_CREDENTIAL_MANAGER = (
        'EmbedderChromePasswordManagerClientBindCredentialManager'
    )
    EMBEDDER_PERMISSION_REQUEST_MANAGER = 'EmbedderPermissionRequestManager'
    EMBEDDER_MODAL_DIALOG = 'EmbedderModalDialog'
    EMBEDDER_EXTENSIONS = 'EmbedderExtensions'
    EMBEDDER_EXTENSION_MESSAGING = 'EmbedderExtensionMessaging'
    EMBEDDER_EXTENSION_MESSAGING_FOR_OPEN_PORT = 'EmbedderExtensionMessagingForOpenPort'
    EMBEDDER_EXTENSION_SENT_MESSAGE_TO_CACHED_FRAME = 'EmbedderExtensionSentMessageToCachedFrame'
    REQUESTED_BY_WEB_VIEW_CLIENT = 'RequestedByWebViewClient'
    POST_MESSAGE_BY_WEB_VIEW_CLIENT = 'PostMessageByWebViewClient'
    CACHE_CONTROL_NO_STORE_DEVICE_BOUND_SESSION_TERMINATED = (
        'CacheControlNoStoreDeviceBoundSessionTerminated'
    )
    CACHE_LIMIT_PRUNED_ON_MODERATE_MEMORY_PRESSURE = 'CacheLimitPrunedOnModerateMemoryPressure'
    CACHE_LIMIT_PRUNED_ON_CRITICAL_MEMORY_PRESSURE = 'CacheLimitPrunedOnCriticalMemoryPressure'


class BackForwardCacheBlockingDetails(TypedDict):
    """Source location attached to a back/forward cache explanation.

    Appears in the optional ``details`` list of ``BackForwardCacheNotRestoredExplanation``.
    ``url`` and ``function`` may be absent; the line and column numbers are always present.
    """

    url: NotRequired[str]
    function: NotRequired[str]
    lineNumber: int
    columnNumber: int


class BackForwardCacheNotRestoredExplanation(TypedDict):
    """Back/forward cache not restored explanation.

    ``type`` and ``reason`` are always present; ``context`` and ``details`` are optional.
    """

    type: BackForwardCacheNotRestoredReasonType
    reason: BackForwardCacheNotRestoredReason
    context: NotRequired[str]
    details: NotRequired[list[BackForwardCacheBlockingDetails]]


class BackForwardCacheNotRestoredExplanationTree(TypedDict):
    """Recursive tree of back/forward cache not-restored explanations.

    Each node carries a ``url``, the ``explanations`` for that node, and optionally
    ``children`` nodes of the same type.
    """

    url: str
    explanations: list[BackForwardCacheNotRestoredExplanation]
    # Forward reference (string) because the class refers to itself.
    children: NotRequired[list['BackForwardCacheNotRestoredExplanationTree']]


class OriginTrialTokenStatus(str, Enum):
    """Origin trial token status.

    Used as the ``status`` field of ``OriginTrialTokenWithStatus``.
    """

    SUCCESS = 'Success'
    NOT_SUPPORTED = 'NotSupported'
    INSECURE = 'Insecure'
    EXPIRED = 'Expired'
    WRONG_ORIGIN = 'WrongOrigin'
    INVALID_SIGNATURE = 'InvalidSignature'
    MALFORMED = 'Malformed'
    WRONG_VERSION = 'WrongVersion'
    FEATURE_DISABLED = 'FeatureDisabled'
    TOKEN_DISABLED = 'TokenDisabled'
    FEATURE_DISABLED_FOR_USER = 'FeatureDisabledForUser'
    UNKNOWN_TRIAL = 'UnknownTrial'


class OriginTrialStatus(str, Enum):
    """Origin trial status.

    Used as the ``status`` field of ``OriginTrial``.
    """

    ENABLED = 'Enabled'
    VALID_TOKEN_NOT_PROVIDED = 'ValidTokenNotProvided'
    OS_NOT_SUPPORTED = 'OSNotSupported'
    TRIAL_NOT_ALLOWED = 'TrialNotAllowed'


class OriginTrialUsageRestriction(str, Enum):
    """Origin trial usage restriction.

    Used as the ``usageRestriction`` field of ``OriginTrialToken``.
    """

    # The wire value is the string 'None', not Python's ``None``.
    NONE = 'None'
    SUBSET = 'Subset'


class TransitionType(str, Enum):
    """Transition types.

    Used as the ``transitionType`` field of ``NavigationEntry``. Unlike most enums in
    this module, the wire values are snake_case.
    """

    LINK = 'link'
    TYPED = 'typed'
    ADDRESS_BAR = 'address_bar'
    AUTO_BOOKMARK = 'auto_bookmark'
    AUTO_SUBFRAME = 'auto_subframe'
    MANUAL_SUBFRAME = 'manual_subframe'
    GENERATED = 'generated'
    AUTO_TOPLEVEL = 'auto_toplevel'
    FORM_SUBMIT = 'form_submit'
    RELOAD = 'reload'
    KEYWORD = 'keyword'
    KEYWORD_GENERATED = 'keyword_generated'
    OTHER = 'other'


class DialogType(str, Enum):
    """Dialog types.

    Members subclass ``str``, so each one compares equal to its raw string value.
    """

    ALERT = 'alert'
    CONFIRM = 'confirm'
    PROMPT = 'prompt'
    BEFOREUNLOAD = 'beforeunload'


class ClientNavigationReason(str, Enum):
    """Client navigation reasons.

    Mixes in ``str`` like every other enum in this module, so members compare equal
    to their raw string values and can be passed straight to ``json.dumps``.
    """

    ANCHOR_CLICK = 'anchorClick'
    FORM_SUBMISSION_GET = 'formSubmissionGet'
    FORM_SUBMISSION_POST = 'formSubmissionPost'
    HTTP_HEADER_REFRESH = 'httpHeaderRefresh'
    INITIAL_FRAME_NAVIGATION = 'initialFrameNavigation'
    META_TAG_REFRESH = 'metaTagRefresh'
    OTHER = 'other'
    PAGE_BLOCK_INTERSTITIAL = 'pageBlockInterstitial'
    RELOAD = 'reload'
    SCRIPT_INITIATED = 'scriptInitiated'


class ClientNavigationDisposition(str, Enum):
    """Client navigation dispositions.

    Members subclass ``str``, so each one compares equal to its raw string value.
    """

    CURRENT_TAB = 'currentTab'
    NEW_TAB = 'newTab'
    NEW_WINDOW = 'newWindow'
    DOWNLOAD = 'download'


class ReferrerPolicy(str, Enum):
    """Referrer policy types.

    The wire values are camelCase (e.g. ``'noReferrer'``), not hyphenated.
    """

    NO_REFERRER = 'noReferrer'
    NO_REFERRER_WHEN_DOWNGRADE = 'noReferrerWhenDowngrade'
    ORIGIN = 'origin'
    ORIGIN_WHEN_CROSS_ORIGIN = 'originWhenCrossOrigin'
    SAME_ORIGIN = 'sameOrigin'
    STRICT_ORIGIN = 'strictOrigin'
    STRICT_ORIGIN_WHEN_CROSS_ORIGIN = 'strictOriginWhenCrossOrigin'
    UNSAFE_URL = 'unsafeUrl'


class NavigationType(str, Enum):
    """Navigation types.

    Members subclass ``str``, so each one compares equal to its raw string value.
    """

    NAVIGATION = 'Navigation'
    BACK_FORWARD_CACHE_RESTORE = 'BackForwardCacheRestore'


class AdFrameStatus(TypedDict):
    """Ad frame status.

    ``adFrameType`` is always present; ``explanations`` may be absent.
    """

    adFrameType: AdFrameType
    explanations: NotRequired[list[AdFrameExplanation]]


class AdScriptId(TypedDict):
    """Ad script identifier.

    Combines a script id with a debugger id; both types come from the runtime types module.
    """

    scriptId: ScriptId
    debuggerId: UniqueDebuggerId


class AdScriptAncestry(TypedDict):
    """Ad script ancestry.

    ``ancestryChain`` is a list of ``AdScriptId`` entries; ``rootScriptFilterlistRule``
    may be absent.
    """

    ancestryChain: list[AdScriptId]
    rootScriptFilterlistRule: NotRequired[str]


class PermissionsPolicyBlockLocator(TypedDict):
    """Permissions policy block locator.

    Pairs a frame id with the reason for the block. Used as the optional ``locator``
    field of ``PermissionsPolicyFeatureState``.
    """

    frameId: FrameId
    blockReason: PermissionsPolicyBlockReason


class PermissionsPolicyFeatureState(TypedDict):
    """Permissions policy feature state.

    ``feature`` and ``allowed`` are always present; ``locator`` may be absent.
    """

    feature: PermissionsPolicyFeature
    allowed: bool
    locator: NotRequired[PermissionsPolicyBlockLocator]


class OriginTrialToken(TypedDict):
    """Origin trial token.

    All keys are required. Used as the optional ``parsedToken`` field of
    ``OriginTrialTokenWithStatus``.
    """

    origin: str
    matchSubDomains: bool
    trialName: str
    expiryTime: TimeSinceEpoch
    isThirdParty: bool
    usageRestriction: OriginTrialUsageRestriction


class OriginTrialTokenWithStatus(TypedDict):
    """Origin trial token with status.

    ``rawTokenText`` and ``status`` are always present; ``parsedToken`` may be absent.
    """

    rawTokenText: str
    status: OriginTrialTokenStatus
    parsedToken: NotRequired[OriginTrialToken]


class OriginTrial(TypedDict):
    """Origin trial.

    Groups a trial name and its overall status with the list of tokens and their statuses.
    """

    trialName: str
    status: OriginTrialStatus
    tokensWithStatus: list[OriginTrialTokenWithStatus]


class SecurityOriginDetails(TypedDict):
    """Security origin details.

    Used as the optional ``securityOriginDetails`` field of ``Frame``.
    """

    isLocalhost: bool


class Frame(TypedDict):
    """Frame information.

    Keys wrapped in ``NotRequired`` may be absent from the dict; all other keys are
    mandatory. Used as the ``frame`` field of ``FrameTree`` and ``FrameResourceTree``.
    """

    # Required keys.
    id: FrameId
    loaderId: LoaderId
    url: str
    domainAndRegistry: str
    securityOrigin: str
    mimeType: str
    secureContextType: SecureContextType
    crossOriginIsolatedContextType: CrossOriginIsolatedContextType
    gatedAPIFeatures: list[GatedAPIFeatures]
    # Optional keys.
    parentId: NotRequired[FrameId]
    name: NotRequired[str]
    urlFragment: NotRequired[str]
    securityOriginDetails: NotRequired[SecurityOriginDetails]
    unreachableUrl: NotRequired[str]
    adFrameStatus: NotRequired[AdFrameStatus]


class FrameResource(TypedDict):
    """Frame resource information.

    ``url``, ``type`` and ``mimeType`` are always present; the remaining keys may be absent.
    """

    url: str
    type: ResourceType
    mimeType: str
    lastModified: NotRequired[TimeSinceEpoch]
    contentSize: NotRequired[float]
    failed: NotRequired[bool]
    canceled: NotRequired[bool]


class FrameResourceTree(TypedDict):
    """Frame resource tree.

    Recursive structure: each node holds a frame, that frame's resources, and optionally
    child nodes of the same type.
    """

    frame: Frame
    resources: list[FrameResource]
    # Forward reference (string) because the class refers to itself.
    childFrames: NotRequired[list['FrameResourceTree']]


class FrameTree(TypedDict):
    """Frame tree.

    Recursive structure: each node holds a frame and optionally child nodes of the same type.
    """

    frame: Frame
    # Forward reference (string) because the class refers to itself.
    childFrames: NotRequired[list['FrameTree']]


class NavigationEntry(TypedDict):
    """Navigation entry.

    All keys are required.
    """

    id: int
    url: str
    userTypedURL: str
    title: str
    transitionType: TransitionType


class ScreencastFrameMetadata(TypedDict):
    """Screencast frame metadata.

    All geometry keys are floats and required; ``timestamp`` may be absent.
    """

    offsetTop: float
    pageScaleFactor: float
    deviceWidth: float
    deviceHeight: float
    scrollOffsetX: float
    scrollOffsetY: float
    timestamp: NotRequired[TimeSinceEpoch]


class AppManifestError(TypedDict):
    """App manifest error.

    All keys are required.
    """

    message: str
    # Typed as int rather than bool. NOTE(review): presumably a 0/1 flag — confirm.
    critical: int
    line: int
    column: int


class AppManifestParsedProperties(TypedDict):
    """App manifest parsed properties.

    Currently declares a single required key, ``scope``.
    """

    scope: str


class LayoutViewport(TypedDict):
    """Layout viewport.

    All keys are required and typed as ``int`` (``VisualViewport`` uses ``float`` for
    its similarly named keys).
    """

    pageX: int
    pageY: int
    clientWidth: int
    clientHeight: int


class VisualViewport(TypedDict):
    """Visual viewport.

    All keys are floats; only ``zoom`` may be absent.
    """

    offsetX: float
    offsetY: float
    pageX: float
    pageY: float
    clientWidth: float
    clientHeight: float
    scale: float
    zoom: NotRequired[float]


class Viewport(TypedDict):
    """Viewport for capturing screenshot.

    All five keys are required floats.
    """

    x: float
    y: float
    width: float
    height: float
    scale: float


class FontFamilies(TypedDict, total=False):
    """Font families.

    Declared with ``total=False``, so every key is optional. Used as the
    ``fontFamilies`` field of ``ScriptFontFamilies``.
    """

    standard: str
    fixed: str
    serif: str
    sansSerif: str
    cursive: str
    fantasy: str
    math: str


class ScriptFontFamilies(TypedDict):
    """Script font families.

    Pairs a ``script`` string with a ``FontFamilies`` mapping; both keys are required.
    """

    script: str
    fontFamilies: FontFamilies


class FontSizes(TypedDict, total=False):
    """Font sizes.

    Declared with ``total=False``, so both keys are optional.
    """

    standard: int
    fixed: int


class CompilationCacheParams(TypedDict):
    """Compilation cache parameters.

    ``url`` is required; ``eager`` may be absent.
    """

    url: str
    eager: NotRequired[bool]


class FileFilter(TypedDict, total=False):
    """File filter.

    Declared with ``total=False``, so both keys are optional. Referenced by
    ``FileHandler.accepts`` and ``ShareTarget.files``.
    """

    name: str
    accepts: list[str]


class ImageResource(TypedDict):
    """Image resource.

    ``url`` is required; ``sizes`` and ``type`` may be absent.
    """

    url: str
    sizes: NotRequired[str]
    type: NotRequired[str]


class FileHandler(TypedDict):
    """File handler.

    ``action``, ``name`` and ``launchType`` are required; ``icons`` and ``accepts``
    may be absent.
    """

    action: str
    name: str
    launchType: str
    icons: NotRequired[list[ImageResource]]
    accepts: NotRequired[list[FileFilter]]


class LaunchHandler(TypedDict):
    """Launch handler.

    Used as the ``launchHandler`` field of ``WebAppManifest``.
    """

    clientMode: str


class ProtocolHandler(TypedDict):
    """Protocol handler.

    Both keys are required. Listed in ``WebAppManifest.protocolHandlers``.
    """

    protocol: str
    url: str


class RelatedApplication(TypedDict):
    """Related application.

    ``url`` is required; ``id`` may be absent. Listed in
    ``WebAppManifest.relatedApplications``.
    """

    url: str
    id: NotRequired[str]


class ScopeExtension(TypedDict):
    """Scope extension.

    Both keys are required. Listed in ``WebAppManifest.scopeExtensions``.
    """

    origin: str
    hasOriginWildcard: bool


class Screenshot(TypedDict):
    """Screenshot.

    ``image`` and ``formFactor`` are required; ``label`` may be absent. Listed in
    ``WebAppManifest.screenshots``.
    """

    image: ImageResource
    formFactor: str
    label: NotRequired[str]


class ShareTarget(TypedDict):
    """Share target.

    ``action``, ``method`` and ``enctype`` are required; the remaining keys may be absent.
    """

    action: str
    method: str
    enctype: str
    title: NotRequired[str]
    text: NotRequired[str]
    url: NotRequired[str]
    files: NotRequired[list[FileFilter]]


class Shortcut(TypedDict):
    """Shortcut.

    Both keys are required. Listed in ``WebAppManifest.shortcuts``.
    """

    name: str
    url: str


class WebAppManifest(TypedDict, total=False):
    """Web app manifest.

    Declared with ``total=False``, so every key is optional. Structured values reuse the
    other TypedDicts in this module (``FileHandler``, ``ImageResource``,
    ``LaunchHandler``, ``ProtocolHandler``, ``RelatedApplication``, ``ScopeExtension``,
    ``Screenshot``, ``ShareTarget``, ``Shortcut``).
    """

    backgroundColor: str
    description: str
    dir: str
    display: str
    displayOverrides: list[str]
    fileHandlers: list[FileHandler]
    icons: list[ImageResource]
    id: str
    lang: str
    launchHandler: LaunchHandler
    name: str
    orientation: str
    preferRelatedApplications: bool
    protocolHandlers: list[ProtocolHandler]
    relatedApplications: list[RelatedApplication]
    scope: str
    scopeExtensions: list[ScopeExtension]
    screenshots: list[Screenshot]
    shareTarget: ShareTarget
    shortName: str
    shortcuts: list[Shortcut]
    startUrl: str
    themeColor: str


class InstallabilityErrorArgument(TypedDict):
    """Installability error argument.

    A name/value pair of strings. Listed in ``InstallabilityError.errorArguments``.
    """

    name: str
    value: str


class InstallabilityError(TypedDict):
    """Installability error.

    Pairs an error id with a list of ``InstallabilityErrorArgument`` entries.
    """

    errorId: str
    errorArguments: list[InstallabilityErrorArgument]


class AutoResponseMode(str, Enum):
    """Auto response mode values.

    Members subclass ``str``, so each one compares equal to its raw string value.
    """

    NONE = 'none'
    AUTO_ACCEPT = 'autoAccept'
    AUTO_CHOOSE_TO_AUTH_ANOTHER_WAY = 'autoChooseToAuthAnotherWay'
    AUTO_REJECT = 'autoReject'
    AUTO_OPT_OUT = 'autoOptOut'


class WebLifecycleState(str, Enum):
    """Web lifecycle state values.

    Members subclass ``str``, so each one compares equal to its raw string value.
    """

    FROZEN = 'frozen'
    ACTIVE = 'active'


class ScreenshotFormat(str, Enum):
    """Screenshot format values.

    Members subclass ``str``, so each one compares equal to its raw string value.
    """

    JPEG = 'jpeg'
    PNG = 'png'
    WEBP = 'webp'

    @classmethod
    def has_value(cls, value: str) -> bool:
        """Return True when ``value`` is the raw string of one of the members."""
        known_values = cls._value2member_map_
        return value in known_values

    @classmethod
    def get_value(cls, value: str) -> 'ScreenshotFormat':
        """Return the member whose raw string equals ``value``.

        Raises:
            ValueError: If no member has that value.
        """
        member = cls(value)
        return member


class ScreencastFormat(str, Enum):
    """Screencast format values.

    Offers ``jpeg`` and ``png`` only; ``ScreenshotFormat`` additionally has ``webp``.
    """

    JPEG = 'jpeg'
    PNG = 'png'


class TransferMode(str, Enum):
    """Transfer mode values.

    Members subclass ``str``, so each one compares equal to its raw string value.
    """

    RETURN_AS_BASE64 = 'ReturnAsBase64'
    RETURN_AS_STREAM = 'ReturnAsStream'


================================================
FILE: pydoll/protocol/runtime/__init__.py
================================================
"""Runtime domain implementation."""


================================================
FILE: pydoll/protocol/runtime/events.py
================================================
from enum import Enum
from typing import Any

from typing_extensions import NotRequired, TypedDict

from pydoll.protocol.base import CDPEvent
from pydoll.protocol.runtime.types import (
    ExceptionDetails,
    ExecutionContextDescription,
    ExecutionContextId,
    RemoteObject,
    StackTrace,
    Timestamp,
)


class RuntimeEvent(str, Enum):
    """
    Events from the Runtime domain of the Chrome DevTools Protocol.

    This enumeration contains the names of Runtime-related events that can be
    received from the Chrome DevTools Protocol. These events provide information
    about JavaScript execution, console API calls, exceptions, and execution contexts.

    Each member's value is the event name string in the form ``'Runtime.<eventName>'``.
    The string literal placed directly after a member documents that event's payload
    fields; the matching ``*EventParams`` TypedDicts in this module type those payloads.
    """

    CONSOLE_API_CALLED = 'Runtime.consoleAPICalled'
    """
    Issued when console API was called.

    Args:
        type (str): Type of the call.
            Allowed Values: log, debug, info, error, warning, dir, dirxml, table, trace,
            clear, startGroup, startGroupCollapsed, endGroup, assert, profile, profileEnd,
            count, timeEnd
        args (array[RemoteObject]): Call arguments.
        executionContextId (ExecutionContextId): Identifier of the context where the call was made.
        timestamp (Timestamp): Call timestamp.
        stackTrace (StackTrace): Stack trace captured when the call was made. The async stack
            chain is automatically reported for the following call types: assert, error,
            trace, warning. For other types the async call chain can be retrieved using
            Debugger.getStackTrace and stackTrace.parentId field.
        context (str): Console context descriptor for calls on non-default console context
            (not console.*): 'anonymous#unique-logger-id' for call on unnamed context,
            'name#unique-logger-id' for call on named context.
    """

    EXCEPTION_REVOKED = 'Runtime.exceptionRevoked'
    """
    Issued when unhandled exception was revoked.

    Args:
        reason (str): Reason describing why exception was revoked.
        exceptionId (int): The id of revoked exception, as reported in exceptionThrown.
    """

    EXCEPTION_THROWN = 'Runtime.exceptionThrown'
    """
    Issued when exception was thrown and unhandled.

    Args:
        timestamp (Timestamp): Timestamp of the exception.
        exceptionDetails (ExceptionDetails): Details about the exception.
    """

    EXECUTION_CONTEXT_CREATED = 'Runtime.executionContextCreated'
    """
    Issued when new execution context is created.

    Args:
        context (ExecutionContextDescription): A newly created execution context.
    """

    EXECUTION_CONTEXT_DESTROYED = 'Runtime.executionContextDestroyed'
    """
    Issued when execution context is destroyed.

    Args:
        executionContextId (ExecutionContextId): Id of the destroyed context.
        executionContextUniqueId (str): Unique Id of the destroyed context.
    """

    EXECUTION_CONTEXTS_CLEARED = 'Runtime.executionContextsCleared'
    """
    Issued when all executionContexts were cleared in browser.
    """

    INSPECT_REQUESTED = 'Runtime.inspectRequested'
    """
    Issued when object should be inspected
    (for example, as a result of inspect() command line API call).

    Args:
        object (RemoteObject): Object to inspect.
        hints (object): Hints.
        executionContextId (ExecutionContextId): Identifier of the context where the call was made.
    """

    BINDING_CALLED = 'Runtime.bindingCalled'
    """
    Notification is issued every time when binding is called.

    Args:
        name (str): Name of the binding.
        payload (str): Payload of the binding.
        executionContextId (ExecutionContextId): Identifier of the context where the call was made.
    """


class ConsoleAPICallType(str, Enum):
    """Console API call types.

    Used as the ``type`` field of ``ConsoleAPICalledEventParams``. The values match the
    "Allowed Values" list documented on ``RuntimeEvent.CONSOLE_API_CALLED``.
    """

    LOG = 'log'
    DEBUG = 'debug'
    INFO = 'info'
    ERROR = 'error'
    WARNING = 'warning'
    DIR = 'dir'
    DIRXML = 'dirxml'
    TABLE = 'table'
    TRACE = 'trace'
    CLEAR = 'clear'
    START_GROUP = 'startGroup'
    START_GROUP_COLLAPSED = 'startGroupCollapsed'
    END_GROUP = 'endGroup'
    ASSERT = 'assert'
    PROFILE = 'profile'
    PROFILE_END = 'profileEnd'
    COUNT = 'count'
    TIME_END = 'timeEnd'


class BindingCalledEventParams(TypedDict):
    """Parameters for bindingCalled event.

    All three keys are required.
    """

    name: str
    payload: str
    executionContextId: ExecutionContextId


class ConsoleAPICalledEventParams(TypedDict):
    """Parameters for consoleAPICalled event.

    ``stackTrace`` and ``context`` may be absent; the other keys are required.
    """

    type: ConsoleAPICallType
    args: list[RemoteObject]
    executionContextId: ExecutionContextId
    timestamp: Timestamp
    stackTrace: NotRequired[StackTrace]
    context: NotRequired[str]


class ExceptionRevokedEventParams(TypedDict):
    """Parameters for exceptionRevoked event.

    Both keys are required.
    """

    reason: str
    exceptionId: int


class ExceptionThrownEventParams(TypedDict):
    """Parameters for exceptionThrown event.

    Both keys are required.
    """

    timestamp: Timestamp
    exceptionDetails: ExceptionDetails


class ExecutionContextCreatedEventParams(TypedDict):
    """Parameters for executionContextCreated event.

    Carries a single required key, ``context``.
    """

    context: ExecutionContextDescription


class ExecutionContextDestroyedEventParams(TypedDict):
    """Parameters for executionContextDestroyed event.

    Both keys are required: the context id and the context's unique id string.
    """

    executionContextId: ExecutionContextId
    executionContextUniqueId: str


class ExecutionContextsClearedEventParams(TypedDict):
    """Parameters for executionContextsCleared event (this TypedDict declares no keys)."""


class InspectRequestedEventParams(TypedDict):
    """Parameters for inspectRequested event.

    ``object`` and ``hints`` are required; ``executionContextId`` may be absent.
    """

    object: RemoteObject
    # Free-form mapping; the shape of its values is not constrained here.
    hints: dict[str, Any]
    executionContextId: NotRequired[ExecutionContextId]


# Event type aliases: CDPEvent parameterised with the params TypedDict of each Runtime event.
BindingCalledEvent = CDPEvent[BindingCalledEventParams]
ConsoleAPICalledEvent = CDPEvent[ConsoleAPICalledEventParams]
ExceptionRevokedEvent = CDPEvent[ExceptionRevokedEventParams]
ExceptionThrownEvent = CDPEvent[ExceptionThrownEventParams]
ExecutionContextCreatedEvent = CDPEvent[ExecutionContextCreatedEventParams]
ExecutionContextDestroyedEvent = CDPEvent[ExecutionContextDestroyedEventParams]
ExecutionContextsClearedEvent = CDPEvent[ExecutionContextsClearedEventParams]
InspectRequestedEvent = CDPEvent[InspectRequestedEventParams]


================================================
FILE: pydoll/protocol/runtime/methods.py
================================================
from enum import Enum

from typing_extensions import NotRequired, TypedDict

from pydoll.protocol.base import Command, EmptyParams, EmptyResponse, Response
from pydoll.protocol.runtime.types import (
    CallArgument,
    ExceptionDetails,
    ExecutionContextId,
    InternalPropertyDescriptor,
    PrivatePropertyDescriptor,
    PropertyDescriptor,
    RemoteObject,
    RemoteObjectId,
    ScriptId,
    SerializationOptions,
    TimeDelta,
)


class RuntimeMethod(str, Enum):
    """Runtime domain method names.

    Every value has the form ``Runtime.<methodName>``. Because the enum mixes
    in ``str``, each member compares equal to its string value.
    """

    ADD_BINDING = 'Runtime.addBinding'
    AWAIT_PROMISE = 'Runtime.awaitPromise'
    CALL_FUNCTION_ON = 'Runtime.callFunctionOn'
    COMPILE_SCRIPT = 'Runtime.compileScript'
    DISABLE = 'Runtime.disable'
    DISCARD_CONSOLE_ENTRIES = 'Runtime.discardConsoleEntries'
    ENABLE = 'Runtime.enable'
    EVALUATE = 'Runtime.evaluate'
    GET_EXCEPTION_DETAILS = 'Runtime.getExceptionDetails'
    GET_HEAP_USAGE = 'Runtime.getHeapUsage'
    GET_ISOLATE_ID = 'Runtime.getIsolateId'
    GET_PROPERTIES = 'Runtime.getProperties'
    GLOBAL_LEXICAL_SCOPE_NAMES = 'Runtime.globalLexicalScopeNames'
    QUERY_OBJECTS = 'Runtime.queryObjects'
    RELEASE_OBJECT = 'Runtime.releaseObject'
    RELEASE_OBJECT_GROUP = 'Runtime.releaseObjectGroup'
    REMOVE_BINDING = 'Runtime.removeBinding'
    RUN_IF_WAITING_FOR_DEBUGGER = 'Runtime.runIfWaitingForDebugger'
    RUN_SCRIPT = 'Runtime.runScript'
    SET_ASYNC_CALL_STACK_DEPTH = 'Runtime.setAsyncCallStackDepth'
    SET_CUSTOM_OBJECT_FORMATTER_ENABLED = 'Runtime.setCustomObjectFormatterEnabled'
    SET_MAX_CALL_STACK_SIZE_TO_CAPTURE = 'Runtime.setMaxCallStackSizeToCapture'
    TERMINATE_EXECUTION = 'Runtime.terminateExecution'


# Parameter types
class AddBindingParams(TypedDict):
    """Parameters for addBinding command.

    Required keys: name.
    Optional keys: executionContextId, executionContextName.
    """

    name: str
    # Two optional ways to designate a context: by id or by name.
    executionContextId: NotRequired[ExecutionContextId]
    executionContextName: NotRequired[str]


class AwaitPromiseParams(TypedDict):
    """Parameters for awaitPromise command.

    Required keys: promiseObjectId.
    Optional keys: returnByValue, generatePreview.
    """

    promiseObjectId: RemoteObjectId
    returnByValue: NotRequired[bool]
    generatePreview: NotRequired[bool]


class CallFunctionOnParams(TypedDict):
    """Parameters for callFunctionOn command.

    Only ``functionDeclaration`` is required; every other key is optional.
    """

    functionDeclaration: str
    # Everything below is NotRequired.
    objectId: NotRequired[RemoteObjectId]
    arguments: NotRequired[list[CallArgument]]
    silent: NotRequired[bool]
    returnByValue: NotRequired[bool]
    generatePreview: NotRequired[bool]
    userGesture: NotRequired[bool]
    awaitPromise: NotRequired[bool]
    executionContextId: NotRequired[ExecutionContextId]
    objectGroup: NotRequired[str]
    throwOnSideEffect: NotRequired[bool]
    uniqueContextId: NotRequired[str]
    serializationOptions: NotRequired[SerializationOptions]


class CompileScriptParams(TypedDict):
    """Parameters for compileScript command.

    Required keys: expression, sourceURL, persistScript.
    Optional keys: executionContextId.
    """

    expression: str
    sourceURL: str
    persistScript: bool
    executionContextId: NotRequired[ExecutionContextId]


class EvaluateParams(TypedDict):
    """Parameters for evaluate command.

    Only ``expression`` is required; every other key is optional.
    """

    expression: str
    # Everything below is NotRequired.
    objectGroup: NotRequired[str]
    includeCommandLineAPI: NotRequired[bool]
    silent: NotRequired[bool]
    # Named ``contextId`` here, whereas CallFunctionOnParams and RunScriptParams
    # use ``executionContextId`` for a key of the same type.
    contextId: NotRequired[ExecutionContextId]
    returnByValue: NotRequired[bool]
    generatePreview: NotRequired[bool]
    userGesture: NotRequired[bool]
    awaitPromise: NotRequired[bool]
    throwOnSideEffect: NotRequired[bool]
    # NOTE(review): TimeDelta is a float alias; unit presumably milliseconds - confirm.
    timeout: NotRequired[TimeDelta]
    disableBreaks: NotRequired[bool]
    replMode: NotRequired[bool]
    allowUnsafeEvalBlockedByCSP: NotRequired[bool]
    uniqueContextId: NotRequired[str]
    serializationOptions: NotRequired[SerializationOptions]


class GetExceptionDetailsParams(TypedDict):
    """Parameters for getExceptionDetails command.

    The single key is required.
    """

    errorObjectId: RemoteObjectId


class GetPropertiesParams(TypedDict):
    """Parameters for getProperties command.

    Required keys: objectId.
    Optional keys: ownProperties, accessorPropertiesOnly, generatePreview,
    nonIndexedPropertiesOnly.
    """

    objectId: RemoteObjectId
    ownProperties: NotRequired[bool]
    accessorPropertiesOnly: NotRequired[bool]
    generatePreview: NotRequired[bool]
    nonIndexedPropertiesOnly: NotRequired[bool]


class GlobalLexicalScopeNamesParams(TypedDict, total=False):
    """Parameters for globalLexicalScopeNames command.

    Declared with ``total=False``, so the single key is optional.
    """

    executionContextId: ExecutionContextId


class QueryObjectsParams(TypedDict):
    """Parameters for queryObjects command.

    Required keys: prototypeObjectId.
    Optional keys: objectGroup.
    """

    prototypeObjectId: RemoteObjectId
    objectGroup: NotRequired[str]


class ReleaseObjectParams(TypedDict):
    """Parameters for releaseObject command.

    The single key is required.
    """

    objectId: RemoteObjectId


class ReleaseObjectGroupParams(TypedDict):
    """Parameters for releaseObjectGroup command.

    The single key is required.
    """

    objectGroup: str


class RemoveBindingParams(TypedDict):
    """Parameters for removeBinding command.

    The single key is required.
    """

    name: str


class RunScriptParams(TypedDict):
    """Parameters for runScript command.

    Only ``scriptId`` is required; every other key is optional.
    """

    scriptId: ScriptId
    # Everything below is NotRequired.
    executionContextId: NotRequired[ExecutionContextId]
    objectGroup: NotRequired[str]
    silent: NotRequired[bool]
    includeCommandLineAPI: NotRequired[bool]
    returnByValue: NotRequired[bool]
    generatePreview: NotRequired[bool]
    awaitPromise: NotRequired[bool]


class SetAsyncCallStackDepthParams(TypedDict):
    """Parameters for setAsyncCallStackDepth command.

    The single key is required.
    """

    maxDepth: int


class SetCustomObjectFormatterEnabledParams(TypedDict):
    """Parameters for setCustomObjectFormatterEnabled command.

    The single key is required.
    """

    enabled: bool


class SetMaxCallStackSizeToCaptureParams(TypedDict):
    """Parameters for setMaxCallStackSizeToCapture command.

    The single key is required.
    """

    size: int


# Result types
class AwaitPromiseResult(TypedDict):
    """Result for awaitPromise command.

    Required keys: result.
    Optional keys: exceptionDetails.
    """

    result: RemoteObject
    exceptionDetails: NotRequired[ExceptionDetails]


class CallFunctionOnResult(TypedDict):
    """Result for callFunctionOn command.

    Required keys: result.
    Optional keys: exceptionDetails.
    """

    result: RemoteObject
    exceptionDetails: NotRequired[ExceptionDetails]


class CompileScriptResult(TypedDict, total=False):
    """Result for compileScript command.

    Declared with ``total=False``, so both keys are optional; callers must
    check for presence before reading either one.
    """

    scriptId: ScriptId
    exceptionDetails: ExceptionDetails


class EvaluateResult(TypedDict):
    """Result for evaluate command.

    Required keys: result.
    Optional keys: exceptionDetails.
    """

    result: RemoteObject
    exceptionDetails: NotRequired[ExceptionDetails]


class GetExceptionDetailsResult(TypedDict, total=False):
    """Result for getExceptionDetails command.

    Declared with ``total=False``, so the single key is optional.
    """

    exceptionDetails: ExceptionDetails


class GetHeapUsageResult(TypedDict):
    """Result for getHeapUsage command.

    All four keys are required floats.
    """

    # NOTE(review): sizes are presumably expressed in bytes - confirm against CDP.
    usedSize: float
    totalSize: float
    embedderHeapUsedSize: float
    backingStorageSize: float


class GetIsolateIdResult(TypedDict):
    """Result for getIsolateId command.

    The single key is required.
    """

    id: str


class GetPropertiesResult(TypedDict):
    """Result for getProperties command.

    Required keys: result.
    Optional keys: internalProperties, privateProperties, exceptionDetails.
    """

    result: list[PropertyDescriptor]
    # Internal and private properties are reported in separate optional lists.
    internalProperties: NotRequired[list[InternalPropertyDescriptor]]
    privateProperties: NotRequired[list[PrivatePropertyDescriptor]]
    exceptionDetails: NotRequired[ExceptionDetails]


class GlobalLexicalScopeNamesResult(TypedDict):
    """Result for globalLexicalScopeNames command.

    The single key is required.
    """

    names: list[str]


class QueryObjectsResult(TypedDict):
    """Result for queryObjects command.

    The single key is required.
    """

    # Despite the plural key name, the value is one RemoteObject, not a list.
    objects: RemoteObject


class RunScriptResult(TypedDict):
    """Result for runScript command.

    Required keys: result.
    Optional keys: exceptionDetails.
    """

    result: RemoteObject
    exceptionDetails: NotRequired[ExceptionDetails]


# Response types
# Each alias subscripts the generic Response with the result TypedDict of one
# Runtime command. Commands that have no result TypedDict get no alias here;
# their command aliases use Response[EmptyResponse] directly.
AwaitPromiseResponse = Response[AwaitPromiseResult]
CallFunctionOnResponse = Response[CallFunctionOnResult]
CompileScriptResponse = Response[CompileScriptResult]
EvaluateResponse = Response[EvaluateResult]
GetExceptionDetailsResponse = Response[GetExceptionDetailsResult]
GetHeapUsageResponse = Response[GetHeapUsageResult]
GetIsolateIdResponse = Response[GetIsolateIdResult]
GetPropertiesResponse = Response[GetPropertiesResult]
GlobalLexicalScopeNamesResponse = Response[GlobalLexicalScopeNamesResult]
QueryObjectsResponse = Response[QueryObjectsResult]
RunScriptResponse = Response[RunScriptResult]


# Command types
# Each alias subscripts the generic Command with two arguments: the params
# TypedDict of the command and its response type. Commands declared without a
# params TypedDict use EmptyParams, and commands without a result TypedDict
# use Response[EmptyResponse].
AddBindingCommand = Command[AddBindingParams, Response[EmptyResponse]]
AwaitPromiseCommand = Command[AwaitPromiseParams, AwaitPromiseResponse]
CallFunctionOnCommand = Command[CallFunctionOnParams, CallFunctionOnResponse]
CompileScriptCommand = Command[CompileScriptParams, CompileScriptResponse]
DisableCommand = Command[EmptyParams, Response[EmptyResponse]]
DiscardConsoleEntriesCommand = Command[EmptyParams, Response[EmptyResponse]]
EnableCommand = Command[EmptyParams, Response[EmptyResponse]]
EvaluateCommand = Command[EvaluateParams, EvaluateResponse]
GetExceptionDetailsCommand = Command[GetExceptionDetailsParams, GetExceptionDetailsResponse]
GetHeapUsageCommand = Command[EmptyParams, GetHeapUsageResponse]
GetIsolateIdCommand = Command[EmptyParams, GetIsolateIdResponse]
GetPropertiesCommand = Command[GetPropertiesParams, GetPropertiesResponse]
GlobalLexicalScopeNamesCommand = Command[
    GlobalLexicalScopeNamesParams, GlobalLexicalScopeNamesResponse
]
QueryObjectsCommand = Command[QueryObjectsParams, QueryObjectsResponse]
ReleaseObjectCommand = Command[ReleaseObjectParams, Response[EmptyResponse]]
ReleaseObjectGroupCommand = Command[ReleaseObjectGroupParams, Response[EmptyResponse]]
RemoveBindingCommand = Command[RemoveBindingParams, Response[EmptyResponse]]
RunIfWaitingForDebuggerCommand = Command[EmptyParams, Response[EmptyResponse]]
RunScriptCommand = Command[RunScriptParams, RunScriptResponse]
SetAsyncCallStackDepthCommand = Command[SetAsyncCallStackDepthParams, Response[EmptyResponse]]
SetCustomObjectFormatterEnabledCommand = Command[
    SetCustomObjectFormatterEnabledParams, Response[EmptyResponse]
]
SetMaxCallStackSizeToCaptureCommand = Command[
    SetMaxCallStackSizeToCaptureParams, Response[EmptyResponse]
]
TerminateExecutionCommand = Command[EmptyParams, Response[EmptyResponse]]


================================================
FILE: pydoll/protocol/runtime/types.py
================================================
from enum import Enum
from typing import Any

from typing_extensions import NotRequired, TypedDict

# Scalar aliases for Runtime-domain identifiers and numeric values. They are
# plain assignments, so at runtime each name is the builtin type itself; the
# aliases only make annotations more descriptive.
ScriptId = str
RemoteObjectId = str
UnserializableValue = str
ExecutionContextId = int
Timestamp = float
TimeDelta = float
UniqueDebuggerId = str


class SerializationType(str, Enum):
    """Serialization types.

    Annotates ``SerializationOptions.serialization``. Members mix in ``str``,
    so each compares equal to its string value.
    """

    DEEP = 'deep'
    JSON = 'json'
    ID_ONLY = 'idOnly'


class DeepSerializedValueType(str, Enum):
    """Deep serialized value types.

    Annotates ``DeepSerializedValue.type``. Members mix in ``str``, so each
    compares equal to its string value.
    """

    UNDEFINED = 'undefined'
    NULL = 'null'
    STRING = 'string'
    NUMBER = 'number'
    BOOLEAN = 'boolean'
    BIGINT = 'bigint'
    REGEXP = 'regexp'
    DATE = 'date'
    SYMBOL = 'symbol'
    ARRAY = 'array'
    OBJECT = 'object'
    FUNCTION = 'function'
    MAP = 'map'
    SET = 'set'
    WEAKMAP = 'weakmap'
    WEAKSET = 'weakset'
    ERROR = 'error'
    PROXY = 'proxy'
    PROMISE = 'promise'
    TYPEDARRAY = 'typedarray'
    ARRAYBUFFER = 'arraybuffer'
    NODE = 'node'
    WINDOW = 'window'
    GENERATOR = 'generator'


class RemoteObjectType(str, Enum):
    """Remote object types.

    Annotates ``RemoteObject.type``. Members mix in ``str``, so each compares
    equal to its string value.
    """

    OBJECT = 'object'
    FUNCTION = 'function'
    UNDEFINED = 'undefined'
    STRING = 'string'
    NUMBER = 'number'
    BOOLEAN = 'boolean'
    SYMBOL = 'symbol'
    BIGINT = 'bigint'


class RemoteObjectSubtype(str, Enum):
    """Remote object subtypes.

    Annotates the optional ``RemoteObject.subtype`` key. ObjectPreviewSubtype
    and PropertyPreviewSubtype declare the same member list, so a change here
    most likely needs mirroring there.
    """

    ARRAY = 'array'
    NULL = 'null'
    NODE = 'node'
    REGEXP = 'regexp'
    DATE = 'date'
    MAP = 'map'
    SET = 'set'
    WEAKMAP = 'weakmap'
    WEAKSET = 'weakset'
    ITERATOR = 'iterator'
    GENERATOR = 'generator'
    ERROR = 'error'
    PROXY = 'proxy'
    PROMISE = 'promise'
    TYPEDARRAY = 'typedarray'
    ARRAYBUFFER = 'arraybuffer'
    DATAVIEW = 'dataview'
    WEBASSEMBLYMEMORY = 'webassemblymemory'
    WASMVALUE = 'wasmvalue'


class ObjectPreviewType(str, Enum):
    """Object preview types.

    Annotates ``ObjectPreview.type``. The member list is identical to
    RemoteObjectType.
    """

    OBJECT = 'object'
    FUNCTION = 'function'
    UNDEFINED = 'undefined'
    STRING = 'string'
    NUMBER = 'number'
    BOOLEAN = 'boolean'
    SYMBOL = 'symbol'
    BIGINT = 'bigint'


class ObjectPreviewSubtype(str, Enum):
    """Object preview subtypes.

    Annotates the optional ``ObjectPreview.subtype`` key. The member list is
    identical to RemoteObjectSubtype.
    """

    ARRAY = 'array'
    NULL = 'null'
    NODE = 'node'
    REGEXP = 'regexp'
    DATE = 'date'
    MAP = 'map'
    SET = 'set'
    WEAKMAP = 'weakmap'
    WEAKSET = 'weakset'
    ITERATOR = 'iterator'
    GENERATOR = 'generator'
    ERROR = 'error'
    PROXY = 'proxy'
    PROMISE = 'promise'
    TYPEDARRAY = 'typedarray'
    ARRAYBUFFER = 'arraybuffer'
    DATAVIEW = 'dataview'
    WEBASSEMBLYMEMORY = 'webassemblymemory'
    WASMVALUE = 'wasmvalue'


class PropertyPreviewType(str, Enum):
    """Property preview types.

    Annotates ``PropertyPreview.type``. Compared with RemoteObjectType and
    ObjectPreviewType, this enum has one extra member, ``ACCESSOR``.
    """

    OBJECT = 'object'
    FUNCTION = 'function'
    UNDEFINED = 'undefined'
    STRING = 'string'
    NUMBER = 'number'
    BOOLEAN = 'boolean'
    SYMBOL = 'symbol'
    ACCESSOR = 'accessor'
    BIGINT = 'bigint'


class PropertyPreviewSubtype(str, Enum):
    """Property preview subtypes.

    Annotates the optional ``PropertyPreview.subtype`` key. The member list is
    identical to RemoteObjectSubtype.
    """

    ARRAY = 'array'
    NULL = 'null'
    NODE = 'node'
    REGEXP = 'regexp'
    DATE = 'date'
    MAP = 'map'
    SET = 'set'
    WEAKMAP = 'weakmap'
    WEAKSET = 'weakset'
    ITERATOR = 'iterator'
    GENERATOR = 'generator'
    ERROR = 'error'
    PROXY = 'proxy'
    PROMISE = 'promise'
    TYPEDARRAY = 'typedarray'
    ARRAYBUFFER = 'arraybuffer'
    DATAVIEW = 'dataview'
    WEBASSEMBLYMEMORY = 'webassemblymemory'
    WASMVALUE = 'wasmvalue'


class SerializationOptions(TypedDict):
    """Represents options for serialization.

    Required keys: serialization.
    Optional keys: maxDepth, additionalParameters.
    """

    serialization: SerializationType
    maxDepth: NotRequired[int]
    additionalParameters: NotRequired[dict[str, Any]]  # free-form; no schema declared here


class DeepSerializedValue(TypedDict):
    """Represents deep serialized value.

    Required keys: type.
    Optional keys: value, objectId, weakLocalObjectReference.
    """

    type: DeepSerializedValueType
    value: NotRequired[Any]
    objectId: NotRequired[str]
    weakLocalObjectReference: NotRequired[int]


class CustomPreview(TypedDict):
    """Custom preview for objects.

    Required keys: header.
    Optional keys: bodyGetterId.
    """

    header: str
    bodyGetterId: NotRequired[RemoteObjectId]


class PropertyPreview(TypedDict):
    """Property preview for objects.

    Required keys: name, type.
    Optional keys: value, valuePreview, subtype.
    """

    name: str
    type: PropertyPreviewType
    value: NotRequired[str]
    # Quoted forward reference: ObjectPreview is defined later in this module.
    valuePreview: NotRequired['ObjectPreview']
    subtype: NotRequired[PropertyPreviewSubtype]


class EntryPreview(TypedDict):
    """Entry preview for collections.

    Required keys: value.
    Optional keys: key.
    """

    # Both annotations are quoted forward references: ObjectPreview is defined
    # later in this module.
    value: 'ObjectPreview'
    key: NotRequired['ObjectPreview']


class ObjectPreview(TypedDict):
    """Object containing abbreviated remote object value.

    Required keys: type, overflow, properties.
    Optional keys: subtype, description, entries.
    """

    type: ObjectPreviewType
    overflow: bool
    properties: list[PropertyPreview]
    subtype: NotRequired[ObjectPreviewSubtype]
    description: NotRequired[str]
    entries: NotRequired[list[EntryPreview]]


class RemoteObject(TypedDict):
    """Mirror object referencing original JavaScript object.

    Only ``type`` is required; every other key is optional, so callers must
    check for presence before reading ``value``, ``objectId`` and the rest.
    """

    type: RemoteObjectType
    # Everything below is NotRequired.
    subtype: NotRequired[RemoteObjectSubtype]
    className: NotRequired[str]
    value: NotRequired[Any]
    unserializableValue: NotRequired[UnserializableValue]
    description: NotRequired[str]
    deepSerializedValue: NotRequired[DeepSerializedValue]
    objectId: NotRequired[RemoteObjectId]
    preview: NotRequired[ObjectPreview]
    customPreview: NotRequired[CustomPreview]


class PropertyDescriptor(TypedDict):
    """Object property descriptor.

    Required keys: name, configurable, enumerable.
    Optional keys: value, writable, get, set, wasThrown, isOwn, symbol.
    """

    name: str
    configurable: bool
    enumerable: bool
    # Everything below is NotRequired.
    value: NotRequired[RemoteObject]
    writable: NotRequired[bool]
    get: NotRequired[RemoteObject]
    set: NotRequired[RemoteObject]
    wasThrown: NotRequired[bool]
    isOwn: NotRequired[bool]
    symbol: NotRequired[RemoteObject]


class InternalPropertyDescriptor(TypedDict):
    """Object internal property descriptor.

    Required keys: name.
    Optional keys: value.
    """

    name: str
    value: NotRequired[RemoteObject]


class PrivatePropertyDescriptor(TypedDict):
    """Object private field descriptor.

    Required keys: name.
    Optional keys: value, get, set.
    """

    name: str
    value: NotRequired[RemoteObject]
    get: NotRequired[RemoteObject]
    set: NotRequired[RemoteObject]


class CallArgument(TypedDict, total=False):
    """Represents function call argument.

    Declared with ``total=False``, so all three keys are optional.
    """

    # NOTE(review): presumably only one of the three keys is set per argument - confirm.
    value: Any
    unserializableValue: UnserializableValue
    objectId: RemoteObjectId


class ExecutionContextDescription(TypedDict):
    """Description of an isolated world.

    Required keys: id, origin, name, uniqueId.
    Optional keys: auxData.
    """

    id: ExecutionContextId
    origin: str
    name: str
    uniqueId: str
    auxData: NotRequired[dict[str, Any]]  # free-form; no schema declared here


class ExceptionDetails(TypedDict):
    """Detailed information about exception.

    Required keys: exceptionId, text, lineNumber, columnNumber.
    Optional keys: scriptId, url, stackTrace, exception, executionContextId,
    exceptionMetaData.
    """

    exceptionId: int
    text: str
    # NOTE(review): line and column are presumably 0-based per CDP - confirm.
    lineNumber: int
    columnNumber: int
    # Everything below is NotRequired.
    scriptId: NotRequired[ScriptId]
    url: NotRequired[str]
    # Quoted forward reference: StackTrace is defined later in this module.
    stackTrace: NotRequired['StackTrace']
    exception: NotRequired[RemoteObject]
    executionContextId: NotRequired[ExecutionContextId]
    exceptionMetaData: NotRequired[dict[str, Any]]


class CallFrame(TypedDict):
    """Stack entry for runtime errors and assertions.

    All five keys are required.
    """

    functionName: str
    scriptId: ScriptId
    url: str
    # NOTE(review): line and column are presumably 0-based per CDP - confirm.
    lineNumber: int
    columnNumber: int


class StackTraceId(TypedDict):
    """Stack trace identifier.

    Required keys: id.
    Optional keys: debuggerId.
    """

    id: str
    debuggerId: NotRequired[UniqueDebuggerId]


class StackTrace(TypedDict):
    """Call frames for assertions or error messages.

    Required keys: callFrames.
    Optional keys: description, parent, parentId.
    """

    callFrames: list[CallFrame]
    description: NotRequired[str]
    # Self-referential: a trace may embed its parent trace directly (quoted
    # because the class is still being defined) or point to it via parentId.
    parent: NotRequired['StackTrace']
    parentId: NotRequired[StackTraceId]


================================================
FILE: pydoll/protocol/security/types.py
================================================
from enum import Enum


class MixedContentType(str, Enum):
    """
    The mixed content type of the request.

    Members mix in ``str``, so each compares equal to its string value.
    """

    BLOCKABLE = 'blockable'
    OPTIONALLY_BLOCKABLE = 'optionally-blockable'
    NONE = 'none'


class SecurityState(str, Enum):
    """
    The security state of the page.

    Members mix in ``str``, so each compares equal to its string value.
    """

    UNKNOWN = 'unknown'
    NEUTRAL = 'neutral'
    # NOTE(review): 'safe' does not appear to be among the values CDP documents
    # for Security.SecurityState - confirm whether the browser ever emits it.
    SAFE = 'safe'
    INSECURE = 'insecure'
    SECURE = 'secure'
    INFO = 'info'
    INSECURE_BROKEN = 'insecure-broken'


================================================
FILE: pydoll/protocol/storage/__init__.py
================================================
"""Storage domain implementation."""


================================================
FILE: pydoll/protocol/storage/events.py
================================================
from enum import Enum
from typing import Any

from typing_extensions import NotRequired, TypedDict

from pydoll.protocol.base import CDPEvent
from pydoll.protocol.network.types import RequestId, TimeSinceEpoch
from pydoll.protocol.page.types import FrameId
from pydoll.protocol.storage.types import (
    AttributionReportingAggregatableResult,
    AttributionReportingEventLevelResult,
    AttributionReportingReportResult,
    AttributionReportingSourceRegistration,
    AttributionReportingSourceRegistrationResult,
    AttributionReportingTriggerRegistration,
    InterestGroupAccessType,
    InterestGroupAuctionEventType,
    InterestGroupAuctionFetchType,
    InterestGroupAuctionId,
    SharedStorageAccessMethod,
    SharedStorageAccessParams,
    SharedStorageAccessScope,
    StorageBucketInfo,
)
from pydoll.protocol.target.types import TargetID


class StorageEvent(str, Enum):
    """
    Events from the Storage domain of the Chrome DevTools Protocol.

    This enumeration contains the names of Storage-related events that can be
    received from the Chrome DevTools Protocol. These events provide information
    about changes to various browser storage mechanisms including Cache Storage,
    IndexedDB, Interest Groups, Shared Storage, Storage Buckets, and
    Attribution Reporting.

    Every value has the form ``Storage.<eventName>``; because the enum mixes in
    ``str``, each member compares equal to its string value. The string that
    follows each member documents that event's payload keys.
    """

    CACHE_STORAGE_CONTENT_UPDATED = 'Storage.cacheStorageContentUpdated'
    """
    A cache's contents have been modified.

    Args:
        origin (str): Origin to update.
        storageKey (str): Storage key to update.
        bucketId (str): Storage bucket to update.
        cacheName (str): Name of cache in origin.
    """

    CACHE_STORAGE_LIST_UPDATED = 'Storage.cacheStorageListUpdated'
    """
    A cache has been added/deleted.

    Args:
        origin (str): Origin to update.
        storageKey (str): Storage key to update.
        bucketId (str): Storage bucket to update.
    """

    INDEXED_DB_CONTENT_UPDATED = 'Storage.indexedDBContentUpdated'
    """
    The origin's IndexedDB object store has been modified.

    Args:
        origin (str): Origin to update.
        storageKey (str): Storage key to update.
        bucketId (str): Storage bucket to update.
        databaseName (str): Database to update.
        objectStoreName (str): ObjectStore to update.
    """

    INDEXED_DB_LIST_UPDATED = 'Storage.indexedDBListUpdated'
    """
    The origin's IndexedDB database list has been modified.

    Args:
        origin (str): Origin to update.
        storageKey (str): Storage key to update.
        bucketId (str): Storage bucket to update.
    """

    INTEREST_GROUP_ACCESSED = 'Storage.interestGroupAccessed'
    """
    One of the interest groups was accessed. Note that these events are global
    to all targets sharing an interest group store.

    Args:
        accessTime (Network.TimeSinceEpoch): Time of the access.
        type (InterestGroupAccessType): Type of access.
        ownerOrigin (str): Owner origin.
        name (str): Name of the interest group.
        componentSellerOrigin (str): For topLevelBid/topLevelAdditionalBid, and when
            appropriate, win and additionalBidWin.
        bid (number): For bid or somethingBid event, if done locally and not on a server.
        bidCurrency (str): Currency of the bid.
        uniqueAuctionId (InterestGroupAuctionId): For non-global events --- links
            to interestGroupAuctionEvent.
    """

    INTEREST_GROUP_AUCTION_EVENT_OCCURRED = 'Storage.interestGroupAuctionEventOccurred'
    """
    An auction involving interest groups is taking place. These events are target-specific.

    Args:
        eventTime (Network.TimeSinceEpoch): Time of the event.
        type (InterestGroupAuctionEventType): Type of auction event.
        uniqueAuctionId (InterestGroupAuctionId): Unique identifier for the auction.
        parentAuctionId (InterestGroupAuctionId): Set for child auctions.
        auctionConfig (object): Set for started and configResolved.
    """

    INTEREST_GROUP_AUCTION_NETWORK_REQUEST_CREATED = (
        'Storage.interestGroupAuctionNetworkRequestCreated'
    )
    """
    Specifies which auctions a particular network fetch may be related to, and in what role.
    Note that it is not ordered with respect to Network.requestWillBeSent (but will happen
    before loadingFinished loadingFailed).

    Args:
        type (InterestGroupAuctionFetchType): Type of fetch.
        requestId (Network.RequestId): Request identifier.
        auctions (array[InterestGroupAuctionId]): This is the set of the auctions using the
            worklet that issued this request. In the case of trusted signals, it's possible
            that only some of them actually care about the keys being queried.
    """

    SHARED_STORAGE_ACCESSED = 'Storage.sharedStorageAccessed'
    """
    Shared storage was accessed by the associated page. The following parameters
    are included in all events.

    Args:
        accessTime (Network.TimeSinceEpoch): Time of the access.
        scope (SharedStorageAccessScope): Enum value indicating the access scope.
        method (SharedStorageAccessMethod): Enum value indicating the Shared Storage API
            method invoked.
        mainFrameId (Page.FrameId): DevTools Frame Token for the primary frame tree's root.
        ownerOrigin (str): Serialization of the origin owning the Shared Storage data.
        ownerSite (str): Serialization of the site owning the Shared Storage data.
        params (SharedStorageAccessParams): The sub-parameters wrapped by params are all
            optional and their presence/absence depends on type.
    """

    SHARED_STORAGE_WORKLET_OPERATION_EXECUTION_FINISHED = (
        'Storage.sharedStorageWorkletOperationExecutionFinished'
    )
    """
    A shared storage run or selectURL operation finished its execution.
    The following parameters are included in all events.

    Args:
        finishedTime (Network.TimeSinceEpoch): Time that the operation finished.
        executionTime (int): Time, in microseconds, from start of shared storage JS API
            call until end of operation execution in the worklet.
        method (SharedStorageAccessMethod): Enum value indicating the Shared Storage API
            method invoked.
        operationId (str): ID of the operation call.
        workletTargetId (Target.TargetID): Hex representation of the DevTools token used
            as the TargetID for the associated shared storage worklet.
        mainFrameId (Page.FrameId): DevTools Frame Token for the primary frame tree's root.
        ownerOrigin (str): Serialization of the origin owning the Shared Storage data.
    """

    STORAGE_BUCKET_CREATED_OR_UPDATED = 'Storage.storageBucketCreatedOrUpdated'
    """
    Fired when a storage bucket is created or updated.

    Args:
        bucketInfo (StorageBucketInfo): Information about the storage bucket.
    """

    STORAGE_BUCKET_DELETED = 'Storage.storageBucketDeleted'
    """
    Fired when a storage bucket is deleted.

    Args:
        bucketId (str): ID of the deleted storage bucket.
    """

    ATTRIBUTION_REPORTING_SOURCE_REGISTERED = 'Storage.attributionReportingSourceRegistered'
    """
    Fired when an attribution source is registered.

    Args:
        registration (AttributionReportingSourceRegistration): Registration details.
        result (AttributionReportingSourceRegistrationResult): Result of the registration.
    """

    ATTRIBUTION_REPORTING_TRIGGER_REGISTERED = 'Storage.attributionReportingTriggerRegistered'
    """
    Fired when an attribution trigger is registered.

    Args:
        registration (AttributionReportingTriggerRegistration): Registration details.
        eventLevel (AttributionReportingEventLevelResult): Event level result.
        aggregatable (AttributionReportingAggregatableResult): Aggregatable result.
    """

    ATTRIBUTION_REPORTING_REPORT_SENT = 'Storage.attributionReportingReportSent'
    """
    Fired when an attribution report is sent.

    Args:
        url (str): URL the report was sent to.
        body (object): Body of the report.
        result (AttributionReportingReportResult): Result of the report sending.
        netError (int): If result is sent, populated with net/HTTP status.
        netErrorName (str): Name of the network error if any.
        httpStatusCode (int): HTTP status code if available.
    """

    ATTRIBUTION_REPORTING_VERBOSE_DEBUG_REPORT_SENT = (
        'Storage.attributionReportingVerboseDebugReportSent'
    )
    """
    Fired when a verbose debug report is sent for an attribution source.

    Args:
        url (str): URL the report was sent to.
        body (array[object]): Body of the report.
        netError (int): If result is sent, populated with net/HTTP status.
        netErrorName (str): Name of the network error if any.
        httpStatusCode (int): HTTP status code if available.
    """


class CacheStorageContentUpdatedEventParams(TypedDict):
    """
    Parameters for the Storage.cacheStorageContentUpdated event.

    All keys are required.
    """

    origin: str  # origin to update
    storageKey: str  # storage key to update
    bucketId: str  # storage bucket to update
    cacheName: str  # name of cache in origin


class CacheStorageListUpdatedEventParams(TypedDict):
    """
    Parameters for the Storage.cacheStorageListUpdated event.

    All keys are required.
    """

    origin: str  # origin to update
    storageKey: str  # storage key to update
    bucketId: str  # storage bucket to update


class IndexedDBContentUpdatedEventParams(TypedDict):
    """
    Parameters for the Storage.indexedDBContentUpdated event.

    All keys are required.
    """

    origin: str  # origin to update
    storageKey: str  # storage key to update
    bucketId: str  # storage bucket to update
    databaseName: str  # database to update
    objectStoreName: str  # object store to update


class IndexedDBListUpdatedEventParams(TypedDict):
    """
    Parameters for the Storage.indexedDBListUpdated event.

    All keys are required.
    """

    origin: str  # origin to update
    storageKey: str  # storage key to update
    bucketId: str  # storage bucket to update


class InterestGroupAccessedEventParams(TypedDict):
    """
    Parameters for the Storage.interestGroupAccessed event.

    Required keys: accessTime, type, ownerOrigin, name.
    Optional keys: componentSellerOrigin, bid, bidCurrency, uniqueAuctionId.
    """

    accessTime: TimeSinceEpoch  # time of the access
    type: InterestGroupAccessType  # type of access
    ownerOrigin: str  # owner origin
    name: str  # name of the interest group
    # For topLevelBid/topLevelAdditionalBid and, when appropriate, win and additionalBidWin.
    componentSellerOrigin: NotRequired[str]
    # For bid-type events, if done locally and not on a server.
    bid: NotRequired[float]
    bidCurrency: NotRequired[str]  # currency of the bid
    # For non-global events; links to the interest group auction event.
    uniqueAuctionId: NotRequired[InterestGroupAuctionId]


class InterestGroupAuctionEventOccurredEventParams(TypedDict):
    """
    Parameters for the Storage.interestGroupAuctionEventOccurred event.

    Required keys: eventTime, type, uniqueAuctionId.
    Optional keys: parentAuctionId, auctionConfig.
    """

    eventTime: TimeSinceEpoch  # time of the event
    type: InterestGroupAuctionEventType  # type of auction event
    uniqueAuctionId: InterestGroupAuctionId  # unique identifier for the auction
    parentAuctionId: NotRequired[InterestGroupAuctionId]  # set for child auctions
    auctionConfig: NotRequired[dict[str, Any]]  # set for started and configResolved


class InterestGroupAuctionNetworkRequestCreatedEventParams(TypedDict):
    """
    Parameters for the Storage.interestGroupAuctionNetworkRequestCreated event.

    All keys are required.
    """

    type: InterestGroupAuctionFetchType  # type of fetch
    requestId: RequestId  # request identifier
    # The auctions using the worklet that issued this request.
    auctions: list[InterestGroupAuctionId]


class SharedStorageAccessedEventParams(TypedDict):
    """
    Parameters for the Storage.sharedStorageAccessed event.

    All keys are required.
    """

    accessTime: TimeSinceEpoch  # time of the access
    scope: SharedStorageAccessScope  # access scope
    method: SharedStorageAccessMethod  # Shared Storage API method invoked
    mainFrameId: FrameId  # frame token for the primary frame tree's root
    ownerOrigin: str  # serialized origin owning the Shared Storage data
    ownerSite: str  # serialized site owning the Shared Storage data
    # Wrapper whose sub-parameters are all optional; which ones are present
    # depends on the kind of access.
    params: SharedStorageAccessParams


class SharedStorageWorkletOperationExecutionFinishedEventParams(TypedDict):
    """
    Parameters for the Storage.sharedStorageWorkletOperationExecutionFinished event.

    All keys are required.
    """

    finishedTime: TimeSinceEpoch  # time that the operation finished
    # Microseconds from the start of the shared storage JS API call until the
    # end of operation execution in the worklet.
    executionTime: int
    method: SharedStorageAccessMethod  # Shared Storage API method invoked
    operationId: str  # ID of the operation call
    workletTargetId: TargetID  # target id of the associated shared storage worklet
    mainFrameId: FrameId  # frame token for the primary frame tree's root
    ownerOrigin: str  # serialized origin owning the Shared Storage data


class StorageBucketCreatedOrUpdatedEventParams(TypedDict):
    """
    Parameters for the Storage.storageBucketCreatedOrUpdated event.

    The single key is required.
    """

    bucketInfo: StorageBucketInfo  # information about the storage bucket


class StorageBucketDeletedEventParams(TypedDict):
    """
    Parameters for the Storage.storageBucketDeleted event.

    The single key is required.
    """

    bucketId: str  # ID of the deleted storage bucket


class AttributionReportingSourceRegisteredEventParams(TypedDict):
    """
    Parameters for the Storage.attributionReportingSourceRegistered event.

    Both keys are required.
    """

    registration: AttributionReportingSourceRegistration  # registration details
    result: AttributionReportingSourceRegistrationResult  # result of the registration


class AttributionReportingTriggerRegisteredEventParams(TypedDict):
    """
    Parameters for the Storage.attributionReportingTriggerRegistered event.

    All keys are required.
    """

    registration: AttributionReportingTriggerRegistration  # registration details
    eventLevel: AttributionReportingEventLevelResult  # event level result
    aggregatable: AttributionReportingAggregatableResult  # aggregatable result


class AttributionReportingReportSentEventParams(TypedDict):
    """
    Parameters for the Storage.attributionReportingReportSent event.

    Required keys: url, body, result.
    Optional keys: netError, netErrorName, httpStatusCode.
    """

    url: str  # URL the report was sent to
    body: dict[str, Any]  # body of the report
    result: AttributionReportingReportResult  # result of the report sending
    # Network outcome details; each may be absent.
    netError: NotRequired[int]
    netErrorName: NotRequired[str]
    httpStatusCode: NotRequired[int]


class AttributionReportingVerboseDebugReportSentEventParams(TypedDict):
    """
    Parameters for the Storage.attributionReportingVerboseDebugReportSent event.

    Required keys: url.
    Optional keys: body, netError, netErrorName, httpStatusCode.
    """

    url: str  # URL the report was sent to
    # Unlike AttributionReportingReportSentEventParams, the body here is
    # optional and is a list of objects rather than a single object.
    body: NotRequired[list[dict[str, Any]]]
    netError: NotRequired[int]
    netErrorName: NotRequired[str]
    httpStatusCode: NotRequired[int]


# Event type aliases: each name subscripts the generic CDPEvent with the
# *EventParams TypedDict of one Storage event. Unlike the params classes,
# these alias names carry no "Event" suffix.
CacheStorageContentUpdated = CDPEvent[CacheStorageContentUpdatedEventParams]
CacheStorageListUpdated = CDPEvent[CacheStorageListUpdatedEventParams]
IndexedDBContentUpdated = CDPEvent[IndexedDBContentUpdatedEventParams]
IndexedDBListUpdated = CDPEvent[IndexedDBListUpdatedEventParams]
InterestGroupAccessed = CDPEvent[InterestGroupAccessedEventParams]
InterestGroupAuctionEventOccurred = CDPEvent[InterestGroupAuctionEventOccurredEventParams]
InterestGroupAuctionNetworkRequestCreated = CDPEvent[
    InterestGroupAuctionNetworkRequestCreatedEventParams
]
SharedStorageAccessed = CDPEvent[SharedStorageAccessedEventParams]
SharedStorageWorkletOperationExecutionFinished = CDPEvent[
    SharedStorageWorkletOperationExecutionFinishedEventParams
]
StorageBucketCreatedOrUpdated = CDPEvent[StorageBucketCreatedOrUpdatedEventParams]
StorageBucketDeleted = CDPEvent[StorageBucketDeletedEventParams]
AttributionReportingSourceRegistered = CDPEvent[AttributionReportingSourceRegisteredEventParams]
AttributionReportingTriggerRegistered = CDPEvent[AttributionReportingTriggerRegisteredEventParams]
AttributionReportingReportSent = CDPEvent[AttributionReportingReportSentEventParams]
AttributionReportingVerboseDebugReportSent = CDPEvent[
    AttributionReportingVerboseDebugReportSentEventParams
]


================================================
FILE: pydoll/protocol/storage/methods.py
================================================
from enum import Enum

from typing_extensions import NotRequired, TypedDict

from pydoll.protocol.base import Command, EmptyParams, EmptyResponse, Response
from pydoll.protocol.browser.types import BrowserContextID
from pydoll.protocol.network.types import Cookie, CookieParam
from pydoll.protocol.page.types import FrameId
from pydoll.protocol.storage.types import (
    RelatedWebsiteSet,
    SerializedStorageKey,
    SharedStorageEntry,
    SharedStorageMetadata,
    StorageBucket,
    TrustTokens,
    UsageForType,
)


class StorageMethod(str, Enum):
    """Storage domain method names.

    Every member's value is the fully-qualified `Storage.<methodName>` string.
    Because the enum also subclasses `str`, members compare equal to those
    plain strings.
    """

    CLEAR_COOKIES = 'Storage.clearCookies'
    CLEAR_DATA_FOR_ORIGIN = 'Storage.clearDataForOrigin'
    CLEAR_DATA_FOR_STORAGE_KEY = 'Storage.clearDataForStorageKey'
    GET_COOKIES = 'Storage.getCookies'
    GET_STORAGE_KEY_FOR_FRAME = 'Storage.getStorageKeyForFrame'
    GET_USAGE_AND_QUOTA = 'Storage.getUsageAndQuota'
    SET_COOKIES = 'Storage.setCookies'
    SET_PROTECTED_AUDIENCE_K_ANONYMITY = 'Storage.setProtectedAudienceKAnonymity'
    TRACK_CACHE_STORAGE_FOR_ORIGIN = 'Storage.trackCacheStorageForOrigin'
    TRACK_CACHE_STORAGE_FOR_STORAGE_KEY = 'Storage.trackCacheStorageForStorageKey'
    TRACK_INDEXED_DB_FOR_ORIGIN = 'Storage.trackIndexedDBForOrigin'
    TRACK_INDEXED_DB_FOR_STORAGE_KEY = 'Storage.trackIndexedDBForStorageKey'
    UNTRACK_CACHE_STORAGE_FOR_ORIGIN = 'Storage.untrackCacheStorageForOrigin'
    UNTRACK_CACHE_STORAGE_FOR_STORAGE_KEY = 'Storage.untrackCacheStorageForStorageKey'
    UNTRACK_INDEXED_DB_FOR_ORIGIN = 'Storage.untrackIndexedDBForOrigin'
    UNTRACK_INDEXED_DB_FOR_STORAGE_KEY = 'Storage.untrackIndexedDBForStorageKey'
    CLEAR_SHARED_STORAGE_ENTRIES = 'Storage.clearSharedStorageEntries'
    CLEAR_TRUST_TOKENS = 'Storage.clearTrustTokens'
    DELETE_SHARED_STORAGE_ENTRY = 'Storage.deleteSharedStorageEntry'
    DELETE_STORAGE_BUCKET = 'Storage.deleteStorageBucket'
    # Parenthesised only to keep the line within the length limit.
    GET_AFFECTED_URLS_FOR_THIRD_PARTY_COOKIE_METADATA = (
        'Storage.getAffectedUrlsForThirdPartyCookieMetadata'
    )
    GET_INTEREST_GROUP_DETAILS = 'Storage.getInterestGroupDetails'
    GET_RELATED_WEBSITE_SETS = 'Storage.getRelatedWebsiteSets'
    GET_SHARED_STORAGE_ENTRIES = 'Storage.getSharedStorageEntries'
    GET_SHARED_STORAGE_METADATA = 'Storage.getSharedStorageMetadata'
    GET_TRUST_TOKENS = 'Storage.getTrustTokens'
    OVERRIDE_QUOTA_FOR_ORIGIN = 'Storage.overrideQuotaForOrigin'
    RESET_SHARED_STORAGE_BUDGET = 'Storage.resetSharedStorageBudget'
    RUN_BOUNCE_TRACKING_MITIGATIONS = 'Storage.runBounceTrackingMitigations'
    SEND_PENDING_ATTRIBUTION_REPORTS = 'Storage.sendPendingAttributionReports'
    SET_ATTRIBUTION_REPORTING_LOCAL_TESTING_MODE = 'Storage.setAttributionReportingLocalTestingMode'
    SET_ATTRIBUTION_REPORTING_TRACKING = 'Storage.setAttributionReportingTracking'
    SET_INTEREST_GROUP_AUCTION_TRACKING = 'Storage.setInterestGroupAuctionTracking'
    SET_INTEREST_GROUP_TRACKING = 'Storage.setInterestGroupTracking'
    SET_SHARED_STORAGE_ENTRY = 'Storage.setSharedStorageEntry'
    SET_SHARED_STORAGE_TRACKING = 'Storage.setSharedStorageTracking'
    SET_STORAGE_BUCKET_TRACKING = 'Storage.setStorageBucketTracking'


class GetStorageKeyForFrameParams(TypedDict):
    """Parameters for `GetStorageKeyForFrameCommand`."""

    # Required; typed with the page domain's `FrameId`.
    frameId: FrameId


class GetStorageKeyForFrameResult(TypedDict):
    """Result payload wrapped by `GetStorageKeyForFrameResponse`."""

    # Always present; uses the `SerializedStorageKey` type from the storage types module.
    storageKey: SerializedStorageKey


class ClearDataForOriginParams(TypedDict):
    """Parameters for `ClearDataForOriginCommand`; both keys are required."""

    origin: str
    # Typed as a plain string, not as an enum.
    # NOTE(review): presumably a comma-separated list of storage type names — confirm
    # against the CDP Storage specification.
    storageTypes: str


class ClearDataForStorageKeyParams(TypedDict):
    """Parameters for `ClearDataForStorageKeyCommand`; both keys are required."""

    storageKey: str
    # Typed as a plain string, not as an enum.
    # NOTE(review): presumably a comma-separated list of storage type names — confirm
    # against the CDP Storage specification.
    storageTypes: str


class GetCookiesParams(TypedDict):
    """Parameters for `GetCookiesCommand`; an empty dict is a valid payload."""

    # Optional: may be omitted entirely.
    browserContextId: NotRequired[BrowserContextID]


class GetCookiesResult(TypedDict):
    """Result payload wrapped by `GetCookiesResponse`."""

    # Entries use the network domain's `Cookie` type.
    cookies: list[Cookie]


class SetCookiesParams(TypedDict):
    """Parameters for `SetCookiesCommand`."""

    # Required; entries use the network domain's `CookieParam` type.
    cookies: list[CookieParam]
    # Optional: may be omitted entirely.
    browserContextId: NotRequired[BrowserContextID]


class ClearCookiesParams(TypedDict):
    """Parameters for `ClearCookiesCommand`; an empty dict is a valid payload."""

    # Optional: may be omitted entirely.
    browserContextId: NotRequired[BrowserContextID]


class GetUsageAndQuotaParams(TypedDict):
    """Parameters for `GetUsageAndQuotaCommand`; `origin` is required."""

    origin: str


class GetUsageAndQuotaResult(TypedDict):
    """Result payload wrapped by `GetUsageAndQuotaResponse`; all keys are present."""

    usage: float
    quota: float
    overrideActive: bool
    # One `UsageForType` entry (storage type + usage figure) per list element.
    usageBreakdown: list[UsageForType]


class OverrideQuotaForOriginParams(TypedDict):
    """Parameters for `OverrideQuotaForOriginCommand`."""

    origin: str
    # Optional: may be omitted entirely.
    # NOTE(review): presumably omitting it clears a previous override — confirm
    # against the CDP Storage specification.
    quotaSize: NotRequired[float]


class TrackCacheStorageForOriginParams(TypedDict):
    """Parameters for `TrackCacheStorageForOriginCommand`; `origin` is required."""

    origin: str


class TrackCacheStorageForStorageKeyParams(TypedDict):
    """Parameters for `TrackCacheStorageForStorageKeyCommand`; `storageKey` is required."""

    storageKey: str


class TrackIndexedDBForOriginParams(TypedDict):
    """Parameters for `TrackIndexedDBForOriginCommand`; `origin` is required."""

    origin: str


class TrackIndexedDBForStorageKeyParams(TypedDict):
    """Parameters for `TrackIndexedDBForStorageKeyCommand`; `storageKey` is required."""

    storageKey: str


class UntrackCacheStorageForOriginParams(TypedDict):
    """Parameters for `UntrackCacheStorageForOriginCommand`; `origin` is required."""

    origin: str


class UntrackCacheStorageForStorageKeyParams(TypedDict):
    """Parameters for `UntrackCacheStorageForStorageKeyCommand`; `storageKey` is required."""

    storageKey: str


class UntrackIndexedDBForOriginParams(TypedDict):
    """Parameters for `UntrackIndexedDBForOriginCommand`; `origin` is required."""

    origin: str


class UntrackIndexedDBForStorageKeyParams(TypedDict):
    """Parameters for `UntrackIndexedDBForStorageKeyCommand`; `storageKey` is required."""

    storageKey: str


class GetTrustTokensResult(TypedDict):
    """Result payload wrapped by `GetTrustTokensResponse`."""

    # Each `TrustTokens` entry pairs an issuer origin with a token count.
    tokens: list[TrustTokens]


class ClearTrustTokensParams(TypedDict):
    """Parameters for `ClearTrustTokensCommand`; `issuerOrigin` is required."""

    issuerOrigin: str


class ClearTrustTokensResult(TypedDict):
    """Result payload shape for the clear-trust-tokens command."""

    # NOTE(review): presumably True when at least one token was removed — confirm
    # against the CDP Storage specification.
    didDeleteTokens: bool


class GetInterestGroupDetailsParams(TypedDict):
    """Parameters for `GetInterestGroupDetailsCommand`; both keys are required."""

    ownerOrigin: str
    name: str


class GetInterestGroupDetailsResult(TypedDict):
    """Result payload wrapped by `GetInterestGroupDetailsResponse`."""

    # Deliberately untyped mapping: no key/value schema is declared for it here.
    details: dict


class SetInterestGroupTrackingParams(TypedDict):
    """Parameters for `SetInterestGroupTrackingCommand`; `enable` is required."""

    enable: bool


class SetInterestGroupAuctionTrackingParams(TypedDict):
    """Parameters for `SetInterestGroupAuctionTrackingCommand`; `enable` is required."""

    enable: bool


class GetSharedStorageMetadataParams(TypedDict):
    """Parameters for `GetSharedStorageMetadataCommand`; `ownerOrigin` is required."""

    ownerOrigin: str


class GetSharedStorageMetadataResult(TypedDict):
    """Result payload wrapped by `GetSharedStorageMetadataResponse`."""

    # See `SharedStorageMetadata` for the nested keys.
    metadata: SharedStorageMetadata


class GetSharedStorageEntriesParams(TypedDict):
    """Parameters for `GetSharedStorageEntriesCommand`; `ownerOrigin` is required."""

    ownerOrigin: str


class GetSharedStorageEntriesResult(TypedDict):
    """Result payload wrapped by `GetSharedStorageEntriesResponse`."""

    # Each `SharedStorageEntry` is one key/value pair.
    entries: list[SharedStorageEntry]


class SetSharedStorageEntryParams(TypedDict):
    """Parameters for `SetSharedStorageEntryCommand`."""

    ownerOrigin: str
    key: str
    value: str
    # Optional: may be omitted entirely.
    # NOTE(review): presumably, when true, an existing key is left untouched —
    # confirm against the CDP Storage specification.
    ignoreIfPresent: NotRequired[bool]


class DeleteSharedStorageEntryParams(TypedDict):
    """Parameters for `DeleteSharedStorageEntryCommand`; both keys are required."""

    ownerOrigin: str
    key: str


class ClearSharedStorageEntriesParams(TypedDict):
    """Parameters for `ClearSharedStorageEntriesCommand`; `ownerOrigin` is required."""

    ownerOrigin: str


class ResetSharedStorageBudgetParams(TypedDict):
    """Parameters for `ResetSharedStorageBudgetCommand`; `ownerOrigin` is required."""

    ownerOrigin: str


class SetSharedStorageTrackingParams(TypedDict):
    """Parameters for `SetSharedStorageTrackingCommand`; `enable` is required."""

    enable: bool


class SetStorageBucketTrackingParams(TypedDict):
    """Parameters for `SetStorageBucketTrackingCommand`; both keys are required."""

    storageKey: str
    enable: bool


class DeleteStorageBucketParams(TypedDict):
    """Parameters for `DeleteStorageBucketCommand`."""

    # Required; a `StorageBucket` carries a storage key and an optional name.
    bucket: StorageBucket


class RunBounceTrackingMitigationsResult(TypedDict):
    """Result payload wrapped by `RunBounceTrackingMitigationsResponse`."""

    deletedSites: list[str]


class SetAttributionReportingLocalTestingModeParams(TypedDict):
    """Parameters for `SetAttributionReportingLocalTestingModeCommand`."""

    # Note the key is `enabled`, whereas the tracking toggles in this module use `enable`.
    enabled: bool


class SetAttributionReportingTrackingParams(TypedDict):
    """Parameters for `SetAttributionReportingTrackingCommand`; `enable` is required."""

    enable: bool


class SendPendingAttributionReportsResult(TypedDict):
    """Result payload wrapped by `SendPendingAttributionReportsResponse`."""

    numSent: int


class GetRelatedWebsiteSetsResult(TypedDict):
    """Result payload wrapped by `GetRelatedWebsiteSetsResponse`."""

    # Each `RelatedWebsiteSet` lists primary, associated and service sites.
    sets: list[RelatedWebsiteSet]


class GetAffectedUrlsForThirdPartyCookieMetadataParams(TypedDict):
    """Parameters for `GetAffectedUrlsForThirdPartyCookieMetadataCommand`.

    Both keys are required.
    """

    firstPartyUrl: str
    thirdPartyUrls: list[str]


class GetAffectedUrlsForThirdPartyCookieMetadataResult(TypedDict):
    """Result payload wrapped by `GetAffectedUrlsForThirdPartyCookieMetadataResponse`."""

    matchedUrls: list[str]


class SetProtectedAudienceKAnonymityParams(TypedDict):
    """Parameters for `SetProtectedAudienceKAnonymityCommand`; all keys are required."""

    owner: str
    name: str
    hashes: list[str]


# Response aliases: one per command that returns a non-empty result payload.
GetStorageKeyForFrameResponse = Response[GetStorageKeyForFrameResult]
GetCookiesResponse = Response[GetCookiesResult]
GetUsageAndQuotaResponse = Response[GetUsageAndQuotaResult]
GetTrustTokensResponse = Response[GetTrustTokensResult]
# clearTrustTokens reports `didDeleteTokens`, so it needs a typed response as well.
ClearTrustTokensResponse = Response[ClearTrustTokensResult]
GetInterestGroupDetailsResponse = Response[GetInterestGroupDetailsResult]
GetSharedStorageMetadataResponse = Response[GetSharedStorageMetadataResult]
GetSharedStorageEntriesResponse = Response[GetSharedStorageEntriesResult]
RunBounceTrackingMitigationsResponse = Response[RunBounceTrackingMitigationsResult]
SendPendingAttributionReportsResponse = Response[SendPendingAttributionReportsResult]
GetRelatedWebsiteSetsResponse = Response[GetRelatedWebsiteSetsResult]
GetAffectedUrlsForThirdPartyCookieMetadataResponse = Response[
    GetAffectedUrlsForThirdPartyCookieMetadataResult
]


# Command aliases: `Command[<params type>, <response type>]`. Commands without a
# result payload use `Response[EmptyResponse]`; commands without parameters use
# `EmptyParams`.
GetStorageKeyForFrameCommand = Command[GetStorageKeyForFrameParams, GetStorageKeyForFrameResponse]
ClearDataForOriginCommand = Command[ClearDataForOriginParams, Response[EmptyResponse]]
ClearDataForStorageKeyCommand = Command[ClearDataForStorageKeyParams, Response[EmptyResponse]]
GetCookiesCommand = Command[GetCookiesParams, GetCookiesResponse]
SetCookiesCommand = Command[SetCookiesParams, Response[EmptyResponse]]
ClearCookiesCommand = Command[ClearCookiesParams, Response[EmptyResponse]]
GetUsageAndQuotaCommand = Command[GetUsageAndQuotaParams, GetUsageAndQuotaResponse]
OverrideQuotaForOriginCommand = Command[OverrideQuotaForOriginParams, Response[EmptyResponse]]
TrackCacheStorageForOriginCommand = Command[
    TrackCacheStorageForOriginParams, Response[EmptyResponse]
]
TrackCacheStorageForStorageKeyCommand = Command[
    TrackCacheStorageForStorageKeyParams, Response[EmptyResponse]
]
TrackIndexedDBForOriginCommand = Command[TrackIndexedDBForOriginParams, Response[EmptyResponse]]
TrackIndexedDBForStorageKeyCommand = Command[
    TrackIndexedDBForStorageKeyParams, Response[EmptyResponse]
]
UntrackCacheStorageForOriginCommand = Command[
    UntrackCacheStorageForOriginParams, Response[EmptyResponse]
]
UntrackCacheStorageForStorageKeyCommand = Command[
    UntrackCacheStorageForStorageKeyParams, Response[EmptyResponse]
]
UntrackIndexedDBForOriginCommand = Command[UntrackIndexedDBForOriginParams, Response[EmptyResponse]]
UntrackIndexedDBForStorageKeyCommand = Command[
    UntrackIndexedDBForStorageKeyParams, Response[EmptyResponse]
]
GetTrustTokensCommand = Command[EmptyParams, GetTrustTokensResponse]
# Previously typed as an empty response, which hid the `didDeleteTokens` result.
ClearTrustTokensCommand = Command[ClearTrustTokensParams, ClearTrustTokensResponse]
GetInterestGroupDetailsCommand = Command[
    GetInterestGroupDetailsParams, GetInterestGroupDetailsResponse
]
SetInterestGroupTrackingCommand = Command[SetInterestGroupTrackingParams, Response[EmptyResponse]]
SetInterestGroupAuctionTrackingCommand = Command[
    SetInterestGroupAuctionTrackingParams, Response[EmptyResponse]
]
GetSharedStorageMetadataCommand = Command[
    GetSharedStorageMetadataParams, GetSharedStorageMetadataResponse
]
GetSharedStorageEntriesCommand = Command[
    GetSharedStorageEntriesParams, GetSharedStorageEntriesResponse
]
SetSharedStorageEntryCommand = Command[SetSharedStorageEntryParams, Response[EmptyResponse]]
DeleteSharedStorageEntryCommand = Command[DeleteSharedStorageEntryParams, Response[EmptyResponse]]
ClearSharedStorageEntriesCommand = Command[ClearSharedStorageEntriesParams, Response[EmptyResponse]]
ResetSharedStorageBudgetCommand = Command[ResetSharedStorageBudgetParams, Response[EmptyResponse]]
SetSharedStorageTrackingCommand = Command[SetSharedStorageTrackingParams, Response[EmptyResponse]]
SetStorageBucketTrackingCommand = Command[SetStorageBucketTrackingParams, Response[EmptyResponse]]
DeleteStorageBucketCommand = Command[DeleteStorageBucketParams, Response[EmptyResponse]]
RunBounceTrackingMitigationsCommand = Command[EmptyParams, RunBounceTrackingMitigationsResponse]
SetAttributionReportingLocalTestingModeCommand = Command[
    SetAttributionReportingLocalTestingModeParams, Response[EmptyResponse]
]
SetAttributionReportingTrackingCommand = Command[
    SetAttributionReportingTrackingParams, Response[EmptyResponse]
]
SendPendingAttributionReportsCommand = Command[EmptyParams, SendPendingAttributionReportsResponse]
GetRelatedWebsiteSetsCommand = Command[EmptyParams, GetRelatedWebsiteSetsResponse]
GetAffectedUrlsForThirdPartyCookieMetadataCommand = Command[
    GetAffectedUrlsForThirdPartyCookieMetadataParams,
    GetAffectedUrlsForThirdPartyCookieMetadataResponse,
]
SetProtectedAudienceKAnonymityCommand = Command[
    SetProtectedAudienceKAnonymityParams, Response[EmptyResponse]
]


================================================
FILE: pydoll/protocol/storage/types.py
================================================
from enum import Enum

from typing_extensions import NotRequired, TypedDict

from pydoll.protocol.network.types import TimeSinceEpoch
from pydoll.protocol.target.types import TargetID

# Plain `str` aliases: they make annotations self-describing but add no runtime
# distinction from `str`.
SerializedStorageKey = str
InterestGroupAuctionId = str


class StorageType(str, Enum):
    """Enum of storage type identifiers; used as the `storageType` of `UsageForType`.

    Members also subclass `str`, so they compare equal to their wire values.
    """

    COOKIES = 'cookies'
    FILE_SYSTEMS = 'file_systems'
    INDEXEDDB = 'indexeddb'
    LOCAL_STORAGE = 'local_storage'
    SHADER_CACHE = 'shader_cache'
    WEBSQL = 'websql'
    SERVICE_WORKERS = 'service_workers'
    CACHE_STORAGE = 'cache_storage'
    INTEREST_GROUPS = 'interest_groups'
    SHARED_STORAGE = 'shared_storage'
    STORAGE_BUCKETS = 'storage_buckets'
    ALL = 'all'
    OTHER = 'other'


class UsageForType(TypedDict):
    """Usage for a storage type; both keys are required."""

    storageType: StorageType
    # NOTE(review): unit is not stated here — presumably bytes; confirm against the CDP spec.
    usage: float


class TrustTokens(TypedDict):
    """Pair of issuer origin and number of available (signed, but not used) Trust
    Tokens from that issuer."""

    issuerOrigin: str
    # Declared as `float` even though it is a count.
    count: float


class InterestGroupAccessType(str, Enum):
    """Enum of interest group access types.

    Members also subclass `str`, so they compare equal to their wire values.
    """

    JOIN = 'join'
    LEAVE = 'leave'
    UPDATE = 'update'
    LOADED = 'loaded'
    BID = 'bid'
    WIN = 'win'
    ADDITIONAL_BID = 'additionalBid'
    ADDITIONAL_BID_WIN = 'additionalBidWin'
    TOP_LEVEL_BID = 'topLevelBid'
    TOP_LEVEL_ADDITIONAL_BID = 'topLevelAdditionalBid'
    CLEAR = 'clear'


class InterestGroupAuctionEventType(str, Enum):
    """Enum of auction events.

    Members also subclass `str`, so they compare equal to their wire values.
    """

    STARTED = 'started'
    CONFIG_RESOLVED = 'configResolved'


class InterestGroupAuctionFetchType(str, Enum):
    """Enum of network fetches auctions can do.

    Members also subclass `str`, so they compare equal to their wire values.
    """

    BIDDER_JS = 'bidderJs'
    BIDDER_WASM = 'bidderWasm'
    SELLER_JS = 'sellerJs'
    BIDDER_TRUSTED_SIGNALS = 'bidderTrustedSignals'
    SELLER_TRUSTED_SIGNALS = 'sellerTrustedSignals'


class SharedStorageAccessScope(str, Enum):
    """Enum of shared storage access scopes.

    Members also subclass `str`, so they compare equal to their wire values.
    """

    WINDOW = 'window'
    SHARED_STORAGE_WORKLET = 'sharedStorageWorklet'
    PROTECTED_AUDIENCE_WORKLET = 'protectedAudienceWorklet'
    HEADER = 'header'


class SharedStorageAccessMethod(str, Enum):
    """Enum of shared storage access methods.

    Members also subclass `str`, so they compare equal to their wire values.
    """

    ADD_MODULE = 'addModule'
    CREATE_WORKLET = 'createWorklet'
    # Note the capitalised `URL` in the wire value.
    SELECT_URL = 'selectURL'
    RUN = 'run'
    BATCH_UPDATE = 'batchUpdate'
    SET = 'set'
    APPEND = 'append'
    DELETE = 'delete'
    CLEAR = 'clear'
    GET = 'get'
    KEYS = 'keys'
    VALUES = 'values'
    ENTRIES = 'entries'
    LENGTH = 'length'
    REMAINING_BUDGET = 'remainingBudget'


class SharedStorageEntry(TypedDict):
    """Struct for a single key-value pair in an origin's shared storage.

    Both keys are required strings.
    """

    key: str
    value: str


class SharedStorageMetadata(TypedDict):
    """Details for an origin's shared storage; all keys are required."""

    # Uses the network domain's `TimeSinceEpoch` type.
    creationTime: TimeSinceEpoch
    length: int
    remainingBudget: float
    bytesUsed: int


class SharedStoragePrivateAggregationConfig(TypedDict):
    """Represents a dictionary object passed in as privateAggregationConfig to
    run or selectURL."""

    # The only required key.
    filteringIdMaxBytes: int
    # The remaining keys are optional and may be omitted.
    aggregationCoordinatorOrigin: NotRequired[str]
    contextId: NotRequired[str]
    maxContributions: NotRequired[int]


class SharedStorageReportingMetadata(TypedDict):
    """Pair of reporting metadata details for a candidate URL for `selectURL()`.

    Both keys are required strings.
    """

    eventType: str
    reportingUrl: str


class SharedStorageUrlWithMetadata(TypedDict):
    """Bundles a candidate URL with its reporting metadata."""

    url: str
    # Required, but may hold any number of `SharedStorageReportingMetadata` entries.
    reportingMetadata: list[SharedStorageReportingMetadata]


class SharedStorageAccessParams(TypedDict, total=False):
    """Bundles the parameters for shared storage access events whose
    presence/absence can vary according to SharedStorageAccessType.

    Declared with `total=False`, so every key below is optional.

    NOTE(review): no `SharedStorageAccessType` is defined in this module;
    presumably the text refers to `SharedStorageAccessMethod` — confirm.
    """

    scriptSourceUrl: str
    dataOrigin: str
    operationName: str
    operationId: str
    keepAlive: bool
    privateAggregationConfig: SharedStoragePrivateAggregationConfig
    serializedData: str
    urlsWithMetadata: list[SharedStorageUrlWithMetadata]
    urnUuid: str
    key: str
    value: str
    ignoreIfPresent: bool
    workletOrdinal: int
    # Uses the target domain's `TargetID` type.
    workletTargetId: TargetID
    withLock: str
    batchUpdateId: str
    batchSize: int


class StorageBucketsDurability(str, Enum):
    """Enum of durability values; used as the `durability` of `StorageBucketInfo`.

    Members also subclass `str`, so they compare equal to their wire values.
    """

    RELAXED = 'relaxed'
    STRICT = 'strict'


class StorageBucket(TypedDict):
    """Identifies a storage bucket by storage key and, optionally, a name."""

    storageKey: SerializedStorageKey
    # Optional: may be omitted entirely.
    # NOTE(review): presumably an absent name denotes the default bucket — confirm
    # against the CDP Storage specification.
    name: NotRequired[str]


class StorageBucketInfo(TypedDict):
    """Descriptive record for a storage bucket; all keys are required."""

    bucket: StorageBucket
    id: str
    # Uses the network domain's `TimeSinceEpoch` type.
    expiration: TimeSinceEpoch
    quota: float
    persistent: bool
    durability: StorageBucketsDurability


class AttributionReportingSourceType(str, Enum):
    """Enum of source types; used as the `type` of `AttributionReportingSourceRegistration`.

    Members also subclass `str`, so they compare equal to their wire values.
    """

    NAVIGATION = 'navigation'
    EVENT = 'event'


# Plain `str` aliases. As the names indicate, they mark fields that carry
# integers serialised as text (base 10 or base 16) rather than as JSON numbers.
UnsignedInt64AsBase10 = str
UnsignedInt128AsBase16 = str
SignedInt64AsBase10 = str


class AttributionReportingFilterDataEntry(TypedDict):
    """One filter entry: a key paired with a list of string values."""

    key: str
    values: list[str]


class AttributionReportingFilterConfig(TypedDict):
    """A set of filter entries with an optional lookback window."""

    filterValues: list[AttributionReportingFilterDataEntry]
    # Optional: may be omitted entirely.
    # NOTE(review): unit not stated here — presumably seconds; confirm against the CDP spec.
    lookbackWindow: NotRequired[int]


class AttributionReportingFilterPair(TypedDict):
    """Pairs positive (`filters`) and negated (`notFilters`) filter configs.

    Both keys are required.
    """

    filters: list[AttributionReportingFilterConfig]
    notFilters: list[AttributionReportingFilterConfig]


class AttributionReportingAggregationKeysEntry(TypedDict):
    """One aggregation key: a name paired with a 128-bit value encoded as text."""

    key: str
    # `UnsignedInt128AsBase16` is an alias of `str`.
    value: UnsignedInt128AsBase16


class AttributionReportingEventReportWindows(TypedDict):
    """Event report windows: one start value and a list of end values."""

    # NOTE(review): units not stated here — presumably seconds; confirm against the CDP spec.
    start: int
    ends: list[int]


class AttributionReportingTriggerDataMatching(str, Enum):
    """Enum of matching modes; used as `triggerDataMatching` of a source registration.

    Members also subclass `str`, so they compare equal to their wire values.
    """

    EXACT = 'exact'
    MODULUS = 'modulus'


class AttributionReportingAggregatableDebugReportingData(TypedDict):
    """One aggregatable debug reporting entry; all keys are required."""

    # `UnsignedInt128AsBase16` is an alias of `str`.
    keyPiece: UnsignedInt128AsBase16
    value: float
    types: list[str]


class AttributionReportingAggregatableDebugReportingConfig(TypedDict):
    """Aggregatable debug reporting configuration."""

    # Required keys.
    keyPiece: UnsignedInt128AsBase16
    debugData: list[AttributionReportingAggregatableDebugReportingData]
    # Optional keys: may be omitted entirely.
    budget: NotRequired[float]
    aggregationCoordinatorOrigin: NotRequired[str]


class AttributionScopesData(TypedDict):
    """Attribution scopes data; all keys are required.

    Used as the optional `scopesData` of `AttributionReportingSourceRegistration`.
    """

    values: list[str]
    limit: float
    maxEventStates: float


class AttributionReportingNamedBudgetDef(TypedDict):
    """A named budget definition: a name paired with an integer budget."""

    name: str
    budget: int


class AttributionReportingSourceRegistration(TypedDict):
    """Attribution source registration record.

    Every key is required except `debugKey` and `scopesData`.
    """

    time: TimeSinceEpoch
    # NOTE(review): unit not stated here — presumably seconds; confirm against the CDP spec.
    expiry: int
    triggerData: list[float]
    eventReportWindows: AttributionReportingEventReportWindows
    aggregatableReportWindow: int
    type: AttributionReportingSourceType
    sourceOrigin: str
    reportingOrigin: str
    destinationSites: list[str]
    # The `...AsBase10` types are `str` aliases, so these are strings.
    eventId: UnsignedInt64AsBase10
    priority: SignedInt64AsBase10
    filterData: list[AttributionReportingFilterDataEntry]
    aggregationKeys: list[AttributionReportingAggregationKeysEntry]
    triggerDataMatching: AttributionReportingTriggerDataMatching
    destinationLimitPriority: SignedInt64AsBase10
    aggregatableDebugReportingConfig: AttributionReportingAggregatableDebugReportingConfig
    maxEventLevelReports: int
    namedBudgets: list[AttributionReportingNamedBudgetDef]
    debugReporting: bool
    eventLevelEpsilon: float
    # Optional keys: may be omitted entirely.
    debugKey: NotRequired[UnsignedInt64AsBase10]
    scopesData: NotRequired[AttributionScopesData]


class AttributionReportingSourceRegistrationResult(str, Enum):
    """Enum of outcomes for an attribution source registration.

    Members also subclass `str`, so they compare equal to their wire values.
    """

    SUCCESS = 'success'
    INTERNAL_ERROR = 'internalError'
    INSUFFICIENT_SOURCE_CAPACITY = 'insufficientSourceCapacity'
    INSUFFICIENT_UNIQUE_DESTINATION_CAPACITY = 'insufficientUniqueDestinationCapacity'
    EXCESSIVE_REPORTING_ORIGINS = 'excessiveReportingOrigins'
    PROHIBITED_BY_BROWSER_POLICY = 'prohibitedByBrowserPolicy'
    SUCCESS_NOISED = 'successNoised'
    DESTINATION_REPORTING_LIMIT_REACHED = 'destinationReportingLimitReached'
    DESTINATION_GLOBAL_LIMIT_REACHED = 'destinationGlobalLimitReached'
    DESTINATION_BOTH_LIMITS_REACHED = 'destinationBothLimitsReached'
    REPORTING_ORIGINS_PER_SITE_LIMIT_REACHED = 'reportingOriginsPerSiteLimitReached'
    EXCEEDS_MAX_CHANNEL_CAPACITY = 'exceedsMaxChannelCapacity'
    EXCEEDS_MAX_SCOPES_CHANNEL_CAPACITY = 'exceedsMaxScopesChannelCapacity'
    EXCEEDS_MAX_TRIGGER_STATE_CARDINALITY = 'exceedsMaxTriggerStateCardinality'
    EXCEEDS_MAX_EVENT_STATES_LIMIT = 'exceedsMaxEventStatesLimit'
    DESTINATION_PER_DAY_REPORTING_LIMIT_REACHED = 'destinationPerDayReportingLimitReached'


class AttributionReportingSourceRegistrationTimeConfig(str, Enum):
    """Enum used as `sourceRegistrationTimeConfig` of a trigger registration.

    Members also subclass `str`, so they compare equal to their wire values.
    """

    INCLUDE = 'include'
    EXCLUDE = 'exclude'


class AttributionReportingAggregatableValueDictEntry(TypedDict):
    """One aggregatable value: key, numeric value and filtering id (all required)."""

    key: str
    value: float
    # `UnsignedInt64AsBase10` is an alias of `str`.
    filteringId: UnsignedInt64AsBase10


class AttributionReportingAggregatableValueEntry(TypedDict):
    """A list of aggregatable values together with the filter pair attached to them."""

    values: list[AttributionReportingAggregatableValueDictEntry]
    filters: AttributionReportingFilterPair


class AttributionReportingEventTriggerData(TypedDict):
    """Event-level trigger data; only `dedupKey` is optional."""

    # The `...AsBase10` types are `str` aliases, so these are strings.
    data: UnsignedInt64AsBase10
    priority: SignedInt64AsBase10
    filters: AttributionReportingFilterPair
    # Optional: may be omitted entirely.
    dedupKey: NotRequired[UnsignedInt64AsBase10]


class AttributionReportingAggregatableTriggerData(TypedDict):
    """Aggregatable trigger data; all keys are required."""

    # `UnsignedInt128AsBase16` is an alias of `str`.
    keyPiece: UnsignedInt128AsBase16
    sourceKeys: list[str]
    filters: AttributionReportingFilterPair


class AttributionReportingAggregatableDedupKey(TypedDict):
    """A filter pair with an optional deduplication key."""

    filters: AttributionReportingFilterPair
    # Optional: may be omitted entirely.
    dedupKey: NotRequired[UnsignedInt64AsBase10]


class AttributionReportingNamedBudgetCandidate(TypedDict):
    """A filter pair with an optional budget name."""

    filters: AttributionReportingFilterPair
    # Optional: may be omitted entirely.
    name: NotRequired[str]


class AttributionReportingTriggerRegistration(TypedDict):
    """Attribution trigger registration record.

    Every key is required except `debugKey`, `aggregationCoordinatorOrigin`
    and `triggerContextId`.
    """

    filters: AttributionReportingFilterPair
    aggregatableDedupKeys: list[AttributionReportingAggregatableDedupKey]
    eventTriggerData: list[AttributionReportingEventTriggerData]
    aggregatableTriggerData: list[AttributionReportingAggregatableTriggerData]
    aggregatableValues: list[AttributionReportingAggregatableValueEntry]
    aggregatableFilteringIdMaxBytes: int
    debugReporting: bool
    sourceRegistrationTimeConfig: AttributionReportingSourceRegistrationTimeConfig
    aggregatableDebugReportingConfig: AttributionReportingAggregatableDebugReportingConfig
    scopes: list[str]
    namedBudgets: list[AttributionReportingNamedBudgetCandidate]
    # Optional keys: may be omitted entirely.
    debugKey: NotRequired[UnsignedInt64AsBase10]
    aggregationCoordinatorOrigin: NotRequired[str]
    triggerContextId: NotRequired[str]


class AttributionReportingEventLevelResult(str, Enum):
    """Enum of event-level attribution outcomes.

    Members also subclass `str`, so they compare equal to their wire values.
    """

    SUCCESS = 'success'
    SUCCESS_DROPPED_LOWER_PRIORITY = 'successDroppedLowerPriority'
    INTERNAL_ERROR = 'internalError'
    NO_CAPACITY_FOR_ATTRIBUTION_DESTINATION = 'noCapacityForAttributionDestination'
    NO_MATCHING_SOURCES = 'noMatchingSources'
    DEDUPLICATED = 'deduplicated'
    EXCESSIVE_ATTRIBUTIONS = 'excessiveAttributions'
    PRIORITY_TOO_LOW = 'priorityTooLow'
    NEVER_ATTRIBUTED_SOURCE = 'neverAttributedSource'
    EXCESSIVE_REPORTING_ORIGINS = 'excessiveReportingOrigins'
    NO_MATCHING_SOURCE_FILTER_DATA = 'noMatchingSourceFilterData'
    PROHIBITED_BY_BROWSER_POLICY = 'prohibitedByBrowserPolicy'
    NO_MATCHING_CONFIGURATIONS = 'noMatchingConfigurations'
    EXCESSIVE_REPORTS = 'excessiveReports'
    FALSELY_ATTRIBUTED_SOURCE = 'falselyAttributedSource'
    REPORT_WINDOW_PASSED = 'reportWindowPassed'
    NOT_REGISTERED = 'notRegistered'
    REPORT_WINDOW_NOT_STARTED = 'reportWindowNotStarted'
    NO_MATCHING_TRIGGER_DATA = 'noMatchingTriggerData'


class AttributionReportingAggregatableResult(str, Enum):
    """Enum of aggregatable attribution outcomes.

    Members also subclass `str`, so they compare equal to their wire values.
    """

    SUCCESS = 'success'
    INTERNAL_ERROR = 'internalError'
    NO_CAPACITY_FOR_ATTRIBUTION_DESTINATION = 'noCapacityForAttributionDestination'
    NO_MATCHING_SOURCES = 'noMatchingSources'
    EXCESSIVE_ATTRIBUTIONS = 'excessiveAttributions'
    EXCESSIVE_REPORTING_ORIGINS = 'excessiveReportingOrigins'
    NO_HISTOGRAMS = 'noHistograms'
    INSUFFICIENT_BUDGET = 'insufficientBudget'
    INSUFFICIENT_NAMED_BUDGET = 'insufficientNamedBudget'
    NO_MATCHING_SOURCE_FILTER_DATA = 'noMatchingSourceFilterData'
    NOT_REGISTERED = 'notRegistered'
    PROHIBITED_BY_BROWSER_POLICY = 'prohibitedByBrowserPolicy'
    DEDUPLICATED = 'deduplicated'
    REPORT_WINDOW_PASSED = 'reportWindowPassed'
    EXCESSIVE_REPORTS = 'excessiveReports'


class AttributionReportingReportResult(str, Enum):
    """Enum of outcomes for an attribution report.

    Members also subclass `str`, so they compare equal to their wire values.
    """

    SENT = 'sent'
    PROHIBITED = 'prohibited'
    FAILED_TO_ASSEMBLE = 'failedToAssemble'
    EXPIRED = 'expired'


class RelatedWebsiteSet(TypedDict):
    """A related website set: three required lists of site strings."""

    primarySites: list[str]
    associatedSites: list[str]
    serviceSites: list[str]


================================================
FILE: pydoll/protocol/target/__init__.py
================================================
"""Target domain implementation."""


================================================
FILE: pydoll/protocol/target/events.py
================================================
from enum import Enum

from typing_extensions import NotRequired, TypedDict

from pydoll.protocol.base import CDPEvent
from pydoll.protocol.target.types import SessionID, TargetID, TargetInfo


class TargetEvent(str, Enum):
    """
    Events from the Target domain of the Chrome DevTools Protocol.

    This enumeration contains the names of Target-related events that can be
    received from the Chrome DevTools Protocol. These events provide information
    about target creation, destruction, and communication between targets.

    Each member's value is the fully-qualified `Target.<eventName>` string, and
    because the enum also subclasses `str`, members compare equal to those
    plain strings. The string that follows each member documents the payload
    keys of the corresponding event.
    """

    RECEIVED_MESSAGE_FROM_TARGET = 'Target.receivedMessageFromTarget'
    """
    Notifies about a new protocol message received from the session
    (as reported in attachedToTarget event).

    Args:
        sessionId (SessionID): Identifier of a session which sends a message.
        message (str): The message content.
        targetId (TargetID): Deprecated.
    """

    TARGET_CRASHED = 'Target.targetCrashed'
    """
    Issued when a target has crashed.

    Args:
        targetId (TargetID): Identifier of the crashed target.
        status (str): Termination status type.
        errorCode (int): Termination error code.
    """

    TARGET_CREATED = 'Target.targetCreated'
    """
    Issued when a possible inspection target is created.

    Args:
        targetInfo (TargetInfo): Information about the created target.
    """

    TARGET_DESTROYED = 'Target.targetDestroyed'
    """
    Issued when a target is destroyed.

    Args:
        targetId (TargetID): Identifier of the destroyed target.
    """

    TARGET_INFO_CHANGED = 'Target.targetInfoChanged'
    """
    Issued when some information about a target has changed.
    This only happens between targetCreated and targetDestroyed.

    Args:
        targetInfo (TargetInfo): Updated information about the target.
    """

    ATTACHED_TO_TARGET = 'Target.attachedToTarget'
    """
    Issued when attached to target because of auto-attach or attachToTarget command.

    Args:
        sessionId (SessionID): Identifier assigned to the session used to send/receive messages.
        targetInfo (TargetInfo): Information about the target.
        waitingForDebugger (bool): Whether the target is waiting for debugger to attach.
    """

    DETACHED_FROM_TARGET = 'Target.detachedFromTarget'
    """
    Issued when detached from target for any reason (including detachFromTarget command).
    Can be issued multiple times per target if multiple sessions have been attached to it.

    Args:
        sessionId (SessionID): Detached session identifier.
        targetId (TargetID): Deprecated.
    """


class AttachedToTargetParams(TypedDict):
    """Parameters for the `attachedToTarget` event; all keys are required."""

    sessionId: SessionID
    targetInfo: TargetInfo
    waitingForDebugger: bool


class DetachedFromTargetParams(TypedDict):
    """Parameters for the `detachedFromTarget` event."""

    sessionId: SessionID
    # Optional; the `TargetEvent` documentation marks this key as deprecated.
    targetId: NotRequired[TargetID]


class ReceivedMessageFromTargetParams(TypedDict):
    """Parameters for the `receivedMessageFromTarget` event."""

    sessionId: SessionID
    message: str
    # Optional; the `TargetEvent` documentation marks this key as deprecated.
    targetId: NotRequired[TargetID]


class TargetCreatedParams(TypedDict):
    """Parameters for the `targetCreated` event; `targetInfo` is required."""

    targetInfo: TargetInfo


class TargetDestroyedParams(TypedDict):
    """Parameters for the `targetDestroyed` event; `targetId` is required."""

    targetId: TargetID


class TargetCrashedParams(TypedDict):
    """Parameters for the `targetCrashed` event; all keys are required."""

    targetId: TargetID
    # Termination status type and error code, per the `TargetEvent` documentation.
    status: str
    errorCode: int


class TargetInfoChangedParams(TypedDict):
    """Parameters for the `targetInfoChanged` event; `targetInfo` is required."""

    targetInfo: TargetInfo


# Typed event aliases: each binds the generic `CDPEvent` to the params TypedDict
# of one Target event, so handlers can annotate the payload they receive.
AttachedToTargetEvent = CDPEvent[AttachedToTargetParams]
DetachedFromTargetEvent = CDPEvent[DetachedFromTargetParams]
ReceivedMessageFromTargetEvent = CDPEvent[ReceivedMessageFromTargetParams]
TargetCreatedEvent = CDPEvent[TargetCreatedParams]
TargetDestroyedEvent = CDPEvent[TargetDestroyedParams]
TargetCrashedEvent = CDPEvent[TargetCrashedParams]
TargetInfoChangedEvent = CDPEvent[TargetInfoChangedParams]


================================================
FILE: pydoll/protocol/target/methods.py
================================================
from enum import Enum

from typing_extensions import NotRequired, TypedDict

from pydoll.protocol.base import Command, EmptyParams, EmptyResponse, Response
from pydoll.protocol.browser.types import BrowserContextID, WindowState
from pydoll.protocol.target.types import (
    RemoteLocation,
    SessionID,
    TargetFilter,
    TargetID,
    TargetInfo,
)


class TargetMethod(str, Enum):
    """Target domain method names.

    Every member's value is the fully-qualified `Target.<methodName>` string.
    Because the enum also subclasses `str`, members compare equal to those
    plain strings.
    """

    ACTIVATE_TARGET = 'Target.activateTarget'
    ATTACH_TO_TARGET = 'Target.attachToTarget'
    ATTACH_TO_BROWSER_TARGET = 'Target.attachToBrowserTarget'
    CLOSE_TARGET = 'Target.closeTarget'
    EXPOSE_DEV_TOOLS_PROTOCOL = 'Target.exposeDevToolsProtocol'
    CREATE_BROWSER_CONTEXT = 'Target.createBrowserContext'
    GET_BROWSER_CONTEXTS = 'Target.getBrowserContexts'
    CREATE_TARGET = 'Target.createTarget'
    DETACH_FROM_TARGET = 'Target.detachFromTarget'
    DISPOSE_BROWSER_CONTEXT = 'Target.disposeBrowserContext'
    GET_TARGET_INFO = 'Target.getTargetInfo'
    GET_TARGETS = 'Target.getTargets'
    SEND_MESSAGE_TO_TARGET = 'Target.sendMessageToTarget'
    SET_AUTO_ATTACH = 'Target.setAutoAttach'
    AUTO_ATTACH_RELATED = 'Target.autoAttachRelated'
    SET_DISCOVER_TARGETS = 'Target.setDiscoverTargets'
    SET_REMOTE_LOCATIONS = 'Target.setRemoteLocations'
    OPEN_DEV_TOOLS = 'Target.openDevTools'


# Parameter types
class ActivateTargetParams(TypedDict):
    """Parameters for the activateTarget command; `targetId` is required."""

    targetId: TargetID


class AttachToTargetParams(TypedDict):
    """Parameters for the attachToTarget command."""

    targetId: TargetID
    # Optional: may be omitted entirely.
    # NOTE(review): presumably enables "flat" session access via `sessionId` —
    # confirm against the CDP Target specification.
    flatten: NotRequired[bool]


class AttachToBrowserTargetParams(TypedDict):
    """Parameters for the attachToBrowserTarget command.

    The CDP specification declares no parameters for this command; the session
    id is produced by it (see `AttachToBrowserTargetResult`), not supplied to
    it. `sessionId` is therefore optional. It is kept rather than removed so
    that existing callers which still pass it continue to type-check.
    """

    # Optional: an empty dict is a valid payload.
    sessionId: NotRequired[SessionID]


class CloseTargetParams(TypedDict):
    """Parameters for the closeTarget command; `targetId` is required."""

    targetId: TargetID


class ExposeDevToolsProtocolParams(TypedDict):
    """Parameters for the exposeDevToolsProtocol command."""

    targetId: TargetID
    # Optional keys: may be omitted entirely.
    bindingName: NotRequired[str]
    inheritPermissions: NotRequired[bool]


class CreateBrowserContextParams(TypedDict):
    """Parameters for the createBrowserContext command.

    Every key is optional, so an empty dict is a valid payload.
    """

    disposeOnDetach: NotRequired[bool]
    proxyServer: NotRequired[str]
    # A single string, not a list, unlike `originsWithUniversalNetworkAccess`.
    proxyBypassList: NotRequired[str]
    originsWithUniversalNetworkAccess: NotRequired[list[str]]


class CreateTargetParams(TypedDict):
    """Parameters for the createTarget command.

    Only `url` is required; every other key may be omitted.
    """

    url: str
    # Optional window geometry.
    # NOTE(review): units not stated here — presumably device-independent
    # pixels; confirm against the CDP Target specification.
    left: NotRequired[int]
    top: NotRequired[int]
    width: NotRequired[int]
    height: NotRequired[int]
    # Uses the browser domain's `WindowState` type.
    windowState: NotRequired[WindowState]
    browserContextId: NotRequired[BrowserContextID]
    enableBeginFrameControl: NotRequired[bool]
    newWindow: NotRequired[bool]
    background: NotRequired[bool]
    forTab: NotRequired[bool]
    hidden: NotRequired[bool]


class DetachFromTargetParams(TypedDict):
    """Parameters for the detachFromTarget command.

    Both keys are optional at the type level.
    """

    sessionId: NotRequired[SessionID]
    targetId: NotRequired[TargetID]


class DisposeBrowserContextParams(TypedDict):
    """Parameters for the disposeBrowserContext command; `browserContextId` is required."""

    browserContextId: BrowserContextID


class GetTargetInfoParams(TypedDict):
    """Parameters for the getTargetInfo command; an empty dict is a valid payload."""

    # Optional: may be omitted entirely.
    targetId: NotRequired[TargetID]


class GetTargetsParams(TypedDict):
    """Parameters for the getTargets command; an empty dict is a valid payload."""

    # Optional: may be omitted entirely.
    filter: NotRequired[TargetFilter]


class SendMessageToTargetParams(TypedDict):
    """Parameters for the sendMessageToTarget command.

    Only `message` is required.
    """

    message: str
    # Optional keys: may be omitted entirely.
    sessionId: NotRequired[SessionID]
    targetId: NotRequired[TargetID]


class SetAutoAttachParams(TypedDict):
    """Parameters for the setAutoAttach command."""

    # Required keys.
    autoAttach: bool
    waitForDebuggerOnStart: bool
    # Optional keys: may be omitted entirely.
    flatten: NotRequired[bool]
    filter: NotRequired[TargetFilter]


class AutoAttachRelatedParams(TypedDict):
    """Parameters for the autoAttachRelated command."""

    # Required keys.
    targetId: TargetID
    waitForDebuggerOnStart: bool
    # Optional: may be omitted entirely.
    filter: NotRequired[TargetFilter]


class SetDiscoverTargetsParams(TypedDict):
    """Parameters for the setDiscoverTargets command."""

    discover: bool
    # Optional: may be omitted entirely.
    filter: NotRequired[TargetFilter]


class SetRemoteLocationsParams(TypedDict):
    """Parameters for the setRemoteLocations command.

    ``locations`` is a required key holding a list of ``RemoteLocation``
    dictionaries.
    """

    locations: list[RemoteLocation]


class OpenDevToolsParams(TypedDict):
    """Parameters for the openDevTools command.

    ``targetId`` is a required key.
    """

    targetId: TargetID


# Result types
class AttachToTargetResult(TypedDict):
    """Result for the attachToTarget command.

    Holds a single required key, ``sessionId``.
    """

    sessionId: SessionID


class AttachToBrowserTargetResult(TypedDict):
    """Result for the attachToBrowserTarget command.

    Holds a single required key, ``sessionId``.
    """

    sessionId: SessionID


class CloseTargetResult(TypedDict):
    """Result for the closeTarget command.

    Holds a single required boolean key, ``success``.
    """

    success: bool


class CreateBrowserContextResult(TypedDict):
    """Result for the createBrowserContext command.

    Holds a single required key, ``browserContextId``.
    """

    browserContextId: BrowserContextID


class GetBrowserContextsResult(TypedDict):
    """Result for the getBrowserContexts command.

    Holds a single required key, ``browserContextIds``, a list of
    ``BrowserContextID`` values.
    """

    browserContextIds: list[BrowserContextID]


class CreateTargetResult(TypedDict):
    """Result for the createTarget command.

    Holds a single required key, ``targetId``.
    """

    targetId: TargetID


class GetTargetInfoResult(TypedDict):
    """Result for the getTargetInfo command.

    Holds a single required key, ``targetInfo``, a ``TargetInfo`` dictionary.
    """

    targetInfo: TargetInfo


class GetTargetsResult(TypedDict):
    """Result for the getTargets command.

    Holds a single required key, ``targetInfos``, a list of ``TargetInfo``
    dictionaries.
    """

    targetInfos: list[TargetInfo]


class OpenDevToolsResult(TypedDict):
    """Result for the openDevTools command.

    Holds a single required key, ``targetId``.
    """

    targetId: TargetID


# Response types
# Each alias parameterizes the generic ``Response`` with the result TypedDict
# of one command, so that command's response has a dedicated name.
AttachToTargetResponse = Response[AttachToTargetResult]
AttachToBrowserTargetResponse = Response[AttachToBrowserTargetResult]
CloseTargetResponse = Response[CloseTargetResult]
CreateBrowserContextResponse = Response[CreateBrowserContextResult]
GetBrowserContextsResponse = Response[GetBrowserContextsResult]
CreateTargetResponse = Response[CreateTargetResult]
GetTargetInfoResponse = Response[GetTargetInfoResult]
GetTargetsResponse = Response[GetTargetsResult]
OpenDevToolsResponse = Response[OpenDevToolsResult]


# Command types
# Each alias has the form ``Command[<params type>, <response type>]``.
# Commands without a params TypedDict of their own use ``EmptyParams``;
# commands without a result TypedDict of their own use
# ``Response[EmptyResponse]``.
ActivateTargetCommand = Command[ActivateTargetParams, Response[EmptyResponse]]
AttachToTargetCommand = Command[AttachToTargetParams, AttachToTargetResponse]
AttachToBrowserTargetCommand = Command[EmptyParams, AttachToBrowserTargetResponse]
CloseTargetCommand = Command[CloseTargetParams, CloseTargetResponse]
ExposeDevToolsProtocolCommand = Command[ExposeDevToolsProtocolParams, Response[EmptyResponse]]
CreateBrowserContextCommand = Command[CreateBrowserContextParams, CreateBrowserContextResponse]
GetBrowserContextsCommand = Command[EmptyParams, GetBrowserContextsResponse]
CreateTargetCommand = Command[CreateTargetParams, CreateTargetResponse]
DetachFromTargetCommand = Command[DetachFromTargetParams, Response[EmptyResponse]]
DisposeBrowserContextCommand = Command[DisposeBrowserContextParams, Response[EmptyResponse]]
GetTargetInfoCommand = Command[GetTargetInfoParams, GetTargetInfoResponse]
GetTargetsCommand = Command[GetTargetsParams, GetTargetsResponse]
SendMessageToTargetCommand = Command[SendMessageToTargetParams, Response[EmptyResponse]]
SetAutoAttachCommand = Command[SetAutoAttachParams, Response[EmptyResponse]]
AutoAttachRelatedCommand = Command[AutoAttachRelatedParams, Response[EmptyResponse]]
SetDiscoverTargetsCommand = Command[SetDiscoverTargetsParams, Response[EmptyResponse]]
SetRemoteLocationsCommand = Command[SetRemoteLocationsParams, Response[EmptyResponse]]
OpenDevToolsCommand = Command[OpenDevToolsParams, OpenDevToolsResponse]


================================================
FILE: pydoll/protocol/target/types.py
================================================
from typing_extensions import NotRequired, TypedDict

from pydoll.protocol.browser.types import BrowserContextID
from pydoll.protocol.page.types import FrameId

# Both identifiers are plain ``str`` at runtime; the aliases only give the
# annotations below (and in other modules) a more descriptive name.
TargetID = str
SessionID = str


class TargetInfo(TypedDict):
    """Dictionary describing one target.

    ``targetId``, ``type``, ``title``, ``url`` and ``attached`` are required;
    the remaining keys are declared ``NotRequired`` and may be absent.
    """

    targetId: TargetID
    type: str
    title: str
    url: str
    attached: bool
    openerId: NotRequired[TargetID]
    canAccessOpener: NotRequired[bool]
    openerFrameId: NotRequired[FrameId]
    browserContextId: NotRequired[BrowserContextID]
    subtype: NotRequired[str]


class FilterEntry(TypedDict, total=False):
    """A filter used by target query/discovery/auto-attach operations.

    Declared with ``total=False``, so both ``exclude`` and ``type`` are
    optional keys.
    """

    exclude: bool
    type: str


# A target filter is an ordered list of ``FilterEntry`` dictionaries.
TargetFilter = list[FilterEntry]


class RemoteLocation(TypedDict):
    """A host/port pair; both ``host`` and ``port`` are required keys."""

    host: str
    port: int


================================================
FILE: pydoll/py.typed
================================================


================================================
FILE: pydoll/utils/__init__.py
================================================
from pydoll.utils.general import (
    TextExtractor,
    clean_script_for_analysis,
    decode_base64_to_bytes,
    extract_text_from_html,
    get_browser_ws_address,
    has_return_outside_function,
    is_script_already_function,
    normalize_synthetic_xpath,
    validate_browser_paths,
)
from pydoll.utils.socks5_proxy_forwarder import SOCKS5Forwarder
from pydoll.utils.user_agent_parser import UserAgentParser

# Public names of ``pydoll.utils``: the helpers imported from
# ``pydoll.utils.general`` plus ``SOCKS5Forwarder`` and ``UserAgentParser``.
__all__ = [
    'TextExtractor',
    'clean_script_for_analysis',
    'decode_base64_to_bytes',
    'extract_text_from_html',
    'get_browser_ws_address',
    'has_return_outside_function',
    'is_script_already_function',
    'normalize_synthetic_xpath',
    'validate_browser_paths',
    'SOCKS5Forwarder',
    'UserAgentParser',
]


================================================
FILE: pydoll/utils/bundle.py
================================================
"""Utility functions for saving page bundles (HTML + assets as .zip)."""

from __future__ import annotations

import base64 as _b64
import posixpath
import re
from urllib.parse import urljoin, urlparse

from pydoll.protocol.network.types import ResourceType
from pydoll.protocol.page.types import FrameResource, FrameResourceTree

# Resource types kept by ``filter_fetchable_resources``; a resource of any
# other type is left out of the bundle.
_BUNDLEABLE_RESOURCE_TYPES: frozenset[ResourceType] = frozenset({
    ResourceType.DOCUMENT,
    ResourceType.STYLESHEET,
    ResourceType.SCRIPT,
    ResourceType.IMAGE,
    ResourceType.FONT,
    ResourceType.MEDIA,
})

# MIME type -> file extension. ``build_asset_filename`` consults this table
# only when the URL's basename contains no '.'; unknown types add no extension.
_MIME_TO_EXT: dict[str, str] = {
    'text/css': '.css',
    'text/javascript': '.js',
    'application/javascript': '.js',
    'application/x-javascript': '.js',
    'text/html': '.html',
    'text/plain': '.txt',
    'image/png': '.png',
    'image/jpeg': '.jpg',
    'image/gif': '.gif',
    'image/svg+xml': '.svg',
    'image/webp': '.webp',
    'image/x-icon': '.ico',
    'image/vnd.microsoft.icon': '.ico',
    'font/woff': '.woff',
    'font/woff2': '.woff2',
    'application/font-woff': '.woff',
    'application/font-woff2': '.woff2',
    'font/ttf': '.ttf',
    'font/otf': '.otf',
    'application/x-font-ttf': '.ttf',
    'application/x-font-otf': '.otf',
    'video/mp4': '.mp4',
    'video/webm': '.webm',
    'audio/mpeg': '.mp3',
    'audio/ogg': '.ogg',
    'application/json': '.json',
    'application/xml': '.xml',
    'text/xml': '.xml',
}

# Matches a CSS ``url(...)`` token, case-insensitively. Group 1 is the optional
# opening quote (which must be repeated as the closing quote) and group 2 is
# the raw URL text used by ``rewrite_css_urls`` and ``inline_css_urls``.
_CSS_URL_RE = re.compile(r'url\(\s*(["\']?)(.*?)\1\s*\)', re.IGNORECASE)


def filter_fetchable_resources(
    all_resources: list[tuple[str, FrameResource]],
    page_url: str,
) -> list[tuple[str, FrameResource]]:
    """Return the ``(frame id, resource)`` pairs that should be bundled.

    A pair is dropped when its resource is flagged ``failed`` or ``canceled``,
    when its URL equals *page_url* or is a ``data:`` URI, or when its type is
    not listed in ``_BUNDLEABLE_RESOURCE_TYPES``. Input order is preserved.
    """

    def _is_fetchable(resource: FrameResource) -> bool:
        if resource.get('failed') or resource.get('canceled'):
            return False
        resource_url = resource['url']
        if resource_url == page_url or resource_url.startswith('data:'):
            return False
        return resource['type'] in _BUNDLEABLE_RESOURCE_TYPES

    return [
        (frame_id, resource)
        for frame_id, resource in all_resources
        if _is_fetchable(resource)
    ]


def collect_frame_resources(
    frame_tree: FrameResourceTree,
) -> list[tuple[str, FrameResource]]:
    """Flatten a frame tree into ``(frame id, resource)`` pairs.

    Frames are visited depth-first, a parent before its children and children
    in their listed order. Each resource is paired with the id of the frame
    that lists it. A missing ``resources`` or ``childFrames`` key counts as an
    empty list.
    """
    collected: list[tuple[str, FrameResource]] = []
    pending = [frame_tree]
    while pending:
        node = pending.pop()
        owner_id = node['frame']['id']
        for resource in node.get('resources', []):
            collected.append((owner_id, resource))
        # Push children reversed so the first child is popped (visited) first.
        pending.extend(reversed(node.get('childFrames', [])))
    return collected


def build_asset_filename(url: str, mime_type: str, index: int) -> str:
    """Derive a bundle filename of the form ``<index>_<basename>``.

    The basename is the last segment of the URL path, or ``resource`` when
    the path has none. If the basename contains no ``.``, an extension looked
    up in ``_MIME_TO_EXT`` (parameters after ``;`` ignored) is appended when
    one is known. *index* is zero-padded to at least four digits.
    """
    url_path = urlparse(url).path
    stem = posixpath.basename(url_path) if url_path else ''
    if stem in {'', '/'}:
        stem = 'resource'
    if '.' in stem:
        return f'{index:04d}_{stem}'
    essence = mime_type.split(';')[0].strip()
    return f'{index:04d}_{stem}{_MIME_TO_EXT.get(essence, "")}'


def rewrite_css_urls(
    css_text: str,
    css_url: str,
    asset_map: dict[str, tuple[str, bytes, str, ResourceType]],
) -> str:
    """Point ``url()`` references in a stylesheet at bundled asset filenames.

    Each reference is resolved against *css_url*; when the absolute URL is a
    key of *asset_map* the token becomes ``url("<filename>")``. ``data:`` URIs
    and references without a map entry are left exactly as written.
    """

    def _localize(found: re.Match[str]) -> str:
        reference = found.group(2)
        if not reference.startswith('data:'):
            asset = asset_map.get(urljoin(css_url, reference))
            if asset is not None:
                local_name = asset[0]
                return f'url("{local_name}")'
        return found.group(0)

    return _CSS_URL_RE.sub(_localize, css_text)


def inline_css_urls(
    css_text: str,
    css_url: str,
    asset_map: dict[str, tuple[str, bytes, str, ResourceType]],
) -> str:
    """Embed the targets of ``url()`` references in a stylesheet as data URIs.

    Each reference is resolved against *css_url*; when the absolute URL is a
    key of *asset_map* the token becomes ``url("data:<mime>;base64,<payload>")``
    built from that entry's bytes and MIME type. Existing ``data:`` URIs and
    references without a map entry are left exactly as written.
    """

    def _embed(found: re.Match[str]) -> str:
        reference = found.group(2)
        if not reference.startswith('data:'):
            asset = asset_map.get(urljoin(css_url, reference))
            if asset is not None:
                payload = _b64.b64encode(asset[1]).decode('ascii')
                content_type = asset[2]
                return f'url("data:{content_type};base64,{payload}")'
        return found.group(0)

    return _CSS_URL_RE.sub(_embed, css_text)


def replace_stylesheet_with_inline(html: str, url: str, css_text: str) -> str:
    """Replace a <link> stylesheet tag with an inline <style> block.

    Only the first ``<link ...>`` tag whose ``href`` equals *url* (matched
    case-insensitively, quoted or unquoted) is replaced; *html* is returned
    unchanged when no such tag exists.

    Any ``</style`` sequence inside *css_text* is rewritten to ``<\\/style``
    so it cannot close the generated element early. Within a CSS string or
    ``url()`` the backslash escape still denotes ``/``.
    """
    link_tag = re.compile(
        rf'<link\b[^>]*href=["\']?{re.escape(url)}["\']?[^>]*/?>',
        re.IGNORECASE,
    )
    # HTML tag names are case-insensitive, so escape every casing of the closer.
    safe_css = re.sub(r'</(style)', r'<\\/\1', css_text, flags=re.IGNORECASE)
    replacement = f'<style>{safe_css}</style>'
    # A callable replacement keeps backslashes in the CSS from being read as
    # regex group references.
    return link_tag.sub(lambda _: replacement, html, count=1)


def replace_script_with_inline(html: str, url: str, js_text: str) -> str:
    """Replace a <script src=...> tag with an inline <script> block.

    Only the first ``<script ... src=url ...></script>`` element (matched
    case-insensitively, quoted or unquoted ``src``) is replaced; *html* is
    returned unchanged when no such element exists.

    Any ``</script`` sequence inside *js_text*, in any letter case and whatever
    follows it, is rewritten to ``<\\/script`` so it cannot close the generated
    element early. Inside a JavaScript string or regex literal the escaped
    form means the same thing.
    """
    script_tag = re.compile(
        rf'<script\b[^>]*src=["\']?{re.escape(url)}["\']?[^>]*>\s*</script>',
        re.IGNORECASE,
    )
    # Escaping only the exact text '</script>' would miss '</SCRIPT>' and
    # '</script >', both of which also end a script element.
    safe_js = re.sub(r'</(script)', r'<\\/\1', js_text, flags=re.IGNORECASE)
    replacement = f'<script>{safe_js}</script>'
    # A callable replacement keeps backslashes in the JS from being read as
    # regex group references.
    return script_tag.sub(lambda _: replacement, html, count=1)


def rewrite_html_urls(
    html: str,
    asset_map: dict[str, tuple[str, bytes, str, ResourceType]],
) -> str:
    """Rewrite asset URLs in HTML to point to local assets/ directory.

    Every occurrence of an asset URL in *html* is replaced with
    ``assets/<filename>``. As a side effect, each stylesheet entry of
    *asset_map* is updated in place: its bytes are decoded as UTF-8 (invalid
    sequences replaced), its ``url()`` references are rewritten with
    ``rewrite_css_urls``, and the result is stored back under the same key.

    Returns:
        The HTML with asset URLs rewritten.
    """
    # Replace the longest URLs first. With plain substring replacement, a
    # short URL that is a prefix of a longer one (``.../img`` and
    # ``.../img/logo.png``) would otherwise mangle the longer URL before its
    # own turn comes. Iterating a sorted snapshot of the keys also avoids
    # reassigning entries while iterating the dict itself.
    for url in sorted(asset_map, key=len, reverse=True):
        filename, data, mime, rtype = asset_map[url]
        if rtype == ResourceType.STYLESHEET:
            css_text = data.decode('utf-8', errors='replace')
            rewritten_css = rewrite_css_urls(css_text, url, asset_map)
            asset_map[url] = (filename, rewritten_css.encode('utf-8'), mime, rtype)
        html = html.replace(url, f'assets/{filename}')
    return html


def inline_all_assets(
    html: str,
    asset_map: dict[str, tuple[str, bytes, str, ResourceType]],
) -> str:
    """Embed all assets inline into the HTML.

    Stylesheets replace their ``<link>`` tag with a ``<style>`` block, after
    their own ``url()`` references are turned into data URIs. Scripts replace
    their ``<script src>`` tag with an inline ``<script>`` block. Every other
    asset has each occurrence of its URL replaced with a base64 ``data:`` URI.
    Text assets are decoded as UTF-8 with invalid sequences replaced.

    Returns:
        The HTML with assets embedded.
    """
    # Handle the longest URLs first. The data-URI branch uses plain substring
    # replacement, so a short URL that is a prefix of a longer one would
    # otherwise corrupt the longer URL before it is processed.
    for url in sorted(asset_map, key=len, reverse=True):
        _, data, mime, rtype = asset_map[url]
        if rtype == ResourceType.STYLESHEET:
            css_text = data.decode('utf-8', errors='replace')
            css_text = inline_css_urls(css_text, url, asset_map)
            html = replace_stylesheet_with_inline(html, url, css_text)
        elif rtype == ResourceType.SCRIPT:
            js_text = data.decode('utf-8', errors='replace')
            html = replace_script_with_inline(html, url, js_text)
        else:
            b64 = _b64.b64encode(data).decode('ascii')
            data_uri = f'data:{mime};base64,{b64}'
            html = html.replace(url, data_uri)
    return html


================================================
FILE: pydoll/utils/general.py
================================================
import base64
import logging
import os
import re
from html import unescape
from html.parser import HTMLParser

import aiohttp

from pydoll.exceptions import InvalidBrowserPath, InvalidResponse, NetworkError

logger = logging.getLogger(__name__)


class TextExtractor(HTMLParser):
    """
    HTML parser for text extraction.

    Extracts visible text content from an HTML string, excluding the contents of
    tags specified in _skip_tags. Skip tags may be nested: text is collected
    again only once every open skip tag has been closed.
    """

    def __init__(self):
        super().__init__()
        self._parts: list[str] = []
        # Number of skip tags currently open. A counter, not a flag, so that
        # ``<template><style>..</style>text</template>`` keeps skipping
        # ``text`` after the inner ``</style>``.
        self._skip_depth = 0
        self._skip_tags = {'script', 'style', 'template'}

    @property
    def _skip(self) -> bool:
        """Whether the parser is currently inside at least one skip tag."""
        return self._skip_depth > 0

    @_skip.setter
    def _skip(self, value: bool) -> None:
        # Kept so code that assigned the former boolean flag keeps working.
        self._skip_depth = 1 if value else 0

    def handle_starttag(self, tag, attrs):
        """
        Marks the parser to skip content inside tags specified in _skip_tags.

        Args:
            tag (str): The tag name.
            attrs (list): A list of (attribute, value) pairs.
        """
        if tag in self._skip_tags:
            self._skip_depth += 1

    def handle_endtag(self, tag):
        """
        Marks the parser the end of skip tags.

        A stray end tag with no matching start tag is ignored.

        Args:
            tag (str): The tag name.
        """
        if tag in self._skip_tags and self._skip_depth > 0:
            self._skip_depth -= 1

    def handle_data(self, data):
        """
        Handles text nodes. Adds them to the result unless they are within a skip tag.

        The parser is created with the default ``convert_charrefs=True``, so
        character references in ``data`` are already decoded. Decoding again
        would turn a literal ``&amp;lt;`` into ``<``.

        Args:
            data (str): The text data.
        """
        if self._skip_depth == 0:
            self._parts.append(data)

    def get_strings(self, strip: bool):
        """
        Yields all collected visible text fragments.

        Args:
            strip (bool): Whether to strip leading/trailing whitespace from each fragment.

        Yields:
            str: Visible text fragments.
        """
        for text in self._parts:
            yield text.strip() if strip else text

    def get_text(self, separator: str, strip: bool) -> str:
        """
        Returns all visible text.

        Args:
            separator (str): String inserted between extracted text fragments.
            strip (bool): Whether to strip whitespace from each fragment.

        Returns:
            str: The visible text.
        """
        return separator.join(self.get_strings(strip=strip))


def extract_text_from_html(html: str, separator: str = '', strip: bool = False) -> str:
    """
    Extracts visible text content from an HTML string.

    Args:
        html (str): The HTML string to extract text from.
        separator (str, optional): String inserted between extracted text fragments. Defaults to ''.
        strip (bool, optional): Whether to strip whitespace from text fragments. Defaults to False.

    Returns:
        str: The extracted visible text.
    """
    parser = TextExtractor()
    parser.feed(html)
    # feed() may hold back trailing text that ends in an unterminated '&'
    # (e.g. "AT&T") in case more input follows; close() flushes it.
    parser.close()
    return parser.get_text(separator=separator, strip=strip)


def decode_base64_to_bytes(image: str) -> bytes:
    """
    Decodes a base64 image string to bytes.

    The text is first encoded as UTF-8 and the resulting bytes are handed to
    the base64 decoder.

    Args:
        image (str): The base64 image string to decode.

    Returns:
        bytes: The decoded image as bytes.
    """
    encoded = bytes(image, 'utf-8')
    return base64.b64decode(encoded)


async def get_browser_ws_address(port: int) -> str:
    """
    Fetches the WebSocket address for the browser instance.

    Requests ``http://localhost:{port}/json/version`` and returns the
    ``webSocketDebuggerUrl`` field of the JSON reply.

    Args:
        port (int): Local port on which the browser serves its debugging endpoint.

    Returns:
        str: The WebSocket address for the browser.

    Raises:
        NetworkError: If the request fails with an ``aiohttp.ClientError``
            (this includes the error raised by ``raise_for_status()``).
        InvalidResponse: If the response body is not valid JSON or does not
            contain ``webSocketDebuggerUrl``.
    """
    try:
        async with aiohttp.ClientSession() as session:
            async with session.get(f'http://localhost:{port}/json/version') as response:
                response.raise_for_status()
                data = await response.json()
                return data['webSocketDebuggerUrl']

    except aiohttp.ClientError as e:
        raise NetworkError(f'Failed to get browser ws address: {e}') from e

    except (KeyError, ValueError) as e:
        # json.JSONDecodeError is a ValueError, so a malformed body is reported
        # the same way as a missing key.
        raise InvalidResponse(f'Failed to get browser ws address: {e}') from e


def validate_browser_paths(paths: list[str]) -> str:
    """
    Picks the first usable browser executable from a list of candidate paths.

    A candidate is usable when it is an existing regular file and the current
    process is allowed to execute it. Candidates are tried in the order given.

    Args:
        paths: Candidate file paths for the browser executable.

    Returns:
        str: The first candidate that is an executable file.

    Raises:
        InvalidBrowserPath: If none of the candidates is an executable file.
    """
    usable = next(
        (
            candidate
            for candidate in paths
            if os.path.isfile(candidate) and os.access(candidate, os.X_OK)
        ),
        None,
    )
    if usable is None:
        raise InvalidBrowserPath(f'No valid browser path found in: {paths}')
    return usable


# One alternative per construct that must be blanked. They are tried at each
# position from left to right, so whichever construct starts first wins: a
# '//' inside a string is part of the string, and a quote inside a comment is
# part of the comment.
_JS_LITERAL_OR_COMMENT_RE = re.compile(
    r'//[^\n]*'  # line comment, up to (not including) the newline
    r'|/\*[\s\S]*?\*/'  # block comment
    r'|"(?:\\[\s\S]|[^"\\])*"'  # double-quoted string, honouring \" escapes
    r"|'(?:\\[\s\S]|[^'\\])*'"  # single-quoted string, honouring \' escapes
    r'|`(?:\\[\s\S]|[^`\\])*`'  # template literal, honouring \` escapes
)


def clean_script_for_analysis(script: str) -> str:
    """
    Clean JavaScript code by removing comments and string literals.

    This helps avoid false positives when analyzing script structure.
    Comments are deleted; string and template literals are replaced by an
    empty literal of the same quote style (``""``, ``''`` or two backticks).

    The script is scanned once from left to right, so comment markers inside
    a string (for example ``"http://example.com"``) are not treated as
    comments and escaped quotes do not end a string early. Regular-expression
    literals are not recognized.

    Args:
        script: JavaScript code to clean.

    Returns:
        str: Cleaned script with comments and strings removed.
    """

    def _blank(token: re.Match[str]) -> str:
        text = token.group(0)
        if text.startswith('/'):
            return ''
        # Keep an empty literal so the surrounding expression stays well formed.
        return text[0] * 2

    return _JS_LITERAL_OR_COMMENT_RE.sub(_blank, script)


def is_script_already_function(script: str) -> bool:
    """
    Tell whether a JavaScript snippet starts as a function expression.

    After comments and string literals are removed and surrounding whitespace
    is trimmed, the snippet must begin with either ``function (...) {`` or
    ``(...) => {``.

    Args:
        script: JavaScript code to analyze.

    Returns:
        bool: True if the snippet begins with one of the two forms above,
            False otherwise.
    """
    candidate = clean_script_for_analysis(script).strip()
    openers = (
        r'^\s*function\s*\([^)]*\)\s*\{',
        r'^\s*\([^)]*\)\s*=>\s*\{',
    )
    return any(re.match(opener, candidate) for opener in openers)


def has_return_outside_function(script: str) -> bool:
    """
    Check if a JavaScript script has return statements outside of functions.

    The cleaned script is scanned token by token, tracking which open braces
    belong to a function body. A brace counts as a function body when it is
    the block that follows a ``function`` keyword (after its parameter list)
    or when it directly follows ``=>``. A ``return`` seen while no function
    body is open is reported.

    Working per token rather than per line means a function written on a
    single line, such as ``function f() { return 1; }``, is not mistaken for
    a top-level return. Methods declared without the ``function`` keyword
    (class or object-literal shorthand) are not recognized as functions.

    Args:
        script: JavaScript code to analyze.

    Returns:
        bool: True if script has return outside function, False otherwise.
    """
    cleaned_script = clean_script_for_analysis(script)

    # If already a function, no need to check
    if is_script_already_function(cleaned_script):
        return False

    token_pattern = r'\bfunction\b|\breturn\b|=>\s*\{|[(){}]'
    paren_depth = 0
    # Paren depth at which the latest `function` keyword appeared while its
    # body brace has not been seen yet; None when no body is pending.
    awaiting_body_at = None
    # One flag per currently open '{': True when it opens a function body.
    open_braces = []

    for found in re.finditer(token_pattern, cleaned_script):
        token = found.group(0)
        if token == 'function':
            awaiting_body_at = paren_depth
        elif token == 'return':
            if True not in open_braces:
                return True
        elif token == '(':
            paren_depth += 1
        elif token == ')':
            paren_depth = max(paren_depth - 1, 0)
        elif token == '}':
            if open_braces:
                open_braces.pop()
        elif token == '{':
            # Braces inside the parameter list (default values) sit at a deeper
            # paren depth and therefore do not count as the function body.
            is_body = awaiting_body_at is not None and awaiting_body_at == paren_depth
            if is_body:
                awaiting_body_at = None
            open_braces.append(is_body)
        else:
            # '=> {': arrow function with a block body.
            open_braces.append(True)

    return False


def normalize_synthetic_xpath(selector: str) -> str:
    """
    Unwrap a synthetic XPath selector produced by the builder.

    A selector of the form //*[@xpath="..."] (surrounding whitespace allowed)
    is reduced to the text between the opening ``="`` and the last ``"]``.
    Anything else, including a wrapper with nothing between the quotes, is
    returned exactly as passed in.

    Args:
        selector: The selector string that may contain the synthetic XPath format.

    Returns:
        str: The unwrapped XPath, or the input selector if no unwrapping applies.
    """
    marker = '//*[@xpath="'
    trimmed = selector.strip()
    if trimmed.startswith('//*[@xpath='):
        opening = trimmed.find(marker)
        closing = trimmed.rfind('"]')
        if opening != -1:
            body_start = opening + len(marker)
            if closing != -1 and closing > body_start:
                return trimmed[body_start:closing]
    return selector


================================================
FILE: pydoll/utils/socks5_proxy_forwarder.py
================================================
"""
SOCKS5 Proxy Forwarder — Local no-auth proxy that forwards to a remote
authenticated SOCKS5 proxy.

Chrome/Chromium does NOT support SOCKS5 authentication natively
(Chromium issue #40323993). This module works around that limitation by
running a lightweight local SOCKS5 proxy (no authentication required)
that performs the SOCKS5 handshake with username/password on behalf of
the browser.

Data flow:
    Chrome ──► localhost:{local_port} (no auth)
                    │
              SOCKS5Forwarder
                    │  (authenticates with remote)
                    ▼
           remote_host:remote_port (user/pass auth)
                    │
                    ▼
              destination server

Usage as CLI:
    python -m pydoll.utils.socks5_proxy_forwarder \\
        --remote-host proxy.example.com \\
        --remote-port 1080 \\
        --username myuser \\
        --password mypass \\
        --local-port 1081

Usage with Pydoll:
    import asyncio
    from pydoll.utils import SOCKS5Forwarder
    from pydoll.browser.chromium import Chrome
    from pydoll.browser.options import ChromiumOptions

    async def main():
        forwarder = SOCKS5Forwarder(
            remote_host='proxy.example.com',
            remote_port=1080,
            username='myuser',
            password='mypass',
            local_port=1081,
        )
        async with forwarder:
            options = ChromiumOptions()
            options.add_argument('--proxy-server=socks5://127.0.0.1:1081')
            async with Chrome(options=options) as browser:
                tab = await browser.start()
                await tab.go_to('https://httpbin.org/ip')

    asyncio.run(main())

Requirements: Python >= 3.10, no external dependencies.
"""

from __future__ import annotations

import argparse
import asyncio
import ipaddress
import logging
import signal
import struct
from types import TracebackType

logger = logging.getLogger(__name__)

# Version byte used in the greeting, method-selection and request messages.
SOCKS5_VERSION = 0x05
# Authentication method identifiers exchanged during method negotiation.
AUTH_NO_AUTH = 0x00
AUTH_USERNAME_PASSWORD = 0x02
AUTH_NO_ACCEPTABLE = 0xFF

# The only request command the forwarder accepts from the local client.
CMD_CONNECT = 0x01

# Address-type identifiers (the ATYP byte of a request).
ATYP_IPV4 = 0x01
ATYP_DOMAIN = 0x03
ATYP_IPV6 = 0x04

# Reply codes sent back to the local client.
REPLY_SUCCESS = 0x00
REPLY_GENERAL_FAILURE = 0x01
REPLY_CONNECTION_REFUSED = 0x05
REPLY_COMMAND_NOT_SUPPORTED = 0x07
REPLY_ADDRESS_TYPE_NOT_SUPPORTED = 0x08

# Maximum number of bytes requested per read while piping data.
BUFFER_SIZE = 65536
# Timeout, in seconds, for opening the connection to the remote proxy.
HANDSHAKE_TIMEOUT = 30
# Username and password lengths are each sent as a single byte in the
# authentication request, so their UTF-8 encodings may not exceed this size.
MAX_CREDENTIAL_BYTES = 255


class _suppress_closed:
    """Tiny context manager that silences errors on already-closed transports."""

    def __enter__(self) -> None:
        return None

    def __exit__(
        self,
        exc_type: type[BaseException] | None,
        exc_val: BaseException | None,
        exc_tb: TracebackType | None,
    ) -> bool:
        return exc_type is not None and issubclass(exc_type, OSError)


async def _close_writer(writer: asyncio.StreamWriter) -> None:
    """Close *writer* and wait until its transport has shut down.

    An ``OSError`` raised by either step is ignored, so closing a writer
    whose connection is already gone is harmless.
    """
    try:
        writer.close()
        await writer.wait_closed()
    except OSError:
        # Deliberate best effort: same suppression _suppress_closed provides.
        pass


async def _pipe(
    reader: asyncio.StreamReader,
    writer: asyncio.StreamWriter,
    label: str,
) -> None:
    """Forward data from *reader* to *writer* until EOF.

    Data is copied in chunks of at most ``BUFFER_SIZE`` bytes, waiting for
    the writer to drain after each chunk. The loop ends on EOF or on the
    first ``OSError`` from either side; the error is logged at debug level
    together with *label* (which names the direction) and is not re-raised.
    *writer* is always closed before returning.
    """
    try:
        while data := await reader.read(BUFFER_SIZE):
            writer.write(data)
            await writer.drain()
    except OSError as exc:
        # ConnectionResetError and BrokenPipeError are OSError subclasses, so
        # this single clause covers a peer that vanished mid-transfer.
        logger.debug('Pipe %s stopped by transport error: %s', label, exc)
    finally:
        await _close_writer(writer)


class SOCKS5Forwarder:
    """Local SOCKS5 proxy (no auth) that forwards to a remote authenticated
    SOCKS5 proxy.

    Can be used as an async context manager::

        async with SOCKS5Forwarder(...) as fwd:
            # fwd.local_port is now listening
            ...
    """

    def __init__(
        self,
        remote_host: str,
        remote_port: int,
        username: str,
        password: str,
        local_host: str = '127.0.0.1',
        local_port: int = 0,
    ) -> None:
        """Store the connection settings; no socket is opened here.

        Raises:
            ValueError: If the UTF-8 encoding of *username* or of *password*
                is longer than ``MAX_CREDENTIAL_BYTES``.
        """
        username_size = len(username.encode())
        if username_size > MAX_CREDENTIAL_BYTES:
            raise ValueError('SOCKS5 username must be at most 255 bytes (UTF-8 encoded)')
        password_size = len(password.encode())
        if password_size > MAX_CREDENTIAL_BYTES:
            raise ValueError('SOCKS5 password must be at most 255 bytes (UTF-8 encoded)')

        # Remote (authenticated) proxy.
        self.remote_host = remote_host
        self.remote_port = remote_port
        self.username = username
        self.password = password
        # Local (no-auth) listener; start() replaces local_port with the bound port.
        self.local_host = local_host
        self.local_port = local_port
        self._server: asyncio.Server | None = None

    async def __aenter__(self) -> SOCKS5Forwarder:
        """Start the forwarder and return it, for use with ``async with``."""
        await self.start()
        return self

    async def __aexit__(
        self,
        exc_type: type[BaseException] | None,
        exc_val: BaseException | None,
        exc_tb: TracebackType | None,
    ) -> None:
        """Stop the forwarder when the ``async with`` block is left.

        The exception arguments are ignored and ``None`` is returned, so an
        exception raised inside the block keeps propagating.
        """
        await self.stop()

    async def start(self) -> None:
        """Bind the local listener and begin accepting connections.

        Logs a warning when *local_host* is an IP literal that is not a
        loopback address, and a debug note when it is a hostname other than
        ``localhost``. After binding, ``local_port`` is set to the port that
        was actually bound.

        Raises:
            RuntimeError: If the listening sockets do not all share one port.
                The server is stopped before the error is raised.
        """
        try:
            bind_ip = ipaddress.ip_address(self.local_host)
        except ValueError:
            # Not an IP literal, so whether it is loopback cannot be checked here.
            if self.local_host != 'localhost':
                logger.debug(
                    'local_host=%r is not an IP literal; skipping loopback check',
                    self.local_host,
                )
        else:
            if not bind_ip.is_loopback:
                logger.warning(
                    'Binding to non-loopback address %s — the forwarder will be '
                    'accessible from the network without authentication!',
                    self.local_host,
                )

        self._server = await asyncio.start_server(
            self._handle_client,
            self.local_host,
            self.local_port,
        )

        bound_ports = {sock.getsockname()[1] for sock in self._server.sockets or ()}
        if len(bound_ports) != 1:
            await self.stop()
            raise RuntimeError(
                f'start_server created sockets with different ports: {sorted(bound_ports)}. '
                "Use an explicit IP (e.g. '127.0.0.1' or '::1') instead of a hostname, "
                'or specify --local-port explicitly.'
            )
        (self.local_port,) = bound_ports

        logger.info(
            'SOCKS5 forwarder listening on %s:%s -> %s:%s',
            self.local_host,
            self.local_port,
            self.remote_host,
            self.remote_port,
        )

    async def stop(self) -> None:
        """Close the listening server, if one is running.

        Does nothing when the forwarder was never started or has already been
        stopped. Otherwise the server is closed, its shutdown is awaited and
        the stored server reference is cleared.
        """
        server = self._server
        if server is None:
            return
        server.close()
        await server.wait_closed()
        self._server = None
        logger.info('SOCKS5 forwarder stopped')

    async def serve_forever(self) -> None:
        """Keep serving until the server is closed (useful for CLI mode).

        Raises:
            RuntimeError: If ``start()`` has not been called yet.
        """
        server = self._server
        if server is None:
            raise RuntimeError('Server not started — call start() first')
        async with server:
            await server.serve_forever()

    async def _handle_client(
        self,
        client_reader: asyncio.StreamReader,
        client_writer: asyncio.StreamWriter,
    ) -> None:
        """Handle one incoming browser connection.

        Steps, in order:

        1. Accept the client's no-auth handshake and read its CONNECT request.
        2. Open a connection to the remote proxy, bounded by
           ``HANDSHAKE_TIMEOUT``.
        3. Perform the remote handshake for the requested destination.
        4. Send ``REPLY_SUCCESS`` to the client.
        5. Pipe data in both directions until both pipes have finished.

        Failures are logged and, where a reply is still meaningful, reported
        to the client with a SOCKS5 reply code. Cancellation is re-raised.
        Both writers are closed on every exit path.
        """
        # Stays None until the remote connection exists, so ``finally`` only
        # closes a remote writer that was actually opened.
        remote_writer: asyncio.StreamWriter | None = None
        try:
            addr_payload, dest_port = await self._accept_local_handshake(
                client_reader,
                client_writer,
            )
            r_reader, r_writer = await asyncio.wait_for(
                asyncio.open_connection(self.remote_host, self.remote_port),
                timeout=HANDSHAKE_TIMEOUT,
            )
            remote_writer = r_writer
            await self._remote_handshake(
                r_reader,
                r_writer,
                addr_payload,
                dest_port,
            )
            await self._send_reply(client_writer, REPLY_SUCCESS)
            await asyncio.gather(
                _pipe(client_reader, r_writer, 'client->remote'),
                _pipe(r_reader, client_writer, 'remote->client'),
            )
        except _HandshakeError as exc:
            logger.warning('Handshake failed: %s', exc)
            # The error itself says whether the client should still get a reply.
            if exc.send_reply:
                with _suppress_closed():
                    await self._send_reply(client_writer, exc.reply_code)
        except asyncio.TimeoutError:
            # Must stay ahead of the OSError clause: on Python 3.11+
            # asyncio.TimeoutError is the builtin TimeoutError, an OSError subclass.
            # NOTE(review): only the connect step is wrapped in wait_for here;
            # whether other awaited helpers can raise a timeout is not visible
            # in this method, but the log message assumes the connect step.
            logger.warning('Connection to remote proxy timed out')
            with _suppress_closed():
                await self._send_reply(client_writer, REPLY_GENERAL_FAILURE)
        except (ConnectionRefusedError, OSError) as exc:
            logger.warning('Connection to remote proxy failed: %s', exc)
            # ConnectionRefusedError is itself an OSError; it is singled out
            # only to choose the more specific reply code.
            reply = (
                REPLY_CONNECTION_REFUSED
                if isinstance(exc, ConnectionRefusedError)
                else REPLY_GENERAL_FAILURE
            )
            with _suppress_closed():
                await self._send_reply(client_writer, reply)
        except asyncio.CancelledError:
            # Listed explicitly so cancellation is never logged as an
            # unexpected error below.
            raise
        except Exception:
            logger.exception('Unexpected error in client handler')
        finally:
            await _close_writer(client_writer)
            if remote_writer is not None:
                await _close_writer(remote_writer)

    async def _accept_local_handshake(
        self,
        reader: asyncio.StreamReader,
        writer: asyncio.StreamWriter,
    ) -> tuple[bytes, int]:
        """Accept the SOCKS5 greeting from Chrome (no-auth) and read the
        CONNECT request.

        Returns ``(addr_payload, dest_port)`` where *addr_payload* is the raw
        SOCKS5 address field (ATYP byte + address bytes) exactly as Chrome
        sent it, ready to be forwarded verbatim to the remote proxy.

        Raises:
            _HandshakeError: If the greeting or request is malformed, the
                client does not offer the no-auth method, or the command is
                not CONNECT. Errors raised during the greeting phase carry
                ``send_reply=False``.
        """
        # Greeting header: version byte followed by the number of offered methods.
        try:
            header = await _read_exact(reader, 2, peer='client')
        except _HandshakeError as exc:
            # Re-raised with send_reply=False so the caller does not answer a
            # greeting failure with a request-style reply.
            raise _HandshakeError(str(exc), send_reply=False) from exc
        version, nmethods = header[0], header[1]
        if version != SOCKS5_VERSION:
            raise _HandshakeError(
                f'Unsupported SOCKS version from client: {version}', send_reply=False
            )

        try:
            methods = await _read_exact(reader, nmethods, peer='client')
        except _HandshakeError as exc:
            raise _HandshakeError(str(exc), send_reply=False) from exc
        if AUTH_NO_AUTH not in methods:
            # The refusal is written here as a method-selection message, which
            # is why the error asks the caller not to send anything further.
            writer.write(bytes([SOCKS5_VERSION, AUTH_NO_ACCEPTABLE]))
            await writer.drain()
            raise _HandshakeError('Client does not offer no-auth method', send_reply=False)

        # Select the no-auth method.
        writer.write(bytes([SOCKS5_VERSION, AUTH_NO_AUTH]))
        await writer.drain()

        # Request header: req[0] version, req[1] command, req[3] address type.
        # req[2] is read but not inspected.
        req = await _read_exact(reader, 4, peer='client')
        if req[0] != SOCKS5_VERSION:
            raise _HandshakeError('Bad SOCKS version in request')
        if req[1] != CMD_CONNECT:
            raise _HandshakeError(
                f'Unsupported command: {req[1]}',
                reply_code=REPLY_COMMAND_NOT_SUPPORTED,
            )

        atyp = req[3]
        addr_payload = await self._read_raw_address(reader, atyp, peer='client')
        # Destination port: two bytes, unsigned, network (big-endian) byte order.
        dest_port = struct.unpack('!H', await _read_exact(reader, 2, peer='client'))[0]
        logger.debug('Client CONNECT to %s port %d', addr_payload.hex(), dest_port)
        return addr_payload, dest_port

    async def _remote_handshake(
        self,
        reader: asyncio.StreamReader,
        writer: asyncio.StreamWriter,
        addr_payload: bytes,
        dest_port: int,
    ) -> None:
        """Negotiate with the remote SOCKS5 proxy and issue the CONNECT request.

        Offers both no-auth and username/password authentication, performs
        the username/password sub-negotiation when the proxy selects it, then
        sends CONNECT and consumes the proxy's reply, including the bound
        address and port that follow the 4-byte reply header.

        Args:
            reader: Stream the remote proxy's responses are read from.
            writer: Stream the requests to the remote proxy are written to.
            addr_payload: Raw ATYP + address bytes from the client, forwarded
                verbatim so the address type is preserved.
            dest_port: Destination port, packed big-endian into the request.

        Raises:
            _HandshakeError: If the proxy answers with a bad version, rejects
                every offered method, selects an unsupported method, rejects
                the credentials, refuses the CONNECT, or if the configured
                credentials do not fit the one-byte length fields.
        """
        greeting = bytes([SOCKS5_VERSION, 0x02, AUTH_NO_AUTH, AUTH_USERNAME_PASSWORD])
        writer.write(greeting)
        await writer.drain()
        logger.debug('-> greeting: %s', greeting.hex())

        resp = await _read_exact(reader, 2, peer='remote proxy')
        logger.debug('<- method selection: %s', resp.hex())

        if resp[0] != SOCKS5_VERSION:
            raise _HandshakeError(f'Remote proxy bad version (response: {resp.hex()})')

        selected_method = resp[1]
        if selected_method == AUTH_NO_ACCEPTABLE:
            raise _HandshakeError('Remote proxy rejected all auth methods')

        if selected_method == AUTH_USERNAME_PASSWORD:
            uname = self.username.encode()
            passwd = self.password.encode()
            # Each length is sent as a single octet; without this guard
            # bytes([len(...)]) would raise a bare ValueError that bypasses
            # the handshake error handling.
            max_field_len = 0xFF
            if len(uname) > max_field_len or len(passwd) > max_field_len:
                raise _HandshakeError(
                    'Proxy credentials exceed the 255-byte SOCKS5 limit '
                    f'(username: {len(uname)} bytes, password: {len(passwd)} bytes)'
                )
            auth_req = bytes([0x01, len(uname)]) + uname + bytes([len(passwd)]) + passwd
            writer.write(auth_req)
            await writer.drain()
            logger.debug('-> auth request: ulen=%d plen=%d', len(uname), len(passwd))

            auth_resp = await _read_exact(reader, 2, peer='remote proxy')
            logger.debug('<- auth response: %s', auth_resp.hex())
            # Only the status byte is checked; 0x00 means success.
            if auth_resp[1] != 0x00:
                raise _HandshakeError(
                    f'Remote proxy authentication failed (status: {auth_resp[1]:#04x})'
                )
        elif selected_method == AUTH_NO_AUTH:
            logger.debug('Remote proxy selected no-auth (0x00)')
        else:
            raise _HandshakeError(
                f'Remote proxy selected unsupported method: {selected_method:#04x}'
            )

        # CONNECT request: VER, CMD, RSV, then the client's address field and port.
        connect_req = bytes([SOCKS5_VERSION, CMD_CONNECT, 0x00])
        connect_req += addr_payload
        connect_req += struct.pack('!H', dest_port)
        writer.write(connect_req)
        await writer.drain()
        logger.debug('-> CONNECT: %s', connect_req.hex())

        reply_header = await _read_exact(reader, 4, peer='remote proxy')
        logger.debug('<- reply header: %s', reply_header.hex())

        rep = reply_header[1]
        if rep != REPLY_SUCCESS:
            # Best effort: grab whatever else the proxy sent so it can be
            # included in the error message; failures here are not fatal.
            extra = b''
            try:
                extra = await asyncio.wait_for(reader.read(256), timeout=0.5)
            except (asyncio.TimeoutError, OSError):
                pass
            raise _HandshakeError(
                f'Remote proxy CONNECT failed '
                f'(rep={rep:#04x}, reply: {reply_header.hex()}, '
                f'extra: {extra.hex() if extra else "none"})',
                reply_code=rep,
            )

        # Drain BND.ADDR and BND.PORT so no reply bytes remain unread.
        atyp = reply_header[3]
        await self._read_raw_address(reader, atyp, peer='remote proxy')
        await _read_exact(reader, 2, peer='remote proxy')

    @staticmethod
    async def _read_raw_address(
        reader: asyncio.StreamReader,
        atyp: int,
        *,
        peer: str = 'peer',
    ) -> bytes:
        """Read one SOCKS5 address field from *reader*.

        The returned bytes start with the ATYP byte, followed by the address
        exactly as received (for domains: the length byte and the name), so
        the result can be forwarded verbatim to another proxy.

        Raises:
            _HandshakeError: If *atyp* is not IPv4, domain, or IPv6.
        """
        if atyp == ATYP_DOMAIN:
            # Domain names are length-prefixed: one size byte, then the name.
            size = await _read_exact(reader, 1, peer=peer)
            name = await _read_exact(reader, size[0], peer=peer)
            return bytes([atyp]) + size + name

        # The remaining supported types have a fixed address width.
        fixed_widths = {ATYP_IPV4: 4, ATYP_IPV6: 16}
        width = fixed_widths.get(atyp)
        if width is None:
            raise _HandshakeError(
                f'Unsupported address type: {atyp}',
                reply_code=REPLY_ADDRESS_TYPE_NOT_SUPPORTED,
            )
        address = await _read_exact(reader, width, peer=peer)
        return bytes([atyp]) + address

    @staticmethod
    async def _send_reply(
        writer: asyncio.StreamWriter,
        reply_code: int,
    ) -> None:
        """Write a minimal SOCKS5 reply carrying *reply_code* and flush it.

        The bound address is always reported as IPv4 with all address and
        port bytes set to zero.
        """
        header = bytes((SOCKS5_VERSION, reply_code, 0x00, ATYP_IPV4))
        # Four zero bytes of address followed by two zero bytes of port.
        zero_bind = b'\x00' * 6
        writer.write(header + zero_bind)
        await writer.drain()


class _HandshakeError(Exception):
    """Signal that a step of a SOCKS5 handshake failed.

    Attributes:
        reply_code: SOCKS5 reply code associated with the failure
            (general failure unless specified).
        send_reply: Flag stored for whoever handles the error; the raising
            sites set it to ``False`` when no SOCKS5 reply should be sent.
    """

    def __init__(
        self,
        message: str,
        reply_code: int = REPLY_GENERAL_FAILURE,
        send_reply: bool = True,
    ) -> None:
        self.send_reply = send_reply
        self.reply_code = reply_code
        super().__init__(message)


async def _read_exact(reader: asyncio.StreamReader, n: int, *, peer: str = 'peer') -> bytes:
    """Return exactly *n* bytes from *reader*, bounded by ``HANDSHAKE_TIMEOUT``.

    Both a timeout and an early end of stream are converted into
    ``_HandshakeError``; *peer* only labels the other side in the message.
    """
    try:
        data = await asyncio.wait_for(reader.readexactly(n), timeout=HANDSHAKE_TIMEOUT)
    except asyncio.TimeoutError as timeout_err:
        raise _HandshakeError(
            f'Timed out reading {n} bytes from {peer}',
        ) from timeout_err
    except asyncio.IncompleteReadError as eof_err:
        received = len(eof_err.partial)
        raise _HandshakeError(
            f'Connection closed prematurely (expected {n} bytes, '
            f'got {received} from {peer})'
        ) from eof_err
    else:
        return data


async def _skip_bnd_address(reader: asyncio.StreamReader, atyp: int, *, peer: str = 'peer') -> None:
    """Consume BND.ADDR + BND.PORT from a SOCKS5 reply.

    Args:
        reader: Stream positioned right after the 4-byte reply header.
        atyp: Address type byte taken from that header.
        peer: Label for the other side, used in error messages.

    Raises:
        _HandshakeError: If *atyp* is not IPv4, domain, or IPv6 (the length
            of the address is then unknown, so the reply cannot be skipped),
            or if the read itself fails.
    """
    port_len = 2
    if atyp == ATYP_IPV4:
        await _read_exact(reader, 4 + port_len, peer=peer)
    elif atyp == ATYP_DOMAIN:
        # Domain addresses are prefixed with a one-byte length.
        length = (await _read_exact(reader, 1, peer=peer))[0]
        await _read_exact(reader, length + port_len, peer=peer)
    elif atyp == ATYP_IPV6:
        await _read_exact(reader, 16 + port_len, peer=peer)
    else:
        # Previously ignored silently, which left the address and port
        # bytes unread at the front of the stream.
        raise _HandshakeError(f'Unsupported address type in reply from {peer}: {atyp}')


async def _main(args: argparse.Namespace) -> None:
    """Run the local forwarder until SIGINT/SIGTERM (or task cancellation).

    Args:
        args: Parsed CLI arguments providing the remote proxy endpoint,
            its credentials, and the local bind host/port.
    """
    forwarder = SOCKS5Forwarder(
        remote_host=args.remote_host,
        remote_port=args.remote_port,
        username=args.username,
        password=args.password,
        local_host=args.local_host,
        local_port=args.local_port,
    )
    await forwarder.start()

    # Everything after a successful start is covered by the finally block so
    # the forwarder is always stopped, even if setup below fails.
    try:
        loop = asyncio.get_running_loop()
        stop = loop.create_future()

        def _request_stop() -> None:
            # A second signal (e.g. Ctrl+C pressed twice) must not call
            # set_result() on an already-finished future.
            if not stop.done():
                stop.set_result(None)

        try:
            for sig in (signal.SIGINT, signal.SIGTERM):
                loop.add_signal_handler(sig, _request_stop)
        except NotImplementedError:
            pass  # Windows / ProactorEventLoop — fall back to KeyboardInterrupt

        # Report the configured bind host rather than assuming loopback.
        logger.info(
            'Forwarding socks5://%s:%s -> socks5://%s:***@%s:%s',
            args.local_host,
            forwarder.local_port,
            args.username,
            args.remote_host,
            args.remote_port,
        )
        logger.info('Press Ctrl+C to stop.')

        await stop
    finally:
        await forwarder.stop()


async def _test_negotiate_auth(
    reader: asyncio.StreamReader,
    writer: asyncio.StreamWriter,
    username: str,
    password: str,
) -> bool:
    """Perform greeting + auth for the --test diagnostic.

    Args:
        reader: Stream connected to the remote proxy.
        writer: Stream connected to the remote proxy.
        username: Username sent if the proxy selects username/password auth.
        password: Password sent if the proxy selects username/password auth.

    Returns:
        True when the proxy accepted no-auth or the supplied credentials;
        False on a bad version byte, rejected or unsupported method,
        rejected credentials, or credentials too long to encode.
    """
    greeting = bytes([SOCKS5_VERSION, 0x02, AUTH_NO_AUTH, AUTH_USERNAME_PASSWORD])
    writer.write(greeting)
    await writer.drain()
    logger.info('-> Greeting:  %s', greeting.hex())

    resp = await asyncio.wait_for(reader.readexactly(2), timeout=10)
    logger.info('<- Method:    %s  (selected method: %#04x)', resp.hex(), resp[1])

    if resp[0] != SOCKS5_VERSION:
        logger.error('Bad version byte: %#04x', resp[0])
        return False

    method = resp[1]
    if method == AUTH_USERNAME_PASSWORD:
        uname = username.encode()
        passwd = password.encode()
        # Lengths travel as single octets; report oversize credentials
        # instead of crashing with ValueError in bytes([...]).
        max_field_len = 0xFF
        if len(uname) > max_field_len or len(passwd) > max_field_len:
            logger.error(
                'Credentials exceed the 255-byte SOCKS5 limit (ulen=%d plen=%d)',
                len(uname),
                len(passwd),
            )
            return False
        auth_req = bytes([0x01, len(uname)]) + uname + bytes([len(passwd)]) + passwd
        writer.write(auth_req)
        await writer.drain()
        logger.info('-> Auth:      ulen=%d plen=%d', len(uname), len(passwd))

        auth_resp = await asyncio.wait_for(reader.readexactly(2), timeout=10)
        logger.info('<- Auth resp: %s  (status: %#04x)', auth_resp.hex(), auth_resp[1])
        if auth_resp[1] != 0x00:
            logger.error('Authentication rejected')
            return False
        logger.info('Authentication succeeded')
    elif method == AUTH_NO_AUTH:
        logger.info('Proxy selected no-auth')
    elif method == AUTH_NO_ACCEPTABLE:
        logger.error('Proxy rejected all auth methods')
        return False
    else:
        # A method that was never offered cannot be completed; previously
        # this case fell through and was reported as success.
        logger.error('Proxy selected unsupported method: %#04x', method)
        return False

    return True


async def _test_connect_and_verify(
    reader: asyncio.StreamReader,
    writer: asyncio.StreamWriter,
) -> bool:
    """Send CONNECT to httpbin.org:80 and verify with an HTTP request.

    Args:
        reader: Stream connected to the (already authenticated) proxy.
        writer: Stream connected to the (already authenticated) proxy.

    Returns:
        True only when the proxy accepted the CONNECT and the first chunk
        read back through the tunnel starts with an HTTP status line;
        False otherwise.
    """
    target = b'httpbin.org'
    connect_req = (
        bytes([SOCKS5_VERSION, CMD_CONNECT, 0x00, ATYP_DOMAIN, len(target)])
        + target
        + struct.pack('!H', 80)
    )
    writer.write(connect_req)
    await writer.drain()
    logger.info('-> CONNECT:   %s  (httpbin.org:80)', connect_req.hex())

    reply = await asyncio.wait_for(reader.readexactly(4), timeout=15)
    logger.info('<- Reply:     %s  (rep: %#04x)', reply.hex(), reply[1])

    if reply[1] != REPLY_SUCCESS:
        # Best effort: capture any trailing bytes to aid diagnosis.
        extra = b''
        try:
            extra = await asyncio.wait_for(reader.read(256), timeout=1)
        except (asyncio.TimeoutError, OSError):
            pass
        logger.error('CONNECT rejected — reply code %#04x', reply[1])
        if extra:
            logger.error('Extra data: %s', extra.hex())
        logger.error(
            'Possible causes: invalid/expired credentials, quota exceeded, '
            'IP not whitelisted, or wrong port'
        )
        return False

    await _skip_bnd_address(reader, reply[3], peer='remote proxy')
    logger.info('CONNECT established')

    http_req = b'GET /ip HTTP/1.1\r\nHost: httpbin.org\r\nConnection: close\r\n\r\n'
    writer.write(http_req)
    await writer.drain()
    logger.info('-> HTTP GET /ip sent')

    http_resp = await asyncio.wait_for(reader.read(4096), timeout=15)
    decoded = http_resp.decode(errors='replace')
    logger.info('<- HTTP response (%d bytes):\n%s', len(http_resp), decoded)

    # read() returns b'' when the tunnel was closed without any data; only
    # claim success when something that looks like HTTP actually came back.
    if not http_resp.startswith(b'HTTP/'):
        logger.error('No valid HTTP response received through the proxy')
        return False

    logger.info('Proxy is fully working!')
    return True


async def _test_proxy(args: argparse.Namespace) -> None:
    """Run the --test diagnostic: talk SOCKS5 to the remote proxy directly.

    Opens a TCP connection to the remote proxy, runs the auth negotiation
    and, if that succeeds, the CONNECT/HTTP check. Every failure is logged
    rather than raised, and the connection is always closed afterwards.
    """
    logger.info('=== SOCKS5 Direct Test: %s:%s ===', args.remote_host, args.remote_port)

    try:
        streams = await asyncio.wait_for(
            asyncio.open_connection(args.remote_host, args.remote_port),
            timeout=HANDSHAKE_TIMEOUT,
        )
    except asyncio.TimeoutError:
        logger.error('TCP connection timed out')
        return
    except OSError as conn_err:
        logger.error('TCP connection failed: %s', conn_err)
        return

    reader, writer = streams
    logger.info('TCP connection established')

    try:
        authenticated = await _test_negotiate_auth(
            reader, writer, args.username, args.password
        )
        # The CONNECT check only makes sense on an authenticated session.
        if authenticated:
            await _test_connect_and_verify(reader, writer)
    except _HandshakeError as handshake_err:
        logger.error('SOCKS5 test failed: %s', handshake_err)
    except asyncio.TimeoutError:
        logger.error('Timed out waiting for proxy response')
    except asyncio.IncompleteReadError as eof_err:
        logger.error('Connection closed prematurely (got %d bytes)', len(eof_err.partial))
    except OSError as net_err:
        logger.error('Network error: %s', net_err)
    finally:
        await _close_writer(writer)


def cli() -> None:
    """Command-line entry point.

    Parses the arguments, configures logging (DEBUG with ``--verbose``,
    INFO otherwise) and runs either the direct proxy test (``--test``) or
    the local forwarder.
    """
    arg_parser = argparse.ArgumentParser(
        description='Local SOCKS5 forwarder for authenticated remote proxies.',
    )
    add = arg_parser.add_argument

    # Remote proxy endpoint and credentials.
    add('--remote-host', required=True, help='Remote SOCKS5 proxy host')
    add('--remote-port', type=int, default=1080, help='Remote SOCKS5 proxy port')
    add('--username', required=True, help='Remote proxy username')
    add('--password', required=True, help='Remote proxy password')

    # Local listener.
    add('--local-host', default='127.0.0.1', help='Local bind address')
    add('--local-port', type=int, default=1081, help='Local bind port (0 = random)')

    # Behaviour switches.
    add('--verbose', '-v', action='store_true', help='Enable debug logging')
    add(
        '--test',
        action='store_true',
        help='Test the remote proxy directly (no local server, no Chrome needed)',
    )
    args = arg_parser.parse_args()

    log_level = logging.DEBUG if args.verbose else logging.INFO
    logging.basicConfig(
        level=log_level,
        format='%(asctime)s [%(levelname)s] %(name)s: %(message)s',
    )

    entry_point = _test_proxy if args.test else _main
    asyncio.run(entry_point(args))


# Run the command-line interface only when this module is executed as a
# script, not when it is imported.
if __name__ == '__main__':
    cli()


================================================
FILE: pydoll/utils/user_agent_parser.py
================================================
import re
from dataclasses import dataclass, field

from pydoll.protocol.emulation.types import UserAgentBrandVersion, UserAgentMetadata

# Four-part version number following the "Chrome/" product token.
_CHROME_RE = re.compile(r'Chrome/(\d+)\.(\d+)\.(\d+)\.(\d+)')
# Four-part version number following the "Edg/" product token.
_EDGE_RE = re.compile(r'Edg/(\d+)\.(\d+)\.(\d+)\.(\d+)')

# Candidate GREASE brand names; one is picked by indexing with the browser's
# major version modulo the list length.
_GREASE_BRANDS = [
    'Not/A)Brand',
    'Not A;Brand',
    'Not.A/Brand',
    'Not)A;Brand',
    'Not=A?Brand',
]

# Major versions at or above this value derive the GREASE version from
# ``major % _GREASE_MODULO``; lower ones use the fixed value 99.
_GREASE_MODULO = 100

_PLATFORM_MAP = {
    'windows': 'Win32',
    'macintosh': 'MacIntel',
    'linux': 'Linux x86_64',
    'android': 'Linux armv81',
    'iphone': 'iPhone',
    'ipad': 'iPad',
    'cros': 'Linux x86_64',
}

_UA_PLATFORM_MAP = {
    'windows': 'Windows',
    'macintosh': 'macOS',
    'linux': 'Linux',
    'android': 'Android',
    'iphone': 'iOS',
    'ipad': 'iOS',
    'cros': 'Chrome OS',
}

_ARCHITECTURE_MAP = {
    'windows': 'x86',
    'macintosh': 'arm',
    'linux': 'x86',
    'android': 'arm',
    'iphone': 'arm',
    'ipad': 'arm',
    'cros': 'x86',
}

_WINDOWS_VERSION_MAP = {
    '6.1': '0.1.0',
    '6.2': '0.2.0',
    '6.3': '0.3.0',
    '10.0': '15.0.0',
}

_DEFAULT_PLATFORM_VERSIONS = {
    'windows': '15.0.0',
    'macintosh': '14.0.0',
    'android': '14.0.0',
    'iphone': '17.0.0',
    'ipad': '17.0.0',
    'linux': '6.1.0',
    'cros': '14541.0.0',
}

_OS_KEYWORDS = [
    ('android', 'android'),
    ('iphone', 'iphone'),
    ('ipad', 'ipad'),
    ('cros', 'cros'),
    ('windows', 'windows'),
    ('macintosh', 'macintosh'),
    ('mac os x', 'macintosh'),
    ('linux', 'linux'),
]

_MOBILE_KEYWORDS = frozenset({'mobile', 'android', 'iphone', 'ipad'})

_VERSION_PATTERNS = {
    'windows': (r'Windows NT (\d+\.\d+)', None),
    'macintosh': (r'Mac OS X (\d+)[_.](\d+)[_.]?(\d+)?', None),
    'android': (r'Android (\d+(?:\.\d+)*)', None),
    'iphone': (r'OS (\d+)[_.](\d+)[_.]?(\d+)?', None),
    'ipad': (r'OS (\d+)[_.](\d+)[_.]?(\d+)?', None),
}


@dataclass
class ParsedUserAgent:
    """Result of parsing a User-Agent string into consistent metadata.

    Instances are produced by ``UserAgentParser.parse``.
    """

    # Platform string looked up from the detected OS (e.g. 'Win32').
    platform: str
    # Vendor string used for the navigator override.
    vendor: str
    # User-Agent with a leading 'Mozilla/' prefix removed, if present.
    app_version: str
    # Structured client-hints metadata built from the User-Agent.
    user_agent_metadata: UserAgentMetadata
    # JavaScript that overrides Navigator.prototype vendor/appVersion;
    # left out of repr() output.
    navigator_override_js: str = field(default='', repr=False)


class UserAgentParser:
    """Stateless parser that extracts consistent metadata from a User-Agent string.

    Given a UA string like:
        Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36
        (KHTML, like Gecko) Chrome/120.0.6099.109 Safari/537.36

    It produces all the metadata needed for CDP Emulation.setUserAgentOverride
    and JavaScript navigator property overrides, ensuring full consistency
    between HTTP headers and JS properties.
    """

    @staticmethod
    def parse(user_agent: str) -> ParsedUserAgent:
        """Parse a User-Agent string into consistent browser metadata.

        Args:
            user_agent: Full User-Agent string.

        Returns:
            ParsedUserAgent with platform, vendor, appVersion,
            userAgentMetadata, and JS override script.
        """
        os_key = UserAgentParser._detect_os_key(user_agent)
        browser_name, major_version, full_version = UserAgentParser._detect_browser(user_agent)
        is_mobile = UserAgentParser._detect_mobile(user_agent)
        metadata = UserAgentParser._build_metadata(
            user_agent, os_key, browser_name, major_version, full_version, is_mobile
        )
        vendor = 'Google Inc.'
        app_version = UserAgentParser._build_app_version(user_agent)

        return ParsedUserAgent(
            platform=_PLATFORM_MAP.get(os_key, 'Win32'),
            vendor=vendor,
            app_version=app_version,
            user_agent_metadata=metadata,
            navigator_override_js=UserAgentParser._build_navigator_override_js(vendor, app_version),
        )

    @staticmethod
    def _build_metadata(
        user_agent: str,
        os_key: str,
        browser_name: str,
        major_version: str,
        full_version: str,
        is_mobile: bool,
    ) -> UserAgentMetadata:
        """Assemble the client-hints metadata from the already-detected parts.

        The device model is only extracted for mobile User-Agents; bitness
        and wow64 are fixed to '64' and False.
        """
        return UserAgentMetadata(
            platform=_UA_PLATFORM_MAP.get(os_key, 'Windows'),
            platformVersion=UserAgentParser._get_platform_version(user_agent, os_key),
            architecture=_ARCHITECTURE_MAP.get(os_key, 'x86'),
            model=UserAgentParser._extract_model(user_agent) if is_mobile else '',
            mobile=is_mobile,
            brands=UserAgentParser._build_brands(browser_name, major_version),
            fullVersionList=UserAgentParser._build_full_version_list(browser_name, full_version),
            bitness='64',
            wow64=False,
        )

    @staticmethod
    def _detect_os_key(user_agent: str) -> str:
        """Return the OS key of the first keyword found in the UA.

        Matching is a case-insensitive substring test in ``_OS_KEYWORDS``
        order; 'windows' is returned when nothing matches.
        """
        ua_lower = user_agent.lower()
        for keyword, os_key in _OS_KEYWORDS:
            if keyword in ua_lower:
                return os_key
        return 'windows'

    @staticmethod
    def _detect_browser(user_agent: str) -> tuple[str, str, str]:
        """Return ``(brand name, major version, full version)``.

        Edge is checked before Chrome because a UA carrying an ``Edg/`` token
        is reported as Edge even when it also has a ``Chrome/`` token. Falls
        back to Google Chrome 120 when neither token is present.
        """
        edge_match = _EDGE_RE.search(user_agent)
        if edge_match:
            return 'Microsoft Edge', edge_match.group(1), '.'.join(edge_match.groups())

        chrome_match = _CHROME_RE.search(user_agent)
        if chrome_match:
            return (
                'Google Chrome',
                chrome_match.group(1),
                '.'.join(chrome_match.groups()),
            )

        return 'Google Chrome', '120', '120.0.0.0'

    @staticmethod
    def _detect_mobile(user_agent: str) -> bool:
        """Return True if the UA contains any mobile keyword (case-insensitive)."""
        ua_lower = user_agent.lower()
        return any(keyword in ua_lower for keyword in _MOBILE_KEYWORDS)

    @staticmethod
    def _build_app_version(user_agent: str) -> str:
        """Return the UA without its leading 'Mozilla/' prefix, if present."""
        return user_agent.removeprefix('Mozilla/')

    @staticmethod
    def _get_platform_version(user_agent: str, os_key: str) -> str:
        """Extract the platform version for *os_key* from the UA.

        Falls back to the per-OS default (or '0.0.0' for an unknown key)
        when the UA carries no recognisable version.
        """
        default = _DEFAULT_PLATFORM_VERSIONS.get(os_key, '0.0.0')

        if os_key == 'windows':
            return UserAgentParser._parse_windows_version(user_agent, default)

        if os_key in {'macintosh', 'iphone', 'ipad'}:
            pattern = _VERSION_PATTERNS[os_key][0]
            return UserAgentParser._parse_dotted_version(user_agent, pattern, default)

        if os_key == 'android':
            match = re.search(r'Android (\d+(?:\.\d+)*)', user_agent)
            return match.group(1) if match else default

        return default

    @staticmethod
    def _parse_windows_version(user_agent: str, default: str) -> str:
        """Map the 'Windows NT x.y' token to a platform version.

        Returns *default* when the token is missing and '15.0.0' when the
        NT version is not in ``_WINDOWS_VERSION_MAP``.
        """
        match = re.search(r'Windows NT (\d+\.\d+)', user_agent)
        if not match:
            return default
        return _WINDOWS_VERSION_MAP.get(match.group(1), '15.0.0')

    @staticmethod
    def _parse_dotted_version(user_agent: str, pattern: str, default: str) -> str:
        """Build 'major.minor.patch' from a three-group *pattern* match.

        A missing patch group becomes '0'; *default* is returned when the
        pattern does not match at all.
        """
        match = re.search(pattern, user_agent)
        if not match:
            return default
        major = match.group(1)
        minor = match.group(2)
        patch = match.group(3) or '0'
        return f'{major}.{minor}.{patch}'

    @staticmethod
    def _build_grease(major_int: int) -> tuple[str, str, str]:
        """Build GREASE brand, short version, and full version."""
        brand = _GREASE_BRANDS[major_int % len(_GREASE_BRANDS)]
        if major_int >= _GREASE_MODULO:
            short_ver = str(major_int % _GREASE_MODULO)
        else:
            short_ver = '99'
        # The full version is always the short one padded with zeros.
        return brand, short_ver, f'{short_ver}.0.0.0'

    @staticmethod
    def _build_brands(browser_name: str, major_version: str) -> list[UserAgentBrandVersion]:
        """Return the brand list (GREASE, Chromium, browser) with major versions."""
        major_int = int(major_version) if major_version.isdigit() else 120
        grease_brand, grease_version, _ = UserAgentParser._build_grease(major_int)

        brands: list[UserAgentBrandVersion] = [
            UserAgentBrandVersion(brand=grease_brand, version=grease_version),
            UserAgentBrandVersion(brand='Chromium', version=major_version),
        ]

        if browser_name in {'Google Chrome', 'Microsoft Edge'}:
            brands.append(UserAgentBrandVersion(brand=browser_name, version=major_version))

        return brands

    @staticmethod
    def _build_full_version_list(
        browser_name: str, full_version: str
    ) -> list[UserAgentBrandVersion]:
        """Return the brand list (GREASE, Chromium, browser) with full versions."""
        # split() yields the whole string when there is no dot, so no
        # separate branch is needed for dot-less versions.
        major = full_version.split('.')[0]
        major_int = int(major) if major.isdigit() else 120
        grease_brand, _, grease_full_version = UserAgentParser._build_grease(major_int)

        versions: list[UserAgentBrandVersion] = [
            UserAgentBrandVersion(brand=grease_brand, version=grease_full_version),
            UserAgentBrandVersion(brand='Chromium', version=full_version),
        ]

        if browser_name in {'Google Chrome', 'Microsoft Edge'}:
            versions.append(UserAgentBrandVersion(brand=browser_name, version=full_version))

        return versions

    @staticmethod
    def _extract_model(user_agent: str) -> str:
        """Return the device model preceding 'Build/' in the UA, or ''.

        The model is the text between the last ';' before 'Build/' and the
        'Build/' token itself. Any character except ';' and parentheses is
        accepted so that hyphenated models such as 'SM-G991B' are found.
        """
        match = re.search(r';\s*([^;()]+?)\s*Build/', user_agent)
        if match:
            return match.group(1).strip()
        return ''

    @staticmethod
    def _escape_js_string(value: str) -> str:
        """Escape *value* for use inside a single-quoted JavaScript string."""
        # Backslashes first, otherwise the escapes added below would be
        # escaped a second time.
        return (
            value
            .replace('\\', '\\\\')
            .replace("'", "\\'")
            .replace('\n', '\\n')
            .replace('\r', '\\r')
        )

    @staticmethod
    def _build_navigator_override_js(vendor: str, app_version: str) -> str:
        """Return JS overriding Navigator.prototype 'vendor' and 'appVersion'.

        Both values are escaped identically (backslash, single quote, line
        breaks) so that neither can terminate the generated string literal.
        """
        safe_vendor = UserAgentParser._escape_js_string(vendor)
        safe_app_version = UserAgentParser._escape_js_string(app_version)
        return (
            "Object.defineProperty(Navigator.prototype, 'vendor', "
            f"{{get: () => '{safe_vendor}'}});\n"
            "Object.defineProperty(Navigator.prototype, 'appVersion', "
            f"{{get: () => '{safe_app_version}'}});"
        )


================================================
FILE: pyproject.toml
================================================
[tool.poetry]
name = "pydoll-python"
version = "2.21.3"
description = "Pydoll is a library for automating chromium-based browsers without a WebDriver, offering realistic interactions."
authors = ["Thalison Fernandes <thalissfernandes99@gmail.com>"]
readme = "README.md"
packages = [
    {include = "pydoll"}
]
include = ["pydoll/py.typed"]

[tool.poetry.dependencies]
python = "^3.10"
websockets = "^14"
aiohttp = "^3.9.5"
aiofiles = "^25.1.0"
typing_extensions = "^4.14.0"


[tool.poetry.group.dev.dependencies]
ruff = "^0.7.1"
pytest = "^8.3.3"
taskipy = "^1.14.0"
pytest-asyncio = "^0.24.0"
pytest-cov = "^6.0.0"
aioresponses = "^0.7.7"
mkdocs = "^1.6.1"
mkdocs-material = "^9.6.11"
pymdown-extensions = "^10.14.3"
mkdocstrings = {extras = ["python"], version = "^0.29.1"}
griffe-typingdoc = "^0.2.8"
mkdocs-static-i18n = "^1.3.0"

[build-system]
requires = ["poetry-core"]
build-backend = "poetry.core.masonry.api"

[tool.ruff]
line-length = 100
target-version = "py310"


[tool.ruff.lint]
preview = true
select = ['I', 'F', 'E', 'W', 'PL', 'PT']
ignore = ['PLR0913', 'PLR0917', 'PLR0904', 'E701']
exclude = ['tests', 'tests/*']

[tool.ruff.format]
preview = true
quote-style = 'single'
docstring-code-format = true
docstring-code-line-length = 79
exclude = ['tests', 'tests/*']

[tool.pytest.ini_options]
pythonpath = "."
addopts = '-p no:warnings'

[tool.taskipy.tasks]
lint = 'ruff check .; ruff check . --diff'
format = 'ruff check . --fix; ruff format .'
test = 'pytest -s -x --cov=pydoll -vv'
post_test = 'coverage html'

[tool.mypy]
exclude = [
    "tests/",
]


================================================
FILE: tests/conftest.py
================================================
"""Shared pytest fixtures for all tests."""

import pytest

from pydoll.browser.options import ChromiumOptions as Options


@pytest.fixture
def ci_chrome_options():
    """Return headless Chromium options tuned for CI runs."""
    ci_flags = (
        # CI-specific arguments - essentials only
        '--no-sandbox',
        '--disable-dev-shm-usage',
        '--disable-gpu',
        '--disable-extensions',
        '--disable-background-timer-throttling',
        '--disable-backgrounding-occluded-windows',
        '--disable-renderer-backgrounding',
        '--disable-default-apps',
        # Memory optimization
        '--memory-pressure-off',
        '--max_old_space_size=4096',
    )

    chrome_options = Options()
    chrome_options.headless = True
    chrome_options.start_timeout = 60  # Increased timeout for CI

    for flag in ci_flags:
        chrome_options.add_argument(flag)

    return chrome_options


================================================
FILE: tests/pages/oopif/oopif_content.html
================================================
<!DOCTYPE html>
<html lang="en">
<head>
    <meta charset="UTF-8">
    <title>OOPIF Content</title>
    <style>
        body { font-family: sans-serif; padding: 10px; }
        .click-counter { color: green; font-weight: bold; }
    </style>
</head>
<body>
    <h1 id="oopif-heading">Cross-Origin Content</h1>
    <p id="oopif-text">Content from different origin</p>

    <button id="oopif-btn">OOPIF Button</button>
    <span id="oopif-btn-count" class="click-counter">0</span>

    <!-- Nested iframe (same origin as this content page) -->
    <iframe id="nested-iframe" src="oopif_nested.html"
            style="width:600px;height:200px;border:1px solid #666;"></iframe>

    <!-- Shadow root with elements and a nested iframe -->
    <div id="shadow-host"></div>

    <script>
        // Click counter: each click on #oopif-btn increments a private
        // counter and writes it into #oopif-btn-count.
        (function() {
            var count = 0;
            document.getElementById('oopif-btn').addEventListener('click', function() {
                count++;
                document.getElementById('oopif-btn-count').textContent = String(count);
            });
        })();

        // Shadow root containing text, button, and a nested iframe.
        // The root is attached in 'open' mode to #shadow-host.
        (function() {
            var host = document.getElementById('shadow-host');
            var shadow = host.attachShadow({ mode: 'open' });
            shadow.innerHTML = [
                '<p id="shadow-text">Shadow content inside OOPIF</p>',
                '<button id="shadow-btn">Shadow Button</button>',
                '<span id="shadow-btn-count" class="click-counter">0</span>',
                '<iframe id="shadow-iframe" src="oopif_shadow_iframe.html" ',
                'style="width:500px;height:150px;border:1px solid #999;"></iframe>',
            ].join('');

            // Separate counter for the button inside the shadow root.
            var count = 0;
            shadow.getElementById('shadow-btn').addEventListener('click', function() {
                count++;
                shadow.getElementById('shadow-btn-count').textContent = String(count);
            });
        })();
    </script>
</body>
</html>


================================================
FILE: tests/pages/oopif/oopif_main.html
================================================
<!DOCTYPE html>
<html lang="en">
<head>
    <meta charset="UTF-8">
    <title>OOPIF Test - Main Page</title>
</head>
<body>
    <h1 id="main-heading">Main Page</h1>
    <iframe id="cross-origin-iframe" style="width:800px;height:600px;border:1px solid #ccc;"></iframe>
    <script>
        // Read the target port from the page's "port" query parameter.
        var port = new URLSearchParams(location.search).get('port');
        // Only when a port was supplied, point the iframe at
        // oopif_content.html served from 127.0.0.1 on that port.
        if (port) {
            document.getElementById('cross-origin-iframe').src =
                'http://127.0.0.1:' + port + '/oopif_content.html';
        }
    </script>
</body>
</html>


================================================
FILE: tests/pages/oopif/oopif_nested.html
================================================
<!DOCTYPE html>
<html lang="en">
<head>
    <meta charset="UTF-8">
    <title>Nested Iframe Content</title>
</head>
<body>
    <h2 id="nested-heading">Nested Iframe Content</h2>
    <p id="nested-text">Nested inside OOPIF</p>
    <input id="nested-input" type="text" placeholder="Type here">
</body>
</html>


================================================
FILE: tests/pages/oopif/oopif_shadow_iframe.html
================================================
<!DOCTYPE html>
<html lang="en">
<head>
    <meta charset="UTF-8">
    <title>Shadow Iframe Content</title>
</head>
<body>
    <h2 id="shadow-iframe-heading">Shadow Iframe Content</h2>
    <p id="shadow-iframe-text">Inside iframe within shadow root in OOPIF</p>
    <input id="shadow-iframe-input" type="text" placeholder="Type in shadow iframe">
</body>
</html>


================================================
FILE: tests/pages/shadow_dom_test.html
================================================
<!DOCTYPE html>
<html lang="en">
<head>
    <meta charset="UTF-8">
    <title>Shadow DOM Test Page</title>
</head>
<body>
    <h1>Shadow DOM Test</h1>

    <div id="open-host"></div>
    <div id="closed-host"></div>
    <div id="nested-host"></div>

    <script>
        // Open shadow root attached to #open-host, holding a paragraph,
        // a button and an email input.
        const openHost = document.getElementById('open-host');
        const openShadow = openHost.attachShadow({ mode: 'open' });
        openShadow.innerHTML = `
            <style>p { color: blue; }</style>
            <p class="open-text">Open shadow content</p>
            <button id="open-btn" class="shadow-btn">Open Button</button>
            <input type="email" name="open-email" placeholder="open email">
        `;

        // Closed shadow root attached to #closed-host, holding a paragraph,
        // a button and a password input.
        const closedHost = document.getElementById('closed-host');
        const closedShadow = closedHost.attachShadow({ mode: 'closed' });
        closedShadow.innerHTML = `
            <style>p { color: red; }</style>
            <p class="closed-text">Closed shadow content</p>
            <button id="closed-btn" class="shadow-btn">Closed Button</button>
            <input type="password" name="closed-pass" placeholder="closed password">
        `;

        // Nested: outer open -> inner component with closed shadow.
        // #inner-host lives inside the outer shadow root and gets its own
        // closed shadow root.
        const nestedHost = document.getElementById('nested-host');
        const outerShadow = nestedHost.attachShadow({ mode: 'open' });
        outerShadow.innerHTML = `
            <p class="outer-text">Outer shadow</p>
            <div id="inner-host"></div>
        `;
        const innerHost = outerShadow.getElementById('inner-host');
        const innerShadow = innerHost.attachShadow({ mode: 'closed' });
        innerShadow.innerHTML = `
            <p class="inner-text">Inner closed shadow</p>
            <button id="deep-btn">Deep Button</button>
        `;
    </script>
</body>
</html>


================================================
FILE: tests/pages/test_children.html
================================================
<!DOCTYPE html>
<html lang="en">
<head>
    <meta charset="UTF-8">
    <meta name="viewport" content="width=device-width, initial-scale=1.0">
    <title>Test Children Elements</title>
</head>
<body>
    <div id="parent-element">
        <div id="child1" class="child">Child 1</div>
        <span id="child2" class="child">Child 2</span>
        <p id="child3" class="child">Child 3</p>
        <a href="#link1" id="link1" class="link">Link 1</a>
        <a href="#link2" id="link2" class="link">Link 2</a>
        <div id="nested-parent">
            <div id="nested-child1">Nested Child 1</div>
            <span id="nested-child2">Nested Child 2</span>
            <a href="#nested-link" id="nested-link">Nested Link</a>
        </div>
    </div>
    
    <div id="another-parent">
        <button id="button1">Button 1</button>
        <input id="input1" type="text" value="test">
        <a href="#another-link" id="another-link">Another Link</a>
    </div>
</body>
</html>


================================================
FILE: tests/pages/test_click_nested.html
================================================
<!DOCTYPE html>
<html lang="en">
<head>
    <meta charset="UTF-8">
    <title>Nested Click Test Page</title>
    <style>
        body { font-family: sans-serif; padding: 20px; }
        .click-counter { color: green; font-weight: bold; }
        .section { margin: 20px 0; padding: 10px; border: 1px solid #ccc; }
    </style>
</head>
<body>
    <h1 id="main-heading">Nested Click Test</h1>

    <!-- Section 1: Regular button with click counter -->
    <div class="section">
        <h2>Regular Element</h2>
        <button id="regular-btn">Regular Button</button>
        <span id="regular-btn-count" class="click-counter">0</span>
    </div>

    <!-- Section 2: Shadow root with button -->
    <div class="section">
        <h2>Shadow Root Element</h2>
        <div id="shadow-host"></div>
    </div>

    <!-- Section 3: Iframe with elements -->
    <div class="section">
        <h2>Iframe Element</h2>
        <iframe id="test-iframe" src="test_click_nested_iframe_content.html"
                style="width: 600px; height: 300px; border: 1px solid #999;"></iframe>
    </div>

    <!-- Section 4: Nested shadow roots -->
    <div class="section">
        <h2>Nested Shadow Roots</h2>
        <div id="nested-shadow-host"></div>
    </div>

    <script>
        // Regular button: every click bumps a private counter and mirrors it into #regular-btn-count
        (function() {
            var clicks = 0;
            var button = document.getElementById('regular-btn');

            function recordClick() {
                clicks += 1;
                var label = document.getElementById('regular-btn-count');
                label.textContent = String(clicks);
            }

            button.addEventListener('click', recordClick);
        })();

        // Open shadow root on #shadow-host containing a button and its own click counter
        (function() {
            var shadowRoot = document.getElementById('shadow-host').attachShadow({ mode: 'open' });

            // Markup is assembled by plain concatenation, so no whitespace is inserted between nodes
            var markup =
                '<style>.shadow-btn { padding: 8px 16px; cursor: pointer; }</style>' +
                '<p class="shadow-text">Content inside shadow root</p>' +
                '<button id="shadow-btn" class="shadow-btn">Shadow Button</button>' +
                '<span id="shadow-btn-count" class="click-counter">0</span>';
            shadowRoot.innerHTML = markup;

            var clicks = 0;

            function recordClick() {
                clicks += 1;
                shadowRoot.getElementById('shadow-btn-count').textContent = String(clicks);
            }

            shadowRoot.getElementById('shadow-btn').addEventListener('click', recordClick);
        })();

        // Nested shadow roots: an open outer root hosts #inner-shadow-host, which carries a
        // closed inner root containing the counted button
        (function() {
            var outerRoot = document.getElementById('nested-shadow-host').attachShadow({ mode: 'open' });
            outerRoot.innerHTML =
                '<p class="outer-text">Outer shadow content</p>' +
                '<div id="inner-shadow-host"></div>';

            var innerRoot = outerRoot.getElementById('inner-shadow-host').attachShadow({ mode: 'closed' });
            innerRoot.innerHTML =
                '<style>.deep-btn { padding: 8px 16px; cursor: pointer; }</style>' +
                '<p class="inner-text">Inner shadow content</p>' +
                '<button id="deep-btn" class="deep-btn">Deep Nested Button</button>' +
                '<span id="deep-btn-count" class="click-counter">0</span>';

            var clicks = 0;

            function recordClick() {
                clicks += 1;
                innerRoot.getElementById('deep-btn-count').textContent = String(clicks);
            }

            innerRoot.getElementById('deep-btn').addEventListener('click', recordClick);
        })();
    </script>
</body>
</html>


================================================
FILE: tests/pages/test_click_nested_iframe_content.html
================================================
<!DOCTYPE html>
<html lang="en">
<head>
    <meta charset="UTF-8">
    <title>Iframe Content with Shadow DOM</title>
    <style>
        body { font-family: sans-serif; padding: 10px; }
        .click-counter { color: green; font-weight: bold; }
    </style>
</head>
<body>
    <h2 id="iframe-heading">Iframe Content</h2>

    <button id="iframe-btn">Iframe Button</button>
    <span id="iframe-btn-count" class="click-counter">0</span>

    <div id="shadow-host-in-iframe"></div>

    <script>
        // Iframe button: each click increments a private counter shown in #iframe-btn-count
        (function() {
            var clicks = 0;
            var button = document.getElementById('iframe-btn');

            function recordClick() {
                clicks += 1;
                var label = document.getElementById('iframe-btn-count');
                label.textContent = String(clicks);
            }

            button.addEventListener('click', recordClick);
        })();

        // Open shadow root attached to #shadow-host-in-iframe.
        // `host` and `shadow` are deliberately script-level vars: the click-counter code
        // further down in this script reads `shadow`.
        var host = document.getElementById('shadow-host-in-iframe');
        var shadow = host.attachShadow({ mode: 'open' });
        shadow.innerHTML =
            '<style>.shadow-btn { padding: 8px 16px; cursor: pointer; }</style>' +
            '<p class="shadow-text">Shadow content inside iframe</p>' +
            '<button id="shadow-btn-in-iframe" class="shadow-btn">Shadow Button in Iframe</button>' +
            '<span id="shadow-btn-count" class="click-counter">0</span>';

        // Shadow button inside the iframe: clicks are counted privately and shown in the
        // shadow-scoped #shadow-btn-count element
        (function() {
            var clicks = 0;

            function recordClick() {
                clicks += 1;
                shadow.getElementById('shadow-btn-count').textContent = String(clicks);
            }

            shadow.getElementById('shadow-btn-in-iframe').addEventListener('click', recordClick);
        })();
    </script>
</body>
</html>


================================================
FILE: tests/pages/test_core_simple.html
================================================
<!DOCTYPE html>
<html lang="en">
<head>
    <meta charset="UTF-8">
    <title>Core Test Page</title>
    <style>
        .item { color: #333; }
        .list-item { margin: 4px 0; }
        #hidden-button { display: none; }
        #deep-section { margin-top: 16px; }
        #click-area { margin: 12px 0; }
        #btn-1 { padding: 6px 10px; cursor: pointer; }
        #simple-select { margin-top: 8px; }
    </style>
    <script>
        // Once the DOM is parsed, wire #btn-1 so each click increments the number shown in #btn-1-count
        document.addEventListener('DOMContentLoaded', function(){
            var clicks = 0;
            var button = document.getElementById('btn-1');
            var display = document.getElementById('btn-1-count');

            function handleClick(){
                clicks = clicks + 1;
                display.textContent = String(clicks);
            }

            button.addEventListener('click', handleClick);
        });
    </script>
    <!-- Ensure ready -->
</head>
<body>
    <h1 id="main-heading">Core Test Page</h1>

    <div id="content">
        <p id="intro" class="item">This page is used by core integration tests.</p>

        <div id="click-area">
            <button id="btn-1" name="primary-button" class="action-btn">Click Me</button>
            <span id="btn-1-count">0</span>
        </div>

        <form id="form">
            <input id="text-input" name="username" type="text" placeholder="Type your name">
            <textarea id="text-area" name="message" placeholder="Type your message"></textarea>
        </form>

        <div id="list-container">
            <ul id="list">
                <li id="li-1" class="list-item item">Item 1</li>
                <li id="li-2" class="list-item item">Item 2</li>
                <li id="li-3" class="list-item item">Item 3</li>
            </ul>
        </div>

        <div id="deep-section">
            <div id="level1">
                <div id="level2">
                    <div id="level3">
                        <span id="deep-span">Deep nested element</span>
                    </div>
                </div>
            </div>
        </div>

        <div id="select-container">
            <label for="simple-select">Choose:</label>
            <select id="simple-select" name="choices">
                <option value="alpha">Alpha</option>
                <option value="beta">Beta</option>
                <option value="gamma">Gamma</option>
            </select>
        </div>

        <button id="hidden-button" class="action-btn">Hidden</button>
    </div>
</body>
</html>


================================================
FILE: tests/pages/test_frame_content.html
================================================
<!DOCTYPE html>
<html lang="en">
<head>
    <meta charset="UTF-8">
    <title>Frame Content</title>
</head>
<body>
    <h1 id="frame-heading">Frame Content</h1>
    <p id="frame-paragraph">This is content inside a frame.</p>
    <input id="frame-input" type="text" placeholder="Frame input">
    <button id="frame-button">Frame Button</button>
</body>
</html>


================================================
FILE: tests/pages/test_frameset.html
================================================
<!DOCTYPE html>
<html lang="en">
<head>
    <meta charset="UTF-8">
    <title>Test Frameset</title>
</head>
<frameset cols="50%,50%">
    <frame id="left-frame" src="test_frame_content.html" name="leftFrame">
    <frame id="right-frame" src="test_iframe_content.html" name="rightFrame">
</frameset>
</html>


================================================
FILE: tests/pages/test_har_recording.html
================================================
<!DOCTYPE html>
<html lang="en">
<head>
    <meta charset="UTF-8">
    <title>HAR Recording Test Page</title>
    <style>
        body { font-family: sans-serif; margin: 20px; }
        #status { margin-top: 10px; }
        .result { margin: 5px 0; font-family: monospace; font-size: 13px; }
    </style>
</head>
<body>
    <h1 id="heading">HAR Recording Test</h1>
    <div id="status">waiting</div>
    <div id="results"></div>

    <script>
        // The base URL is injected via query param: ?base=http://localhost:PORT
        // `base` is null when the parameter is absent; runRequests() checks for that
        // before issuing any request.
        const params = new URLSearchParams(window.location.search);
        const base = params.get('base');

        // Requests each test endpoint under `base` one after another and appends one result
        // line per request to #results. #status ends as 'done', or as an error message when
        // no base URL was supplied.
        async function runRequests() {
            const resultsBox = document.getElementById('results');
            const statusBox = document.getElementById('status');

            // Append a single `.result` row carrying the given text
            const report = (line) => {
                const row = document.createElement('div');
                row.className = 'result';
                row.textContent = line;
                resultsBox.appendChild(row);
            };

            if (!base) {
                statusBox.textContent = 'error: no base URL';
                return;
            }

            const submitOptions = {
                method: 'POST',
                headers: { 'Content-Type': 'application/json' },
                body: JSON.stringify({ key: 'value' })
            };
            const endpoints = [
                { path: '/api/users', label: 'GET /api/users' },
                { path: '/api/data', label: 'GET /api/data' },
                { path: '/api/submit', label: 'POST /api/submit', options: submitOptions }
            ];

            for (const { path, label, options } of endpoints) {
                try {
                    const response = await fetch(base + path, options || {});
                    const bodyText = await response.text();
                    // Only the first 80 characters of the body are shown
                    report(`${label}: ${response.status} - ${bodyText.substring(0, 80)}`);
                } catch (err) {
                    report(`${label}: ERROR - ${err.message}`);
                }
            }

            statusBox.textContent = 'done';
        }

        // Kick off the request sequence once the window's load event fires
        window.addEventListener('load', runRequests);
    </script>
</body>
</html>


================================================
FILE: tests/pages/test_iframe_content.html
================================================
<!DOCTYPE html>
<html lang="en">
<head>
    <meta charset="UTF-8">
    <meta name="viewport" content="width=device-width, initial-scale=1.0">
    <title>Iframe Content</title>
    <style>
        body {
            font-family: Arial, sans-serif;
            padding: 20px;
        }
        .hidden {
            display: none;
        }
    </style>
</head>
<body>
    <h1 id="iframe-heading">Iframe Content</h1>
    
    <div id="iframe-container">
        <p id="iframe-paragraph">This is content inside the iframe.</p>
        
        <form id="iframe-form">
            <label for="iframe-input">Name:</label>
            <input id="iframe-input" type="text" name="name" placeholder="Enter your name">
            
            <label for="iframe-email">Email:</label>
            <input id="iframe-email" type="email" name="email" placeholder="Enter your email">
            
            <label for="iframe-textarea">Message:</label>
            <textarea id="iframe-textarea" name="message" rows="4">Default message</textarea>
            
            <button id="iframe-submit" type="submit">Submit</button>
            <button id="iframe-reset" type="reset">Reset</button>
        </form>
        
        <div id="iframe-links">
            <a href="#link1" id="iframe-link1" class="iframe-link">Link 1</a>
            <a href="#link2" id="iframe-link2" class="iframe-link">Link 2</a>
            <a href="#link3" id="iframe-link3" class="iframe-link">Link 3</a>
        </div>
        
        <div id="iframe-buttons">
            <button id="iframe-button1" class="action-btn">Button 1</button>
            <button id="iframe-button2" class="action-btn">Button 2</button>
            <button id="iframe-button3" class="action-btn hidden">Hidden Button</button>
        </div>
        
        <div id="iframe-list">
            <ul>
                <li id="item1" class="list-item">Item 1</li>
                <li id="item2" class="list-item">Item 2</li>
                <li id="item3" class="list-item">Item 3</li>
            </ul>
        </div>
        
        <select id="iframe-select">
            <option value="option1">Option 1</option>
            <option value="option2" selected>Option 2</option>
            <option value="option3">Option 3</option>
        </select>
        
        <div id="nested-elements">
            <div id="level1">
                <div id="level2">
                    <div id="level3">
                        <span id="deep-span">Deep nested element</span>
                    </div>
                </div>
            </div>
        </div>
    </div>
    
    <script>
        // Submit button: block the real form submission and just log it
        document.getElementById('iframe-submit').addEventListener('click', (event) => {
            event.preventDefault();
            console.log('Form submitted');
        });

        // Every .action-btn logs its own id when clicked (`this` is the clicked button)
        for (const actionButton of document.querySelectorAll('.action-btn')) {
            actionButton.addEventListener('click', function() {
                console.log('Button clicked:', this.id);
            });
        }
    </script>
</body>
</html>


================================================
FILE: tests/pages/test_iframe_nested.html
================================================
<!DOCTYPE html>
<html lang="en">
<head>
    <meta charset="UTF-8">
    <meta name="viewport" content="width=device-width, initial-scale=1.0">
    <title>Test Nested Iframes</title>
</head>
<body>
    <h1 id="main-heading">Main Page with Nested Iframes</h1>
    
    <div id="main-content">
        <p id="main-paragraph">Main page content</p>
        <button id="main-button">Main Button</button>
    </div>
    
    <iframe id="parent-iframe" src="test_iframe_parent_level.html" style="width: 100%; height: 800px;"></iframe>
    
    <div id="after-iframe">
        <p>Content after parent iframe</p>
    </div>
</body>
</html>


================================================
FILE: tests/pages/test_iframe_nested_level.html
================================================
<!DOCTYPE html>
<html lang="en">
<head>
    <meta charset="UTF-8">
    <meta name="viewport" content="width=device-width, initial-scale=1.0">
    <title>Nested Iframe Level</title>
    <style>
        body {
            background-color: #e0e0ff;
            padding: 20px;
        }
    </style>
</head>
<body>
    <h3 id="nested-iframe-heading">Nested Iframe Content</h3>
    
    <div id="nested-iframe-content">
        <p id="nested-paragraph">This is the nested iframe level (child of parent iframe).</p>
        <input id="nested-input" type="text" placeholder="Nested input">
        <button id="nested-button">Nested Button</button>
        
        <div id="nested-links">
            <a href="#nested-link1" id="nested-link1">Nested Link 1</a>
            <a href="#nested-link2" id="nested-link2">Nested Link 2</a>
        </div>
        
        <form id="nested-form">
            <input id="nested-form-input" type="text" name="username" placeholder="Username">
            <input id="nested-form-password" type="password" name="password" placeholder="Password">
            <button id="nested-form-submit" type="submit">Login</button>
        </form>
    </div>
</body>
</html>


================================================
FILE: tests/pages/test_iframe_parent_level.html
================================================
<!DOCTYPE html>
<html lang="en">
<head>
    <meta charset="UTF-8">
    <meta name="viewport" content="width=device-width, initial-scale=1.0">
    <title>Parent Iframe Level</title>
    <style>
        body {
            background-color: #f0f0f0;
            padding: 20px;
        }
    </style>
</head>
<body>
    <h2 id="parent-iframe-heading">Parent Iframe Content</h2>
    
    <div id="parent-iframe-content">
        <p id="parent-paragraph">This is the parent iframe level.</p>
        <input id="parent-input" type="text" placeholder="Parent input">
        <button id="parent-button">Parent Button</button>
    </div>
    
    <div id="nested-iframe-container">
        <h3>Nested Iframe Below:</h3>
        <iframe id="nested-iframe" src="test_iframe_nested_level.html" style="width: 100%; height: 400px;"></iframe>
    </div>
    
    <div id="parent-footer">
        <p>Parent iframe footer</p>
    </div>
</body>
</html>


================================================
FILE: tests/pages/test_iframe_simple.html
================================================
<!DOCTYPE html>
<html lang="en">
<head>
    <meta charset="UTF-8">
    <meta name="viewport" content="width=device-width, initial-scale=1.0">
    <title>Test Simple Iframe</title>
</head>
<body>
    <h1 id="main-heading">Main Page</h1>
    <div id="main-content">
        <p id="main-paragraph">This is the main page content.</p>
        <button id="main-button">Main Button</button>
        <input id="main-input" type="text" placeholder="Main input">
    </div>
    
    <iframe id="simple-iframe" src="test_iframe_content.html" style="width: 800px; height: 600px;"></iframe>
    
    <div id="after-iframe">
        <p>Content after iframe</p>
    </div>
</body>
</html>


================================================
FILE: tests/pages/test_multiple_iframes.html
================================================
<!DOCTYPE html>
<html lang="en">
<head>
    <meta charset="UTF-8">
    <meta name="viewport" content="width=device-width, initial-scale=1.0">
    <title>Multiple Iframes Test</title>
    <style>
        body {
            font-family: Arial, sans-serif;
            padding: 20px;
        }
        .iframe-container {
            margin: 20px 0;
            border: 2px solid #333;
            padding: 10px;
        }
        h1, h2 {
            color: #333;
        }
        iframe {
            border: 1px solid #999;
        }
    </style>
</head>
<body>
    <h1 id="main-heading">Multiple Iframes Test Page</h1>
    <p id="main-paragraph">This page contains multiple iframes to test iframe selection.</p>
    
    <div class="iframe-container">
        <h2>First Iframe (Cookie Tracker - should be ignored)</h2>
        <iframe 
            id="cookie-iframe" 
            src="test_iframe_content.html" 
            width="300" 
            height="100"
            data-purpose="cookie-tracking">
        </iframe>
    </div>
    
    <div class="iframe-container">
        <h2>Second Iframe (Login Form - target iframe)</h2>
        <iframe 
            id="login-iframe" 
            src="test_iframe_content.html" 
            width="400" 
            height="300"
            data-purpose="login">
        </iframe>
    </div>
    
    <div class="iframe-container">
        <h2>Third Iframe (Analytics - should be ignored)</h2>
        <iframe 
            id="analytics-iframe" 
            src="test_iframe_content.html" 
            width="300" 
            height="100"
            data-purpose="analytics">
        </iframe>
    </div>
</body>
</html>


================================================
FILE: tests/test_browser/test_browser_base.py
================================================
import asyncio
import base64
from unittest.mock import ANY, AsyncMock, MagicMock, patch

import pytest
import pytest_asyncio

from pydoll import exceptions
from pydoll.browser.chromium.chrome import Chrome
from pydoll.browser.chromium.base import Browser
from pydoll.browser.managers import (
    ProxyManager,
    ChromiumOptionsManager,
    BrowserProcessManager,
    TempDirectoryManager,
)
from pydoll.browser.options import ChromiumOptions as Options
from pydoll.browser.tab import Tab
from pydoll.commands import (
    BrowserCommands,
    FetchCommands,
    RuntimeCommands,
    StorageCommands,
    TargetCommands,
)
from pydoll.protocol.fetch.events import FetchEvent
from pydoll.connection.connection_handler import ConnectionHandler
from pydoll.exceptions import (
    MissingTargetOrWebSocket,
    InvalidWebSocketAddress,
)

from pydoll.protocol.network.types import RequestMethod, ErrorReason
from pydoll.protocol.browser.types import DownloadBehavior, PermissionType

class ConcreteBrowser(Browser):
    """``Browser`` subclass for tests that supplies a fixed fake binary location."""

    def _get_default_binary_location(self) -> str:
        """Return a placeholder browser path used by the tests in this module."""
        fake_binary_path = '/fake/path/to/browser'
        return fake_binary_path


@pytest_asyncio.fixture
async def mock_browser():
    """Yield a ``ConcreteBrowser`` whose collaborators are replaced by mocks.

    The process manager, temp-directory manager, proxy manager and connection
    handler attributes are swapped for instances of autospec'd mock classes, so
    tests can assert against the calls recorded on them. All patches stay active
    until the consuming test has finished.
    """
    with (
        patch.multiple(
            Browser,
            _get_default_binary_location=MagicMock(return_value='/fake/path/to/browser'),
        ),
        patch(
            'pydoll.browser.managers.browser_process_manager.BrowserProcessManager',
            autospec=True,
        ) as mock_process_manager,
        patch(
            'pydoll.browser.managers.temp_dir_manager.TempDirectoryManager',
            autospec=True,
        ) as mock_temp_dir_manager,
        patch(
            'pydoll.connection.connection_handler.ConnectionHandler',
            autospec=True,
        ) as mock_conn_handler,
        patch(
            'pydoll.browser.managers.proxy_manager.ProxyManager',
            autospec=True,
        ) as mock_proxy_manager,
    ):
        options = Options()
        # No explicit binary path on the options.
        # NOTE(review): presumably this makes the browser fall back to
        # _get_default_binary_location - confirm against Browser.
        options.binary_location = None

        options_manager = ChromiumOptionsManager(options)
        browser = ConcreteBrowser(options_manager)
        # Wire the mocked collaborators onto the instance explicitly, regardless of
        # what the constructor created.
        browser._browser_process_manager = mock_process_manager.return_value
        browser._temp_directory_manager = mock_temp_dir_manager.return_value
        browser._proxy_manager = mock_proxy_manager.return_value
        browser._connection_handler = mock_conn_handler.return_value
        # AsyncMock makes these attributes awaitable and lets tests use the
        # await-aware assertions (e.g. assert_any_await on execute_command).
        browser._connection_handler.execute_command = AsyncMock()
        browser._connection_handler.register_callback = AsyncMock()

        # create_temp_dir() hands back a named MagicMock instead of a real directory object.
        mock_temp_dir_manager.return_value.create_temp_dir.return_value = MagicMock(name='temp_dir')

        yield browser


@pytest.mark.asyncio
async def test_browser_initialization(mock_browser):
    """The fixture browser exposes correctly typed collaborators and an in-range port."""
    expected_types = (
        ('options', Options),
        ('_proxy_manager', ProxyManager),
        ('_browser_process_manager', BrowserProcessManager),
        ('_temp_directory_manager', TempDirectoryManager),
        ('_connection_handler', ConnectionHandler),
    )
    for attribute_name, expected_type in expected_types:
        assert isinstance(getattr(mock_browser, attribute_name), expected_type)

    allowed_ports = range(9223, 9323)
    assert mock_browser._connection_port in allowed_ports


@pytest.mark.asyncio
async def test_start_browser_success(mock_browser):
    """``start()`` returns a ``Tab`` and launches the process with the expected arguments."""
    mock_browser._connection_handler.ping.return_value = True
    mock_browser._get_valid_tab_id = AsyncMock(return_value='page1')

    started_tab = await mock_browser.start()
    assert isinstance(started_tab, Tab)

    launch_process = mock_browser._browser_process_manager.start_browser_process
    launch_process.assert_called_once_with(
        '/fake/path/to/browser',
        mock_browser._connection_port,
        mock_browser.options.arguments,
    )

    # The user-data-dir flag must be present among the options' arguments.
    arguments_text = str(mock_browser.options.arguments)
    assert '--user-data-dir=' in arguments_text, 'Temporary directory not configured'


@pytest.mark.asyncio
async def test_start_browser_failure(mock_browser):
    """``start()`` raises ``FailedToStartBrowser`` when the connection ping stays False."""
    mock_browser._connection_handler.ping.return_value = False

    # asyncio.sleep inside the browser module is stubbed out for the duration of start().
    sleep_stub = AsyncMock()
    sleep_stub.return_value = False
    with (
        patch('pydoll.browser.chromium.base.asyncio.sleep', sleep_stub),
        pytest.raises(exceptions.FailedToStartBrowser),
    ):
        await mock_browser.start()


@pytest.mark.asyncio
async def test_start_browser_failure_with_start_timeout(mock_browser):
    """``start()`` fails when the browser only becomes reachable after ``start_timeout``.

    The fake launch flips ``browser_launched`` after 2 seconds while
    ``start_timeout`` is 1 second, so ``ping`` keeps answering False for the
    whole timeout window.
    """
    browser_launched = False
    # The event loop keeps only weak references to tasks; hold strong ones so the
    # delayed launch cannot be garbage-collected mid-flight and can be cleaned up.
    background_tasks = []

    async def launch_browser_later():
        nonlocal browser_launched
        await asyncio.sleep(2)
        browser_launched = True

    def start_browser_process_side_effect(*args, **kwargs):
        background_tasks.append(asyncio.create_task(launch_browser_later()))

    async def ping_side_effect():
        return browser_launched

    mock_browser.options.start_timeout = 1
    mock_browser._get_valid_tab_id = AsyncMock(return_value='page1')
    mock_browser._browser_process_manager.start_browser_process.side_effect = (
        start_browser_process_side_effect
    )
    mock_browser._connection_handler.ping = AsyncMock(side_effect=ping_side_effect)

    try:
        with pytest.raises(exceptions.FailedToStartBrowser):
            await mock_browser.start()
    finally:
        # The launch task is still sleeping when start() gives up; cancel it so it
        # does not outlive the test as a pending task.
        for task in background_tasks:
            task.cancel()
        await asyncio.gather(*background_tasks, return_exceptions=True)


@pytest.mark.asyncio
async def test_start_browser_success_with_start_timeout(mock_browser):
    """``start()`` succeeds when the browser becomes reachable within ``start_timeout``.

    The fake launch flips ``browser_launched`` after 2 seconds and
    ``start_timeout`` is 3 seconds, so ``ping`` starts answering True before the
    timeout expires.
    """
    browser_launched = False
    # The event loop keeps only weak references to tasks; without a strong reference
    # the delayed launch could be garbage-collected before it flips the flag.
    background_tasks = []

    async def launch_browser_later():
        nonlocal browser_launched
        await asyncio.sleep(2)
        browser_launched = True

    def start_browser_process_side_effect(*args, **kwargs):
        background_tasks.append(asyncio.create_task(launch_browser_later()))

    async def ping_side_effect():
        return browser_launched

    mock_browser.options.start_timeout = 3
    mock_browser._get_valid_tab_id = AsyncMock(return_value='page1')
    mock_browser._browser_process_manager.start_browser_process.side_effect = (
        start_browser_process_side_effect
    )
    mock_browser._connection_handler.ping = AsyncMock(side_effect=ping_side_effect)

    try:
        await mock_browser.start()
    finally:
        # Make sure no launch task survives the test, even if start() failed early.
        for task in background_tasks:
            task.cancel()
        await asyncio.gather(*background_tasks, return_exceptions=True)


@pytest.mark.asyncio
async def test_proxy_configuration(mock_browser):
    """With proxy credentials present, ``start()`` enables Fetch and registers auth callbacks."""
    credentials_lookup = MagicMock(return_value=(True, ('user', 'pass')))
    mock_browser._proxy_manager.get_proxy_credentials = credentials_lookup
    mock_browser._get_valid_tab_id = AsyncMock(return_value='page1')

    await mock_browser.start()

    handler = mock_browser._connection_handler
    expected_enable = FetchCommands.enable(handle_auth_requests=True, resource_type=None)
    handler.execute_command.assert_any_call(expected_enable)

    # Both Fetch events must have been registered with the third argument set to True.
    for fetch_event in (FetchEvent.REQUEST_PAUSED, FetchEvent.AUTH_REQUIRED):
        handler.register_callback.assert_any_call(fetch_event, ANY, True)


@pytest.mark.asyncio
async def test_new_tab(mock_browser):
    """``new_tab()`` returns a ``Tab`` carrying the target id from the command response."""
    command_response = {'result': {'targetId': 'new_page'}}
    mock_browser._connection_handler.execute_command.return_value = command_response

    created_tab = await mock_browser.new_tab()

    assert created_tab._target_id == 'new_page'
    assert isinstance(created_tab, Tab)


@pytest.mark.asyncio
async def test_connect_with_ws_address_returns_tab_and_sets_handler_ws(mock_browser):
    """``connect()`` stores the browser ws address and returns a ``Tab`` on the page ws URL."""
    browser_ws_url = 'ws://localhost:9222/devtools/browser/abcdef'
    page_target = {'type': 'page', 'url': 'https://example', 'targetId': 'p1'}
    mock_browser.get_targets = AsyncMock(return_value=[page_target])
    mock_browser._get_valid_tab_id = AsyncMock(return_value='p1')
    mock_browser._connection_handler._ensure_active_connection = AsyncMock()

    connected_tab = await mock_browser.connect(browser_ws_url)

    handler = mock_browser._connection_handler
    assert mock_browser._ws_address == browser_ws_url
    assert handler._ws_address == browser_ws_url
    handler._ensure_active_connection.assert_awaited_once()

    # The page-level address swaps the browser path for /devtools/page/<target id>.
    assert isinstance(connected_tab, Tab)
    assert connected_tab._ws_address == 'ws://localhost:9222/devtools/page/p1'


@pytest.mark.asyncio
async def test_connect_with_ws_address_preserves_token_in_tab_ws(mock_browser):
    """A ``?token=`` query on the browser ws address is carried over to the tab's ws URL."""
    browser_ws_url = 'ws://localhost:9222/devtools/browser/abcdef?token=secrettoken'
    page_target = {'type': 'page', 'url': 'https://example', 'targetId': 'p1'}
    mock_browser.get_targets = AsyncMock(return_value=[page_target])
    mock_browser._get_valid_tab_id = AsyncMock(return_value='p1')
    mock_browser._connection_handler._ensure_active_connection = AsyncMock()

    connected_tab = await mock_browser.connect(browser_ws_url)

    handler = mock_browser._connection_handler
    assert mock_browser._ws_address == browser_ws_url
    assert handler._ws_address == browser_ws_url
    handler._ensure_active_connection.assert_awaited_once()

    # The query string must survive the rewrite to the page-level URL.
    assert isinstance(connected_tab, Tab)
    assert connected_tab._ws_address == 'ws://localhost:9222/devtools/page/p1?token=secrettoken'


@pytest.mark.asyncio
async def test_new_tab_uses_ws_base_when_ws_address_present(mock_browser):
    """When the browser has a ws address, ``new_tab()`` builds the tab's ws URL from it."""
    # Pretend the browser was attached through a websocket address.
    mock_browser._ws_address = 'ws://127.0.0.1:9222/devtools/browser/xyz'
    command_response = {'result': {'targetId': 'new_page'}}
    mock_browser._connection_handler.execute_command.return_value = command_response

    created_tab = await mock_browser.new_tab()

    assert isinstance(created_tab, Tab)
    assert created_tab._ws_address == 'ws://127.0.0.1:9222/devtools/page/new_page'
    # The target id is still taken from the command response in ws mode.
    assert created_tab._target_id == 'new_page'


@pytest.mark.asyncio
async def test_get_window_id_for_tab_uses_ws_target_when_no_target_id(mock_browser):
    """For a ws-only ``Tab``, the window lookup uses the target id found in the ws URL."""
    page_ws_url = 'ws://localhost:9222/devtools/page/targetXYZ'
    ws_only_tab = Tab(mock_browser, ws_address=page_ws_url)
    handler = mock_browser._connection_handler
    handler.execute_command.return_value = {'result': {'windowId': 'win1'}}

    resolved_window_id = await mock_browser.get_window_id_for_tab(ws_only_tab)

    assert resolved_window_id == 'win1'
    expected_command = BrowserCommands.get_window_for_target('targetXYZ')
    handler.execute_command.assert_called_with(expected_command, timeout=60)


@pytest.mark.asyncio
async def test_cookie_management(mock_browser):
    """Setting, reading and clearing cookies each map to the expected Storage command."""
    cookie_jar = [{'name': 'test', 'value': '123'}]
    handler = mock_browser._connection_handler

    # set_cookies -> Storage.set_cookies without a browser context
    await mock_browser.set_cookies(cookie_jar)
    expected_set = StorageCommands.set_cookies(cookies=cookie_jar, browser_context_id=None)
    handler.execute_command.assert_any_call(expected_set, timeout=60)

    # get_cookies -> returns the list found under result.cookies
    handler.execute_command.return_value = {'result': {'cookies': cookie_jar}}
    fetched_cookies = await mock_browser.get_cookies()
    assert fetched_cookies == cookie_jar

    # delete_all_cookies -> Storage.clear_cookies
    await mock_browser.delete_all_cookies()
    expected_clear = StorageCommands.clear_cookies()
    handler.execute_command.assert_any_await(expected_clear, timeout=60)


@pytest.mark.asyncio
async def test_event_registration(mock_browser):
    """``on()`` registers through the connection handler and returns its callback id."""
    user_callback = MagicMock()
    register = mock_browser._connection_handler.register_callback
    register.return_value = 123

    returned_id = await mock_browser.on('test_event', user_callback, temporary=True)

    assert returned_id == 123
    # The callback slot is matched with ANY; only the event name and the trailing True are pinned.
    register.assert_called_with('test_event', ANY, True)


@pytest.mark.asyncio
async def test_remove_callback_success(mock_browser):
    """Browser.remove_callback delegates to the connection handler and relays its True result."""
    handler_remove = AsyncMock(return_value=True)
    mock_browser._connection_handler.remove_callback = handler_remove

    outcome = await mock_browser.remove_callback(42)

    handler_remove.assert_called_with(42)
    assert outcome is True


@pytest.mark.asyncio
async def test_remove_callback_false(mock_browser):
    """Browser.remove_callback relays a False result from the connection handler."""
    handler_remove = AsyncMock(return_value=False)
    mock_browser._connection_handler.remove_callback = handler_remove

    outcome = await mock_browser.remove_callback(77)

    handler_remove.assert_called_with(77)
    assert outcome is False


@pytest.mark.asyncio
async def test_window_management(mock_browser):
    """Bounds, maximize and minimize commands are issued for the id given by get_window_id."""
    execute_command = mock_browser._connection_handler.execute_command
    execute_command.return_value = {'result': {'windowId': 'window1'}}
    mock_browser.get_window_id = AsyncMock(return_value='window1')

    # Explicit bounds
    bounds = {'width': 800, 'height': 600}
    await mock_browser.set_window_bounds(bounds)
    expected_bounds_command = BrowserCommands.set_window_bounds('window1', bounds)
    execute_command.assert_any_await(expected_bounds_command, timeout=60)

    # Maximized
    await mock_browser.set_window_maximized()
    expected_maximize_command = BrowserCommands.set_window_maximized('window1')
    execute_command.assert_any_await(expected_maximize_command, timeout=60)

    # Minimized
    await mock_browser.set_window_minimized()
    expected_minimize_command = BrowserCommands.set_window_minimized('window1')
    execute_command.assert_any_await(expected_minimize_command, timeout=60)


@pytest.mark.asyncio
async def test_get_window_id_for_target(mock_browser):
    """The tab returned by start() is resolved to a window id using its target id."""
    mock_browser._connection_handler.ping.return_value = True
    mock_browser._get_valid_tab_id = AsyncMock(return_value='page1')
    started_tab = await mock_browser.start()

    execute_command = mock_browser._connection_handler.execute_command
    execute_command.return_value = {'result': {'windowId': 'page1'}}

    assert await mock_browser.get_window_id_for_tab(started_tab) == 'page1'

    expected_command = BrowserCommands.get_window_for_target('page1')
    execute_command.assert_called_with(expected_command, timeout=60)


@pytest.mark.asyncio
async def test_get_window_id_for_tab_raises_when_no_target_id_and_no_ws(mock_browser):
    """A Tab that has neither a target id nor a ws address cannot be resolved to a window."""
    # Only a connection port is supplied when building this Tab.
    port_only_tab = Tab(mock_browser, connection_port=9222)

    with pytest.raises(MissingTargetOrWebSocket):
        await mock_browser.get_window_id_for_tab(port_only_tab)


def test__validate_ws_address_raises_on_invalid_scheme():
    """An http:// address is rejected by Browser._validate_ws_address."""
    http_address = 'http://localhost:9222/devtools/browser/abc'

    with pytest.raises(InvalidWebSocketAddress):
        Browser._validate_ws_address(http_address)


def test__validate_ws_address_accepts_ws_scheme():
    """A ws:// browser address passes validation without raising."""
    ws_address = 'ws://localhost:9222/devtools/browser/abc'
    Browser._validate_ws_address(ws_address)


def test__validate_ws_address_accepts_wss_scheme():
    """A wss:// browser address passes validation without raising."""
    wss_address = 'wss://connect.browserbase.com/devtools/browser/abc'
    Browser._validate_ws_address(wss_address)


def test__validate_ws_address_raises_on_insufficient_slashes():
    """A ws:// address with nothing after the host is rejected."""
    host_only_address = 'ws://localhost'

    with pytest.raises(InvalidWebSocketAddress):
        Browser._validate_ws_address(host_only_address)


def test__validate_ws_address_raises_on_insufficient_slashes_wss():
    """A wss:// address with nothing after the host is rejected."""
    host_only_address = 'wss://localhost'

    with pytest.raises(InvalidWebSocketAddress):
        Browser._validate_ws_address(host_only_address)


def test__get_tab_ws_address_raises_when_ws_not_set(mock_browser):
    """Building a tab ws address fails when the browser has no ws address of its own."""
    mock_browser._ws_address = None
    tab_id = 'some-tab'

    with pytest.raises(InvalidWebSocketAddress):
        mock_browser._get_tab_ws_address(tab_id)


def test__get_tab_ws_address_preserves_query_and_fragment(mock_browser):
    """The query string and fragment of the browser address carry over to the tab address."""
    mock_browser._ws_address = 'ws://host:9222/devtools/browser/abc?token=XYZ#frag'
    expected_address = 'ws://host:9222/devtools/page/tab1?token=XYZ#frag'

    assert mock_browser._get_tab_ws_address('tab1') == expected_address


def test__get_tab_ws_address_preserves_wss_scheme(mock_browser):
    """A wss:// browser address yields a wss:// tab address with the same query string."""
    mock_browser._ws_address = 'wss://connect.browserbase.com/devtools/browser/abc?token=secret'
    expected_address = 'wss://connect.browserbase.com/devtools/page/tab1?token=secret'

    assert mock_browser._get_tab_ws_address('tab1') == expected_address


@pytest.mark.asyncio
async def test_get_window_id(mock_browser):
    """get_window_id queries the window of the page target reported by get_targets."""
    page_targets = [{'targetId': 'target1', 'type': 'page'}]
    mock_browser.get_targets = AsyncMock(return_value=page_targets)
    execute_command = mock_browser._connection_handler.execute_command
    execute_command.return_value = {'result': {'windowId': 'window1'}}

    assert await mock_browser.get_window_id() == 'window1'

    expected_command = BrowserCommands.get_window_for_target('target1')
    execute_command.assert_called_with(expected_command, timeout=60)


@pytest.mark.asyncio
async def test_stop_browser(mock_browser):
    """stop() sends the close command, stops the process and cleans temp directories."""
    await mock_browser.stop()

    execute_command = mock_browser._connection_handler.execute_command
    execute_command.assert_any_await(BrowserCommands.close(), timeout=60)

    # Each teardown hook must have run exactly once.
    teardown_hooks = (
        mock_browser._browser_process_manager.stop_process,
        mock_browser._temp_directory_manager.cleanup,
    )
    for hook in teardown_hooks:
        hook.assert_called_once()


@pytest.mark.asyncio
async def test_stop_browser_not_running(mock_browser):
    """stop() raises BrowserNotRunning when the connection handler's ping returns False."""
    mock_browser._connection_handler.ping.return_value = False

    # asyncio.sleep in the browser module is swapped for an AsyncMock returning False;
    # presumably this keeps the test from actually waiting (verify against stop()).
    sleep_stub = AsyncMock(return_value=False)
    with patch('pydoll.browser.chromium.base.asyncio.sleep', sleep_stub), pytest.raises(
        exceptions.BrowserNotRunning
    ):
        await mock_browser.stop()


@pytest.mark.asyncio
async def test_context_manager(mock_browser):
    """Leaving the async context stops the process and cleans up temp directories once each."""
    async with mock_browser as entered:
        assert entered == mock_browser

    process_manager = mock_browser._browser_process_manager
    temp_manager = mock_browser._temp_directory_manager
    temp_manager.cleanup.assert_called_once()
    process_manager.stop_process.assert_called_once()


@pytest.mark.asyncio
async def test_enable_events(mock_browser):
    """enable_fetch_events forwards its options to FetchCommands.enable."""
    fetch_options = {'handle_auth_requests': True, 'resource_type': 'XHR'}

    await mock_browser.enable_fetch_events(**fetch_options)

    expected_command = FetchCommands.enable(**fetch_options)
    mock_browser._connection_handler.execute_command.assert_called_with(expected_command)


@pytest.mark.asyncio
async def test_disable_events(mock_browser):
    """disable_fetch_events issues FetchCommands.disable through the connection handler."""
    await mock_browser.disable_fetch_events()

    expected_command = FetchCommands.disable()
    mock_browser._connection_handler.execute_command.assert_called_with(expected_command)


@pytest.mark.asyncio
async def test__continue_request_callback(mock_browser):
    """The callback continues the request named by the event's requestId."""
    paused_event = {'params': {'requestId': 'request1'}}

    await mock_browser._continue_request_callback(paused_event)

    expected_command = FetchCommands.continue_request('request1')
    mock_browser._connection_handler.execute_command.assert_called_with(
        expected_command, timeout=60
    )


@pytest.mark.asyncio
async def test__continue_request_auth_required_callback(mock_browser):
    """The auth callback answers with the proxy credentials and then disables fetch events."""
    auth_event = {'params': {'requestId': 'request1'}}

    await mock_browser._continue_request_with_auth_callback(
        event=auth_event, proxy_username='user', proxy_password='pass'
    )

    execute_command = mock_browser._connection_handler.execute_command
    credentials_command = FetchCommands.continue_request_with_auth(
        'request1', 'ProvideCredentials', 'user', 'pass'
    )
    execute_command.assert_any_call(credentials_command, timeout=60)
    execute_command.assert_any_call(FetchCommands.disable())


def test__is_valid_tab(mock_browser):
    """A 'page' target showing the new-tab URL counts as a valid tab."""
    page_target = {'type': 'page', 'url': 'chrome://newtab/'}

    assert mock_browser._is_valid_tab(page_target) is True


def test__is_valid_tab_not_a_tab(mock_browser):
    """A target whose type is 'tab' rather than 'page' is not a valid tab."""
    non_page_target = {'type': 'tab', 'url': 'chrome://newtab/'}

    assert mock_browser._is_valid_tab(non_page_target) is False


@pytest.mark.parametrize(
    'os_name, expected_browser_paths, mock_return_value',
    [
        (
            'Windows',
            [
                r'C:\Program Files\Google\Chrome\Application\chrome.exe',
                r'C:\Program Files (x86)\Google\Chrome\Application\chrome.exe',
            ],
            r'C:\Program Files\Google\Chrome\Application\chrome.exe',
        ),
        (
            'Linux',
            ['/usr/bin/google-chrome', '/usr/bin/google-chrome-stable'],
            '/usr/bin/google-chrome',
        ),
        (
            'Darwin',
            ['/Applications/Google Chrome.app/Contents/MacOS/Google Chrome'],
            '/Applications/Google Chrome.app/Contents/MacOS/Google Chrome',
        ),
    ],
)
@patch('pydoll.browser.chromium.chrome.validate_browser_paths')
@patch('platform.system')
def test__get_default_binary_location(
    mock_platform_system,
    mock_validate_browser_paths,
    os_name,
    expected_browser_paths,
    mock_return_value,
):
    """Each supported OS hands its candidate Chrome paths to validate_browser_paths.

    The value returned by the (patched) validator is what
    Chrome._get_default_binary_location must return.
    """
    mock_validate_browser_paths.return_value = mock_return_value
    mock_platform_system.return_value = os_name

    resolved_path = Chrome._get_default_binary_location()

    assert resolved_path == mock_return_value
    mock_validate_browser_paths.assert_called_once_with(expected_browser_paths)


def test__get_default_binary_location_unsupported_os():
    """An unknown platform name makes the lookup raise UnsupportedOS naming that platform."""
    fake_platform = patch('platform.system', return_value='SomethingElse')
    expect_failure = pytest.raises(exceptions.UnsupportedOS, match='Unsupported OS: SomethingElse')

    with fake_platform, expect_failure:
        Chrome._get_default_binary_location()


@patch('platform.system')
def test__get_default_binary_location_throws_exception_if_os_not_supported(
    mock_platform_system,
):
    """With platform.system reporting 'FreeBSD', the lookup raises UnsupportedOS."""
    mock_platform_system.return_value = 'FreeBSD'
    expected_message = 'Unsupported OS: FreeBSD'

    with pytest.raises(exceptions.UnsupportedOS, match=expected_message):
        Chrome._get_default_binary_location()


@pytest.mark.asyncio
async def test_create_browser_context(mock_browser):
    """create_browser_context returns the new context id, with and without proxy options."""
    execute = AsyncMock(return_value={'result': {'browserContextId': 'context1'}})
    mock_browser._execute_command = execute

    # Plain context, no arguments
    assert await mock_browser.create_browser_context() == 'context1'
    execute.assert_called_with(TargetCommands.create_browser_context())

    # Context with proxy settings (no credentials in the URL)
    execute.return_value = {'result': {'browserContextId': 'context2'}}
    proxy_options = {
        'proxy_server': 'http://proxy.example.com:8080',
        'proxy_bypass_list': 'localhost',
    }
    assert await mock_browser.create_browser_context(**proxy_options) == 'context2'
    execute.assert_called_with(TargetCommands.create_browser_context(**proxy_options))


@pytest.mark.asyncio
async def test_create_browser_context_with_private_proxy_sanitizes_and_stores_auth(mock_browser):
    """Proxy credentials are removed from the CDP command and kept per context instead."""
    execute = AsyncMock(return_value={'result': {'browserContextId': 'ctx1'}})
    mock_browser._execute_command = execute

    created_id = await mock_browser.create_browser_context(
        proxy_server='http://user:pass@proxy.example.com:8080',
        proxy_bypass_list='localhost',
    )
    assert created_id == 'ctx1'

    # The command sent to CDP carries the proxy URL without user:pass.
    sanitized_command = TargetCommands.create_browser_context(
        proxy_server='http://proxy.example.com:8080', proxy_bypass_list='localhost'
    )
    execute.assert_called_with(sanitized_command)

    # The stripped credentials are stored under the new context id.
    assert mock_browser._context_proxy_auth['ctx1'] == ('user', 'pass')


@pytest.mark.asyncio
async def test_create_browser_context_with_private_proxy_no_scheme_sanitizes_and_stores_auth(
    mock_browser,
):
    """A scheme-less proxy with credentials is sent as http:// and its credentials stored."""
    execute = AsyncMock(return_value={'result': {'browserContextId': 'ctx2'}})
    mock_browser._execute_command = execute

    # No scheme in the input; the expected command below uses http://
    created_id = await mock_browser.create_browser_context(proxy_server='user:pwd@host.local:9000')
    assert created_id == 'ctx2'

    sanitized_command = TargetCommands.create_browser_context(
        proxy_server='http://host.local:9000', proxy_bypass_list=None
    )
    execute.assert_called_with(sanitized_command)
    assert mock_browser._context_proxy_auth['ctx2'] == ('user', 'pwd')


@pytest.mark.parametrize(
    'input_proxy, expected_sanitized, expected_creds',
    [
        ('username:password@host:8080', 'http://host:8080', ('username', 'password')),
        ('http://username:password@host:8080', 'http://host:8080', ('username', 'password')),
        ('socks5://user:pass@10.0.0.1:1080', 'socks5://10.0.0.1:1080', ('user', 'pass')),
        ('user@host:3128', 'http://host:3128', ('user', '')),
        ('http://user@host:8080', 'http://host:8080', ('user', '')),
        ('host:3128', 'http://host:3128', None),
    ],
)
def test__sanitize_proxy_and_extract_auth_variants(input_proxy, expected_sanitized, expected_creds):
    """Each proxy string splits into a credential-free URL plus the extracted credentials."""
    clean_url, credentials = Browser._sanitize_proxy_and_extract_auth(input_proxy)

    assert (clean_url, credentials) == (expected_sanitized, expected_creds)


@pytest.mark.asyncio
@patch('pydoll.browser.chromium.base.Tab')
async def test_new_tab_sets_up_context_proxy_auth_handlers(MockTab, mock_browser):
    """A tab opened in a context with stored proxy credentials gets fetch auth handlers."""
    from functools import partial as _partial

    from pydoll.protocol.fetch.events import FetchEvent as FE

    # Credentials stored for the context the tab will be opened in
    context_id = 'ctx-auth'
    mock_browser._context_proxy_auth[context_id] = ('u1', 'p1')

    # Response the mocked connection gives for target creation
    mock_browser._connection_handler.execute_command.return_value = {
        'result': {'targetId': 'new_page_ctx'}
    }

    # Stand-in Tab whose async methods record their awaits
    fake_tab = MagicMock(enable_fetch_events=AsyncMock(), on=AsyncMock())
    MockTab.return_value = fake_tab

    tab = await mock_browser.new_tab(browser_context_id=context_id)

    # Fetch events are enabled exactly once, with auth handling turned on
    fake_tab.enable_fetch_events.assert_awaited_once()
    assert fake_tab.enable_fetch_events.await_args.kwargs.get('handle_auth') is True

    registrations = fake_tab.on.await_args_list

    # A temporary handler for paused requests is registered
    temporary_paused = [
        call
        for call in registrations
        if call.args[0] == FE.REQUEST_PAUSED and call.kwargs.get('temporary') is True
    ]
    assert temporary_paused

    # Exactly one auth-required handler, a partial bound to the credentials and the tab
    auth_calls = [call for call in registrations if call.args[0] == FE.AUTH_REQUIRED]
    assert len(auth_calls) == 1
    auth_callback = auth_calls[0].args[1]
    assert isinstance(auth_callback, _partial)
    bound_kwargs = auth_callback.keywords
    assert bound_kwargs.get('proxy_username') == 'u1'
    assert bound_kwargs.get('proxy_password') == 'p1'
    assert bound_kwargs.get('tab') is fake_tab

    # new_tab hands back the object produced by the patched Tab class
    assert tab is fake_tab


@pytest.mark.asyncio
@patch('pydoll.browser.chromium.base.Tab')
async def test_new_tab_without_context_proxy_auth_does_not_setup_handlers(MockTab, mock_browser):
    """A tab opened in a context without stored credentials gets no fetch handlers."""
    context_id = 'ctx-no-auth'
    # Make sure nothing is stored for this context.
    mock_browser._context_proxy_auth.pop(context_id, None)

    execute_command = mock_browser._connection_handler.execute_command
    execute_command.return_value = {'result': {'targetId': 'new_page2'}}

    fake_tab = MagicMock(enable_fetch_events=AsyncMock(), on=AsyncMock())
    MockTab.return_value = fake_tab

    await mock_browser.new_tab(browser_context_id=context_id)

    for untouched in (fake_tab.enable_fetch_events, fake_tab.on):
        untouched.assert_not_called()


@pytest.mark.asyncio
async def test_delete_browser_context(mock_browser):
    """delete_browser_context issues a dispose command for the given context id."""
    execute = AsyncMock()
    mock_browser._execute_command = execute

    await mock_browser.delete_browser_context('context1')

    execute.assert_called_with(TargetCommands.dispose_browser_context('context1'))


@pytest.mark.asyncio
async def test_get_browser_contexts(mock_browser):
    """get_browser_contexts returns the id list found in the command result."""
    execute = AsyncMock(return_value={'result': {'browserContextIds': ['context1', 'context2']}})
    mock_browser._execute_command = execute

    assert await mock_browser.get_browser_contexts() == ['context1', 'context2']

    execute.assert_called_with(TargetCommands.get_browser_contexts())


@pytest.mark.asyncio
async def test_set_download_behavior(mock_browser):
    """set_download_behavior forwards its arguments, with no browser context id, to CDP."""
    await mock_browser.set_download_behavior(
        behavior=DownloadBehavior.ALLOW, download_path='/downloads', events_enabled=True
    )

    expected_command = BrowserCommands.set_download_behavior(
        behavior=DownloadBehavior.ALLOW,
        download_path='/downloads',
        browser_context_id=None,
        events_enabled=True,
    )
    mock_browser._connection_handler.execute_command.assert_called_with(
        expected_command, timeout=60
    )


@pytest.mark.asyncio
async def test_set_download_path(mock_browser):
    """set_download_path issues an ALLOW download-behavior command for the given path."""
    execute = AsyncMock()
    mock_browser._execute_command = execute

    await mock_browser.set_download_path(path='/downloads')

    expected_command = BrowserCommands.set_download_behavior(
        behavior=DownloadBehavior.ALLOW,
        download_path='/downloads',
        browser_context_id=None,
    )
    execute.assert_called_with(expected_command)


@pytest.mark.asyncio
async def test_grant_permissions(mock_browser):
    """grant_permissions forwards the permission list and origin with no context id."""
    origin = 'https://example.com'
    permissions = [PermissionType.GEOLOCATION, PermissionType.NOTIFICATIONS]

    await mock_browser.grant_permissions(permissions=permissions, origin=origin)

    expected_command = BrowserCommands.grant_permissions(
        permissions=permissions, origin=origin, browser_context_id=None
    )
    mock_browser._connection_handler.execute_command.assert_called_with(
        expected_command, timeout=60
    )


@pytest.mark.asyncio
async def test_reset_permissions(mock_browser):
    """reset_permissions with no arguments sends the command with browser_context_id=None."""
    await mock_browser.reset_permissions()

    expected_command = BrowserCommands.reset_permissions(browser_context_id=None)
    mock_browser._connection_handler.execute_command.assert_called_with(
        expected_command, timeout=60
    )


@pytest.mark.asyncio
async def test_get_version(mock_browser):
    """get_version exposes the fields of the command result."""
    version_payload = {
        'protocolVersion': '1.3',
        'product': 'Chrome/90.0.4430.93',
        'revision': '@abcdef',
        'userAgent': 'Mozilla/5.0...',
        'jsVersion': '9.0',
    }
    execute_command = mock_browser._connection_handler.execute_command
    execute_command.return_value = {'result': version_payload}

    version = await mock_browser.get_version()

    assert version['protocolVersion'] == '1.3'
    assert version['product'] == 'Chrome/90.0.4430.93'
    execute_command.assert_called_with(BrowserCommands.get_version(), timeout=60)


@pytest.mark.asyncio
async def test_headless_mode(mock_browser):
    """start(headless=True) adds the --headless argument and launches the process once."""
    mock_browser._get_valid_tab_id = AsyncMock(return_value='page1')
    mock_browser._connection_handler.ping.return_value = True

    await mock_browser.start(headless=True)

    launch = mock_browser._browser_process_manager.start_browser_process
    assert '--headless' in mock_browser.options.arguments
    launch.assert_called_once()


@pytest.mark.asyncio
async def test_multiple_tab_handling(mock_browser):
    """Two consecutive new_tab calls yield tabs bound to the two returned target ids."""
    execute_command = mock_browser._connection_handler.execute_command
    # One queued response per new_tab call, consumed in order.
    execute_command.side_effect = [
        {'result': {'targetId': target_id}} for target_id in ('tab1', 'tab2')
    ]

    first_tab = await mock_browser.new_tab()
    second_tab = await mock_browser.new_tab()

    assert first_tab._target_id == 'tab1'
    assert second_tab._target_id == 'tab2'

    # Exactly one command per opened tab reached the connection handler.
    assert len(execute_command.call_args_list) == 2


# New tests for _get_valid_tab_id
@pytest.mark.asyncio
async def test_get_valid_tab_id_success():
    """With several targets present, the first 'page' target in the list is selected."""
    candidates = [
        {'type': 'page', 'url': 'https://example.com', 'targetId': 'valid_tab_1'},
        {'type': 'extension', 'url': 'chrome-extension://abc123', 'targetId': 'ext_1'},
        {'type': 'page', 'url': 'chrome://newtab/', 'targetId': 'valid_tab_2'},
    ]

    assert await Browser._get_valid_tab_id(candidates) == 'valid_tab_1'


@pytest.mark.asyncio
async def test_get_valid_tab_id_no_valid_tabs():
    """NoValidTabFound is raised when no target in the list is a page."""
    non_page_targets = [
        {'type': 'extension', 'url': 'chrome-extension://abc123', 'targetId': 'ext_1'},
        {'type': 'background_page', 'url': 'chrome://background', 'targetId': 'bg_1'},
    ]

    with pytest.raises(exceptions.NoValidTabFound):
        await Browser._get_valid_tab_id(non_page_targets)


@pytest.mark.asyncio
async def test_get_valid_tab_id_empty_targets():
    """NoValidTabFound is raised for an empty target list."""
    no_targets = []

    with pytest.raises(exceptions.NoValidTabFound):
        await Browser._get_valid_tab_id(no_targets)


@pytest.mark.asyncio
async def test_get_valid_tab_id_missing_target_id():
    """A page target lacking 'targetId' raises NoValidTabFound with a dedicated message."""
    page_without_id = {'type': 'page', 'url': 'https://example.com'}
    extension_target = {'type': 'extension', 'url': 'chrome-extension://abc123', 'targetId': 'ext_1'}
    candidates = [page_without_id, extension_target]

    with pytest.raises(exceptions.NoValidTabFound, match='Tab missing targetId'):
        await Browser._get_valid_tab_id(candidates)


@pytest.mark.asyncio
async def test_get_valid_tab_id_filters_extensions():
    """A 'page' target with a chrome-extension:// URL is skipped for the next regular page."""
    candidates = [
        {'type': 'page', 'url': 'chrome-extension://abc123/popup.html', 'targetId': 'ext_page'},
        {'type': 'page', 'url': 'https://example.com', 'targetId': 'valid_tab'},
    ]

    assert await Browser._get_valid_tab_id(candidates) == 'valid_tab'


# Tests for enable_runtime_events and disable_runtime_events
@pytest.mark.asyncio
async def test_enable_runtime_events(mock_browser):
    """enable_runtime_events issues RuntimeCommands.enable through the connection handler."""
    await mock_browser.enable_runtime_events()

    expected_command = RuntimeCommands.enable()
    mock_browser._connection_handler.execute_command.assert_called_with(expected_command)


@pytest.mark.asyncio
async def test_disable_runtime_events(mock_browser):
    """disable_runtime_events issues RuntimeCommands.disable through the connection handler."""
    await mock_browser.disable_runtime_events()

    expected_command = RuntimeCommands.disable()
    mock_browser._connection_handler.execute_command.assert_called_with(expected_command)


@pytest.mark.asyncio
async def test_get_tab_by_target(mock_browser):
    """get_tab_by_target builds a Tab carrying the target id from the given target info."""
    target_info = {'targetId': 'test_target_123', 'type': 'page', 'url': 'https://example.com'}

    resolved_tab = await mock_browser.get_tab_by_target(target_info)

    assert isinstance(resolved_tab, Tab)
    assert resolved_tab._target_id == 'test_target_123'


# Tests for continue_request, fail_request and fulfill_request
@pytest.mark.asyncio
async def test_continue_request(mock_browser):
    """continue_request with only a request id sends every optional field as None."""
    request_id = 'test_request_123'

    await mock_browser.continue_request(request_id)

    expected_command = FetchCommands.continue_request(
        request_id=request_id,
        url=None,
        method=None,
        post_data=None,
        headers=None,
        intercept_response=None,
    )
    mock_browser._connection_handler.execute_command.assert_called_with(
        expected_command, timeout=60
    )


@pytest.mark.asyncio
async def test_continue_request_with_all_params(mock_browser):
    """continue_request forwards every override unchanged to FetchCommands.continue_request."""
    overrides = {
        'request_id': 'test_request_123',
        'url': 'https://modified-example.com',
        'method': RequestMethod.POST,
        'post_data': 'modified_data=test',
        'headers': [{'name': 'Authorization', 'value': 'Bearer token123'}],
        'intercept_response': True,
    }

    await mock_browser.continue_request(**overrides)

    expected_command = FetchCommands.continue_request(**overrides)
    mock_browser._connection_handler.execute_command.assert_called_with(
        expected_command, timeout=60
    )


@pytest.mark.asyncio
async def test_fail_request(mock_browser):
    """fail_request forwards the request id and error reason to FetchCommands.fail_request."""
    request_id, reason = 'test_request_123', ErrorReason.FAILED

    await mock_browser.fail_request(request_id, reason)

    expected_command = FetchCommands.fail_request(request_id, reason)
    mock_browser._connection_handler.execute_command.assert_called_with(
        expected_command, timeout=60
    )


@pytest.mark.asyncio
async def test_fulfill_request(mock_browser):
    """fulfill_request with id and status only sends the remaining fields as None."""
    request_id, status = 'test_request_123', 200

    await mock_browser.fulfill_request(request_id, status)

    expected_command = FetchCommands.fulfill_request(
        request_id=request_id,
        response_code=status,
        response_headers=None,
        body=None,
        response_phrase=None,
    )
    mock_browser._connection_handler.execute_command.assert_called_with(
        expected_command, timeout=60
    )


@pytest.mark.asyncio
async def test_fulfill_request_with_all_params(mock_browser):
    """fulfill_request forwards headers, base64 body and phrase unchanged."""
    json_response = '{"status": "success", "data": "test"}'
    # The body is passed base64-encoded, as text.
    encoded_body = base64.b64encode(json_response.encode('utf-8')).decode('utf-8')
    response_fields = {
        'request_id': 'test_request_123',
        'response_code': 200,
        'response_headers': [{'name': 'Content-Type', 'value': 'application/json'}],
        'body': encoded_body,
        'response_phrase': 'OK',
    }

    await mock_browser.fulfill_request(**response_fields)

    expected_command = FetchCommands.fulfill_request(**response_fields)
    mock_browser._connection_handler.execute_command.assert_called_with(
        expected_command, timeout=60
    )


# Additional test for 'on' with async callback
@pytest.mark.asyncio
async def test_event_registration_with_async_callback(mock_browser):
    """Registering a coroutine function returns the handler's id and stores a callable."""
    register_callback = mock_browser._connection_handler.register_callback
    register_callback.return_value = 456

    async def async_test_callback(event):
        """Coroutine callback used only as a registration argument."""
        return f"Processed event: {event}"

    registered_id = await mock_browser.on(
        'test_async_event', async_test_callback, temporary=False
    )

    assert registered_id == 456
    register_callback.assert_called_with('test_async_event', ANY, False)

    # Whatever was handed to the connection handler in the callback slot must be callable.
    forwarded_callback = register_callback.call_args.args[1]
    assert callable(forwarded_callback)


@pytest.mark.asyncio
async def test_event_registration_sync_callback(mock_browser):
    """Registering a plain function returns the id produced by the connection handler."""
    register_callback = mock_browser._connection_handler.register_callback
    register_callback.return_value = 789

    def sync_test_callback(event):
        """Plain-function callback used only as a registration argument."""
        return f"Processed sync event: {event}"

    registered_id = await mock_browser.on('test_sync_event', sync_test_callback, temporary=True)

    assert registered_id == 789
    register_callback.assert_called_with('test_sync_event', ANY, True)


# Tests for get_opened_tabs method
@pytest.mark.asyncio
async def test_get_opened_tabs_success(mock_browser):
    """get_opened_tabs keeps only regular pages and returns them in reverse target order."""
    extension_popup = {
        'targetId': 'ext1',
        'type': 'page',
        'url': 'chrome-extension://abc123/popup.html',
        'title': 'Extension Popup',
    }
    background_page = {
        'targetId': 'bg1',
        'type': 'background_page',
        'url': 'chrome://background',
        'title': 'Background Page',
    }
    # Three regular pages interleaved with targets that must be dropped.
    reported_targets = [
        {'targetId': 'tab3', 'type': 'page', 'url': 'https://example.com', 'title': 'Example Site'},
        extension_popup,
        {'targetId': 'tab2', 'type': 'page', 'url': 'https://google.com', 'title': 'Google'},
        background_page,
        {'targetId': 'tab1', 'type': 'page', 'url': 'chrome://newtab/', 'title': 'New Tab'},
    ]
    mock_browser.get_targets = AsyncMock(return_value=reported_targets)

    tabs = await mock_browser.get_opened_tabs()

    # The extension popup and the background page are excluded.
    assert len(tabs) == 3
    assert all(isinstance(opened, Tab) for opened in tabs)

    # Ids come back in the reverse of the order reported by get_targets.
    assert [opened._target_id for opened in tabs] == ['tab1', 'tab2', 'tab3']

    mock_browser.get_targets.assert_called_once()


@pytest.mark.asyncio
async def test_get_opened_tabs_no_valid_tabs(mock_browser):
    """get_opened_tabs returns an empty list when no target is a regular page."""
    extension_popup = {
        'targetId': 'ext1',
        'type': 'page',
        'url': 'chrome-extension://abc123/popup.html',
        'title': 'Extension Popup',
    }
    background_page = {
        'targetId': 'bg1',
        'type': 'background_page',
        'url': 'chrome://background',
        'title': 'Background Page',
    }
    service_worker = {
        'targetId': 'worker1',
        'type': 'service_worker',
        'url': 'https://example.com/sw.js',
        'title': 'Service Worker',
    }
    mock_browser.get_targets = AsyncMock(
        return_value=[extension_popup, background_page, service_worker]
    )

    tabs = await mock_browser.get_opened_tabs()

    # Nothing qualifies, so the result is an empty list.
    assert len(tabs) == 0
    assert tabs == []

    mock_browser.get_targets.assert_called_once()


@pytest.mark.asyncio
async def test_get_opened_tabs_empty_targets(mock_browser):
    """get_opened_tabs returns an empty list when get_targets reports nothing."""
    targets_stub = AsyncMock(return_value=[])
    mock_browser.get_targets = targets_stub

    tabs = await mock_browser.get_opened_tabs()

    assert len(tabs) == 0
    assert tabs == []
    targets_stub.assert_called_once()


@pytest.mark.asyncio
async def test_get_opened_tabs_filters_extensions(mock_browser):
    """Test that get_opened_tabs correctly filters out extension pages.

    Two 'page' targets with extension URLs (chrome-extension:// and
    moz-extension://) sit between two regular pages; only the regular
    pages may be returned.
    """
    mock_targets = [
        {'targetId': 'tab1', 'type': 'page', 'url': 'https://example.com', 'title': 'Example Site'},
        {
            'targetId': 'ext1',
            'type': 'page',
            'url': 'chrome-extension://abc123/popup.html',
            'title': 'Extension Popup',
        },
        {
            'targetId': 'ext2',
            'type': 'page',
            'url': 'moz-extension://def456/options.html',
            'title': 'Extension Options',
        },
        {'targetId': 'tab2', 'type': 'page', 'url': 'https://github.com', 'title': 'GitHub'},
    ]

    mock_browser.get_targets = AsyncMock(return_value=mock_targets)

    tabs = await mock_browser.get_opened_tabs()

    # Should return only 2 tabs (excluding extensions)
    assert len(tabs) == 2

    actual_target_ids = [tab._target_id for tab in tabs]

    # Verify neither extension target made it into the results. The check is on
    # the extension targets' own ids: the ids are 'ext1'/'ext2', so looking for
    # the substring 'extension' in an id could never fail.
    extension_target_ids = {'ext1', 'ext2'}
    assert extension_target_ids.isdisjoint(actual_target_ids)

    # Verify correct target IDs (reversed order)
    expected_target_ids = ['tab2', 'tab1']
    assert actual_target_ids == expected_target_ids


@pytest.mark.asyncio
async def test_get_opened_tabs_filters_non_page_types(mock_browser):
    """get_opened_tabs drops worker and browser targets and keeps only 'page' targets."""
    service_worker = {
        'targetId': 'worker1',
        'type': 'service_worker',
        'url': 'https://example.com/sw.js',
        'title': 'Service Worker',
    }
    shared_worker = {
        'targetId': 'shared1',
        'type': 'shared_worker',
        'url': 'https://example.com/shared.js',
        'title': 'Shared Worker',
    }
    browser_target = {'targetId': 'browser1', 'type': 'browser', 'url': '', 'title': 'Browser Process'}
    reported_targets = [
        {'targetId': 'tab1', 'type': 'page', 'url': 'https://example.com', 'title': 'Example Site'},
        service_worker,
        shared_worker,
        browser_target,
        {'targetId': 'tab2', 'type': 'page', 'url': 'https://google.com', 'title': 'Google'},
    ]
    mock_browser.get_targets = AsyncMock(return_value=reported_targets)

    tabs = await mock_browser.get_opened_tabs()

    # Only the two 'page' targets survive, each wrapped in a Tab.
    assert len(tabs) == 2
    assert all(isinstance(opened, Tab) for opened in tabs)

    # Ids come back in the reverse of the order reported by get_targets.
    assert [opened._target_id for opened in tabs] == ['tab2', 'tab1']


@pytest.mark.asyncio
async def test_get_opened_tabs_order_is_reversed(mock_browser):
    """get_opened_tabs must return tabs in the reverse of the reported target order."""
    oldest = {
        'targetId': 'oldest_tab',
        'type': 'page',
        'url': 'https://first.com',
        'title': 'First Tab',
    }
    middle = {
        'targetId': 'middle_tab',
        'type': 'page',
        'url': 'https://second.com',
        'title': 'Second Tab',
    }
    newest = {
        'targetId': 'newest_tab',
        'type': 'page',
        'url': 'https://third.com',
        'title': 'Third Tab',
    }
    mock_browser.get_targets = AsyncMock(return_value=[oldest, middle, newest])

    opened = await mock_browser.get_opened_tabs()

    # The last reported target is expected first in the result.
    returned_ids = [entry._target_id for entry in opened]
    assert returned_ids == ['newest_tab', 'middle_tab', 'oldest_tab']


@pytest.mark.asyncio
async def test_get_opened_tabs_with_mixed_valid_invalid_targets(mock_browser):
    """A mixed target list must be reduced to its regular pages, in reversed order."""
    # Targets expected to survive the filtering.
    valid_tab1 = {
        'targetId': 'valid_tab1',
        'type': 'page',
        'url': 'https://example.com',
        'title': 'Valid Tab 1',
    }
    valid_tab2 = {
        'targetId': 'valid_tab2',
        'type': 'page',
        'url': 'https://github.com',
        'title': 'Valid Tab 2',
    }
    valid_tab3 = {
        'targetId': 'valid_tab3',
        'type': 'page',
        'url': 'chrome://newtab/',
        'title': 'New Tab',
    }
    # Targets expected to be dropped: an extension page and two non-page types.
    extension_page = {
        'targetId': 'extension_page',
        'type': 'page',
        'url': 'chrome-extension://abc123/popup.html',
        'title': 'Extension Page',
    }
    service_worker = {
        'targetId': 'service_worker',
        'type': 'service_worker',
        'url': 'https://example.com/sw.js',
        'title': 'Service Worker',
    }
    background_page = {
        'targetId': 'background_page',
        'type': 'background_page',
        'url': 'chrome://background',
        'title': 'Background',
    }
    reported_targets = [
        valid_tab1,
        extension_page,
        service_worker,
        valid_tab2,
        background_page,
        valid_tab3,
    ]
    mock_browser.get_targets = AsyncMock(return_value=reported_targets)

    opened = await mock_browser.get_opened_tabs()

    # Exactly the three valid pages remain.
    assert len(opened) == 3

    # Filtering and ordering: valid pages only, reversed.
    returned_ids = [entry._target_id for entry in opened]
    assert returned_ids == ['valid_tab3', 'valid_tab2', 'valid_tab1']

    # Every returned object is a Tab.
    assert all(isinstance(entry, Tab) for entry in opened)


@pytest.mark.asyncio
async def test_get_opened_tabs_integration_with_new_tab(mock_browser):
    """A tab created through new_tab must show up in get_opened_tabs afterwards."""
    created_id = 'new_tab_1'

    # Phase 1: the browser reports no targets, so no tabs are listed.
    mock_browser.get_targets = AsyncMock(return_value=[])
    initial_tabs = await mock_browser.get_opened_tabs()
    assert len(initial_tabs) == 0

    # Phase 2: create a tab; the mocked command response carries its target id.
    mock_browser._connection_handler.execute_command.return_value = {
        'result': {'targetId': created_id}
    }
    new_tab = await mock_browser.new_tab()
    assert new_tab._target_id == created_id

    # Phase 3: the target list now contains the freshly created page.
    created_target = {
        'targetId': 'new_tab_1',
        'type': 'page',
        'url': 'https://example.com',
        'title': 'Example',
    }
    mock_browser.get_targets = AsyncMock(return_value=[created_target])

    listed_tabs = await mock_browser.get_opened_tabs()
    assert len(listed_tabs) == 1
    listed = listed_tabs[0]
    assert listed._target_id == created_id

    # Only the ids are compared; the listed Tab need not be the same instance
    # as the one returned by new_tab.
    assert listed._target_id == new_tab._target_id


@pytest.mark.asyncio
async def test_headless_parameter_deprecation_warning(mock_browser):
    """start(headless=True) must emit a DeprecationWarning and still enable headless mode."""
    mock_browser._get_valid_tab_id = AsyncMock(return_value='page1')
    mock_browser._connection_handler.ping.return_value = True

    expected_message = (
        "The 'headless' parameter is deprecated and will be removed in a future version"
    )
    with pytest.warns(DeprecationWarning, match=expected_message):
        await mock_browser.start(headless=True)

    # The deprecated parameter is still honoured on the options object.
    options = mock_browser.options
    assert options.headless is True
    assert '--headless' in options.arguments


# --- User-Agent Override Tests ---


@pytest.mark.asyncio
async def test_get_user_agent_from_options_found(mock_browser):
    """A --user-agent argument on the options is returned without its flag prefix."""
    expected_ua = 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) Chrome/120.0.6099.109'
    mock_browser.options.add_argument(f'--user-agent={expected_ua}')

    assert mock_browser._get_user_agent_from_options() == expected_ua


@pytest.mark.asyncio
async def test_get_user_agent_from_options_not_found(mock_browser):
    """With no --user-agent argument added by the test, the lookup returns None."""
    assert mock_browser._get_user_agent_from_options() is None


@pytest.mark.asyncio
async def test_apply_user_agent_override_no_ua_set(mock_browser):
    """Without a custom user agent, no command may be sent to the tab."""
    execute_stub = AsyncMock()
    tab = MagicMock(spec=Tab)
    tab._execute_command = execute_stub

    await mock_browser._apply_user_agent_override(tab)

    execute_stub.assert_not_called()


@pytest.mark.asyncio
async def test_apply_user_agent_override_with_ua_set(mock_browser):
    """A custom user agent triggers an emulation override followed by a script injection."""
    custom_ua = (
        'Mozilla/5.0 (Windows NT 10.0; Win64; x64) '
        'AppleWebKit/537.36 (KHTML, like Gecko) '
        'Chrome/120.0.6099.109 Safari/537.36'
    )
    mock_browser.options.add_argument(f'--user-agent={custom_ua}')

    execute_stub = AsyncMock()
    tab = MagicMock(spec=Tab)
    tab._execute_command = execute_stub

    await mock_browser._apply_user_agent_override(tab)

    assert execute_stub.call_count == 2
    recorded_calls = execute_stub.call_args_list

    # First command: the user-agent override itself.
    override_command = recorded_calls[0].args[0]
    override_params = override_command['params']
    assert override_command['method'] == 'Emulation.setUserAgentOverride'
    assert override_params['userAgent'] == custom_ua
    assert override_params['platform'] == 'Win32'
    assert 'userAgentMetadata' in override_params

    # Second command: a script registered for every new document.
    script_command = recorded_calls[1].args[0]
    assert script_command['method'] == 'Page.addScriptToEvaluateOnNewDocument'
    script_source = script_command['params']['source']
    assert "Navigator.prototype, 'vendor'" in script_source
    assert "Navigator.prototype, 'appVersion'" in script_source


@pytest.mark.asyncio
async def test_apply_user_agent_override_metadata_consistency(mock_browser):
    """The override metadata must agree with the platform named in the user agent."""
    custom_ua = (
        'Mozilla/5.0 (Macintosh; Intel Mac OS X 10_15_7) '
        'AppleWebKit/537.36 (KHTML, like Gecko) '
        'Chrome/121.0.6167.85 Safari/537.36'
    )
    mock_browser.options.add_argument(f'--user-agent={custom_ua}')

    execute_stub = AsyncMock()
    tab = MagicMock(spec=Tab)
    tab._execute_command = execute_stub

    await mock_browser._apply_user_agent_override(tab)

    # Inspect the parameters of the first command sent to the tab.
    override_params = execute_stub.call_args_list[0].args[0]['params']
    metadata = override_params['userAgentMetadata']

    assert metadata['platform'] == 'macOS'
    assert metadata['mobile'] is False
    assert override_params['platform'] == 'MacIntel'

    brand_names = [entry['brand'] for entry in metadata['brands']]
    assert 'Chromium' in brand_names
    assert 'Google Chrome' in brand_names


@pytest.mark.asyncio
async def test_start_applies_user_agent_override(mock_browser):
    """start() must call _apply_user_agent_override once, with the tab it returns."""
    custom_ua = (
        'Mozilla/5.0 (Windows NT 10.0; Win64; x64) '
        'Chrome/120.0.6099.109 Safari/537.36'
    )
    mock_browser.options.add_argument(f'--user-agent={custom_ua}')

    override_stub = AsyncMock()
    mock_browser._connection_handler.ping.return_value = True
    mock_browser._get_valid_tab_id = AsyncMock(return_value='page1')
    mock_browser._apply_user_agent_override = override_stub

    started_tab = await mock_browser.start()

    override_stub.assert_called_once_with(started_tab)


@pytest.mark.asyncio
async def test_new_tab_applies_user_agent_override(mock_browser):
    """new_tab() must call _apply_user_agent_override once, with the tab it returns."""
    custom_ua = 'Mozilla/5.0 Chrome/120.0.6099.109'
    mock_browser.options.add_argument(f'--user-agent={custom_ua}')

    # The mocked command response supplies the id of the new target.
    command_response = {'result': {'targetId': 'new_tab_1'}}
    mock_browser._connection_handler.execute_command = AsyncMock(return_value=command_response)

    override_stub = AsyncMock()
    mock_browser._apply_user_agent_override = override_stub

    created_tab = await mock_browser.new_tab()

    override_stub.assert_called_once_with(created_tab)


================================================
FILE: tests/test_browser/test_browser_chrome.py
================================================
import json
import os
from unittest.mock import MagicMock, patch

import pytest

from pydoll.browser.chromium.chrome import Chrome
from pydoll.browser.options import ChromiumOptions
from pydoll.exceptions import InvalidBrowserPath, UnsupportedOS, InvalidConnectionPort


class TestChromeInitialization:
    """Tests for Chrome class initialization."""

    @staticmethod
    def _patched_dependencies():
        """Return a context manager that applies the patches shared by these tests.

        The patches are, in order: Chrome._get_default_binary_location
        replaced by a MagicMock returning '/fake/chrome', followed by
        autospec patches of the four manager/handler classes listed below.
        All patches are undone when the returned context manager exits.
        """
        from contextlib import ExitStack

        autospec_targets = (
            'pydoll.browser.managers.browser_process_manager.BrowserProcessManager',
            'pydoll.browser.managers.temp_dir_manager.TempDirectoryManager',
            'pydoll.connection.connection_handler.ConnectionHandler',
            'pydoll.browser.managers.proxy_manager.ProxyManager',
        )
        with ExitStack() as stack:
            stack.enter_context(
                patch.multiple(
                    Chrome,
                    _get_default_binary_location=MagicMock(return_value='/fake/chrome'),
                )
            )
            for target in autospec_targets:
                stack.enter_context(patch(target, autospec=True))
            # Transfer the active patches to a fresh stack owned by the caller;
            # if any patch above fails to start, the ones already started are
            # undone by this inner `with` instead of leaking.
            return stack.pop_all()

    def test_chrome_initialization_default_options(self):
        """Test Chrome initialization with default options."""
        with self._patched_dependencies():
            chrome = Chrome()

            assert isinstance(chrome.options, ChromiumOptions)
            assert chrome._connection_port in range(9223, 9323)

    def test_chrome_initialization_custom_options(self):
        """Test Chrome initialization with custom options."""
        custom_options = ChromiumOptions()
        custom_options.add_argument('--disable-web-security')
        custom_options.binary_location = '/custom/chrome/path'

        with self._patched_dependencies():
            chrome = Chrome(options=custom_options)

            assert chrome.options == custom_options
            assert '--disable-web-security' in chrome.options.arguments
            assert chrome.options.binary_location == '/custom/chrome/path'

    def test_chrome_initialization_custom_port(self):
        """Test Chrome initialization with custom port."""
        custom_port = 9999

        with self._patched_dependencies():
            chrome = Chrome(connection_port=custom_port)

            assert chrome._connection_port == custom_port

    def test_chrome_initialization_both_custom(self):
        """Test Chrome initialization with both custom options and port."""
        custom_options = ChromiumOptions()
        custom_options.add_argument('--headless')
        custom_port = 8888

        with self._patched_dependencies():
            chrome = Chrome(options=custom_options, connection_port=custom_port)

            assert chrome.options == custom_options
            assert chrome._connection_port == custom_port
            assert '--headless' in chrome.options.arguments


class TestChromeDefaultBinaryLocation:
    """Checks how Chrome picks its default binary path for each operating system."""

    @pytest.mark.parametrize(
        'os_name, expected_paths',
        [
            (
                'Windows',
                [
                    r'C:\Program Files\Google\Chrome\Application\chrome.exe',
                    r'C:\Program Files (x86)\Google\Chrome\Application\chrome.exe',
                ]
            ),
            (
                'Linux',
                ['/usr/bin/google-chrome', '/usr/bin/google-chrome-stable']
            ),
            (
                'Darwin',
                ['/Applications/Google Chrome.app/Contents/MacOS/Google Chrome']
            ),
        ],
    )
    @patch('pydoll.browser.chromium.chrome.validate_browser_paths')
    @patch('platform.system')
    def test_get_default_binary_location_success(
        self, mock_platform_system, mock_validate_browser_paths, os_name, expected_paths
    ):
        """Each supported OS hands its candidate path list to validate_browser_paths."""
        # The validator is mocked to pick the first candidate of the list.
        chosen_path = expected_paths[0]
        mock_platform_system.return_value = os_name
        mock_validate_browser_paths.return_value = chosen_path

        located = Chrome._get_default_binary_location()

        assert located == chosen_path
        mock_platform_system.assert_called_once()
        mock_validate_browser_paths.assert_called_once_with(expected_paths)

    def test_get_default_binary_location_unsupported_os(self):
        """An OS name outside the supported set raises UnsupportedOS."""
        with patch('platform.system', return_value='FreeBSD'):
            with pytest.raises(UnsupportedOS, match='Unsupported OS: FreeBSD'):
                Chrome._get_default_binary_location()

    def test_get_default_binary_location_unknown_os(self):
        """An unrecognised OS name raises UnsupportedOS naming that OS."""
        with patch('platform.system', return_value='UnknownOS'):
            with pytest.raises(UnsupportedOS, match='Unsupported OS: UnknownOS'):
                Chrome._get_default_binary_location()

    def test_get_default_binary_location_validation_error(self):
        """An InvalidBrowserPath raised by the path validator propagates to the caller."""
        validation_failure = InvalidBrowserPath('Chrome executable not found')
        system_patch = patch('platform.system', return_value='Linux')
        validator_patch = patch(
            'pydoll.browser.chromium.chrome.validate_browser_paths',
            side_effect=validation_failure,
        )

        with system_patch, validator_patch:
            with pytest.raises(InvalidBrowserPath, match='Chrome executable not found'):
                Chrome._get_default_binary_location()

    @patch('pydoll.browser.chromium.chrome.validate_browser_paths')
    @patch('platform.system')
    def test_get_default_binary_location_windows_fallback(
        self, mock_platform_system, mock_validate_browser_paths
    ):
        """On Windows, the second candidate is returned when the validator selects it."""
        primary_path = r'C:\Program Files\Google\Chrome\Application\chrome.exe'
        fallback_path = r'C:\Program Files (x86)\Google\Chrome\Application\chrome.exe'
        mock_platform_system.return_value = 'Windows'
        mock_validate_browser_paths.return_value = fallback_path

        located = Chrome._get_default_binary_location()

        # Both candidates are offered to the validator, in this order.
        mock_validate_browser_paths.assert_called_once_with([primary_path, fallback_path])
        assert located == fallback_path


class TestChromeOptionsManager:
    """Checks how Chrome exposes the options it was constructed with."""

    def test_options_manager_creation(self):
        """Options passed to Chrome are exposed unchanged through chrome.options."""
        supplied_options = ChromiumOptions()
        supplied_options.add_argument('--no-sandbox')

        # Build every patcher up front, then activate them together.
        binary_patch = patch.multiple(
            Chrome,
            _get_default_binary_location=MagicMock(return_value='/fake/chrome'),
        )
        process_patch = patch(
            'pydoll.browser.managers.browser_process_manager.BrowserProcessManager',
            autospec=True,
        )
        temp_dir_patch = patch(
            'pydoll.browser.managers.temp_dir_manager.TempDirectoryManager',
            autospec=True,
        )
        connection_patch = patch(
            'pydoll.connection.connection_handler.ConnectionHandler',
            autospec=True,
        )
        proxy_patch = patch(
            'pydoll.browser.managers.proxy_manager.ProxyManager',
            autospec=True,
        )

        with binary_patch, process_patch, temp_dir_patch, connection_patch, proxy_patch:
            chrome = Chrome(options=supplied_options)

            # The supplied options object and its argument are both visible.
            assert chrome.options == supplied_options
            assert '--no-sandbox' in chrome.options.arguments

    def test_options_manager_with_none_options(self):
        """Passing options=None still yields a ChromiumOptions instance."""
        binary_patch = patch.multiple(
            Chrome,
            _get_default_binary_location=MagicMock(return_value='/fake/chrome'),
        )
        process_patch = patch(
            'pydoll.browser.managers.browser_process_manager.BrowserProcessManager',
            autospec=True,
        )
        temp_dir_patch = patch(
            'pydoll.browser.managers.temp_dir_manager.TempDirectoryManager',
            autospec=True,
        )
        connection_patch = patch(
            'pydoll.connection.connection_handler.ConnectionHandler',
            autospec=True,
        )
        proxy_patch = patch(
            'pydoll.browser.managers.proxy_manager.ProxyManager',
            autospec=True,
        )

        with binary_patch, process_patch, temp_dir_patch, connection_patch, proxy_patch:
            chrome = Chrome(options=None)

            # A default options object must have been created.
            assert isinstance(chrome.options, ChromiumOptions)


class TestChromeInheritance:
    """Checks the relationship between Chrome and the Browser base class."""

    def test_chrome_inherits_from_browser(self):
        """A Chrome instance is a Browser and exposes start, stop and new_tab."""
        from pydoll.browser.chromium.base import Browser

        # Build every patcher up front, then activate them together.
        binary_patch = patch.multiple(
            Chrome,
            _get_default_binary_location=MagicMock(return_value='/fake/chrome'),
        )
        process_patch = patch(
            'pydoll.browser.managers.browser_process_manager.BrowserProcessManager',
            autospec=True,
        )
        temp_dir_patch = patch(
            'pydoll.browser.managers.temp_dir_manager.TempDirectoryManager',
            autospec=True,
        )
        connection_patch = patch(
            'pydoll.connection.connection_handler.ConnectionHandler',
            autospec=True,
        )
        proxy_patch = patch(
            'pydoll.browser.managers.proxy_manager.ProxyManager',
            autospec=True,
        )

        with binary_patch, process_patch, temp_dir_patch, connection_patch, proxy_patch:
            chrome = Chrome()

            assert isinstance(chrome, Browser)
            for attribute_name in ('start', 'stop', 'new_tab'):
                assert hasattr(chrome, attribute_name)

    def test_chrome_overrides_get_default_binary_location(self):
        """Chrome provides its own callable _get_default_binary_location."""
        from pydoll.browser.chromium.base import Browser

        # The attribute exists on the class and can be called.
        assert hasattr(Chrome, '_get_default_binary_location')
        chrome_locator = Chrome._get_default_binary_location
        assert callable(chrome_locator)

        # It is not the implementation found on the base class.
        assert Chrome._get_default_binary_location != Browser._get_default_binary_location


class TestChromeEdgeCases:
    """Tests for edge cases and special situations."""

    @staticmethod
    def _patched_dependencies():
        """Return a context manager that applies the patches shared by these tests.

        The patches are, in order: Chrome._get_default_binary_location
        replaced by a MagicMock returning '/fake/chrome', followed by
        autospec patches of the four manager/handler classes listed below.
        All patches are undone when the returned context manager exits.
        """
        from contextlib import ExitStack

        autospec_targets = (
            'pydoll.browser.managers.browser_process_manager.BrowserProcessManager',
            'pydoll.browser.managers.temp_dir_manager.TempDirectoryManager',
            'pydoll.connection.connection_handler.ConnectionHandler',
            'pydoll.browser.managers.proxy_manager.ProxyManager',
        )
        with ExitStack() as stack:
            stack.enter_context(
                patch.multiple(
                    Chrome,
                    _get_default_binary_location=MagicMock(return_value='/fake/chrome'),
                )
            )
            for target in autospec_targets:
                stack.enter_context(patch(target, autospec=True))
            # Transfer the active patches to a fresh stack owned by the caller;
            # if any patch above fails to start, the ones already started are
            # undone by this inner `with` instead of leaking.
            return stack.pop_all()

    def test_chrome_with_empty_options(self):
        """Test Chrome with empty options."""
        empty_options = ChromiumOptions()

        with self._patched_dependencies():
            chrome = Chrome(options=empty_options)

            assert chrome.options == empty_options
            # NOTE(review): this comparison is always true for any sized
            # container, so it only verifies that `arguments` supports len().
            # Tighten it once the expected default arguments are known.
            assert len(chrome.options.arguments) >= 0  # May have default arguments

    def test_chrome_with_zero_port(self):
        """Test Chrome with zero port (should generate random port since 0 is falsy)."""
        with self._patched_dependencies():
            chrome = Chrome(connection_port=0)

            # Port 0 is falsy, so should generate a random port
            assert chrome._connection_port in range(9223, 9323)

    def test_chrome_with_negative_port(self):
        """Test Chrome with negative port (should raise InvalidConnectionPort)."""
        with self._patched_dependencies():
            with pytest.raises(InvalidConnectionPort):
                Chrome(connection_port=-1)


class TestChromeIntegration:
    """Integration tests to verify components working together."""

    @staticmethod
    def _patched_dependencies():
        """Return a context manager that applies the patches shared by these tests.

        The patches are, in order: Chrome._get_default_binary_location
        replaced by a MagicMock returning '/fake/chrome', followed by
        autospec patches of the four manager/handler classes listed below.
        All patches are undone when the returned context manager exits.

        NOTE(review): the targets name the modules that define the classes.
        The tests below read real files from the user-data directory, so
        confirm whether Chrome actually resolves the classes through these
        paths or keeps using the real implementations.
        """
        from contextlib import ExitStack

        autospec_targets = (
            'pydoll.browser.managers.browser_process_manager.BrowserProcessManager',
            'pydoll.browser.managers.temp_dir_manager.TempDirectoryManager',
            'pydoll.connection.connection_handler.ConnectionHandler',
            'pydoll.browser.managers.proxy_manager.ProxyManager',
        )
        with ExitStack() as stack:
            stack.enter_context(
                patch.multiple(
                    Chrome,
                    _get_default_binary_location=MagicMock(return_value='/fake/chrome'),
                )
            )
            for target in autospec_targets:
                stack.enter_context(patch(target, autospec=True))
            # Transfer the active patches to a fresh stack owned by the caller;
            # if any patch above fails to start, the ones already started are
            # undone by this inner `with` instead of leaking.
            return stack.pop_all()

    def test_chrome_full_initialization_flow(self):
        """Test complete Chrome initialization flow."""
        custom_options = ChromiumOptions()
        custom_options.add_argument('--disable-gpu')
        custom_options.add_argument('--no-sandbox')
        custom_options.browser_preferences = {
            'download': {'directory_upgrade': True},
        }
        custom_options.set_default_download_directory('/tmp/all')
        custom_options.block_notifications = True
        custom_options.binary_location = '/custom/chrome'
        custom_port = 9876

        with self._patched_dependencies():
            chrome = Chrome(options=custom_options, connection_port=custom_port)
            chrome._setup_user_dir()

            # The preferences file is read back from the first temporary
            # directory tracked by the temp directory manager.
            preferences_path = os.path.join(
                chrome._temp_directory_manager._temp_dirs[0].name, 'Default', 'Preferences'
            )
            with open(preferences_path, 'r', encoding='utf-8') as json_file:
                preferences = json.load(json_file)
            assert preferences == custom_options.browser_preferences

            # Verify correct initialization
            assert chrome.options == custom_options
            assert chrome._connection_port == custom_port
            assert '--disable-gpu' in chrome.options.arguments
            assert '--no-sandbox' in chrome.options.arguments
            assert chrome.options.binary_location == '/custom/chrome'

            # Verify that managers were created
            assert chrome._browser_process_manager is not None
            assert chrome._temp_directory_manager is not None
            assert chrome._connection_handler is not None
            assert chrome._proxy_manager is not None

    def test_chrome_options_initialization_flow(self):
        """Test Chrome options initialization flow."""
        with self._patched_dependencies():
            # Test with None options (should create default options)
            chrome = Chrome(options=None)
            assert isinstance(chrome.options, ChromiumOptions)

            # Test with custom options
            custom_options = ChromiumOptions()
            custom_options.add_argument('--test-arg')
            chrome2 = Chrome(options=custom_options)
            assert chrome2.options == custom_options
            assert '--test-arg' in chrome2.options.arguments

    @pytest.mark.asyncio
    async def test_chrome_user_data_dir_and_preferences(self, tmp_path):
        """Test Chrome with user data directory and preferences.

        An existing Preferences file is merged with the configured browser
        preferences while the browser context is open, a backup of the
        original is written next to it, and the original content is back in
        place once the context has exited.
        """
        user_data_dir = tmp_path / 'chrome_profile'
        user_data_dir.mkdir()

        prefs_dir = user_data_dir / 'Default'
        prefs_dir.mkdir()
        prefs_file = prefs_dir / 'Preferences'

        initial_prefs = {
            'profile': {
                'exit_type': 'Normal',
                'exited_cleanly': True
            },
            'test_pref': 'initial_value'
        }

        prefs_file.write_text(json.dumps(initial_prefs), encoding='utf-8')

        custom_options = ChromiumOptions()
        custom_options.add_argument(f'--user-data-dir={user_data_dir}')
        custom_options.browser_preferences = {
            'test_pref': 'new_value',
            'new_pref': 'some_value'
        }
        custom_options.prompt_for_download = False

        with self._patched_dependencies():
            async with Chrome(options=custom_options) as chrome:
                chrome._setup_user_dir()
                assert f'--user-data-dir={user_data_dir}' in chrome.options.arguments

                # Configured preferences override or extend the existing ones.
                with open(prefs_file, 'r', encoding='utf-8') as f:
                    updated_prefs = json.load(f)
                assert updated_prefs['test_pref'] == 'new_value'
                assert updated_prefs['new_pref'] == 'some_value'

                # Keys that were not overridden are preserved.
                assert updated_prefs['profile']['exit_type'] == 'Normal'
                assert updated_prefs['profile']['exited_cleanly'] is True

                # The original content is kept in a backup file.
                backup_file = user_data_dir / 'Default' / 'Preferences.backup'
                assert backup_file.exists()
                with open(backup_file, 'r', encoding='utf-8') as f:
                    backup_prefs = json.load(f)
                assert backup_prefs == initial_prefs

            # After the browser context exits, the original file is restored.
            with open(prefs_file, 'r', encoding='utf-8') as f:
                final_prefs = json.load(f)
            assert final_prefs == initial_prefs

    @pytest.mark.asyncio
    async def test_chrome_user_data_dir_with_invalid_json_preferences(self, tmp_path):
        """Test Chrome with user data directory containing invalid JSON preferences."""
        user_data_dir = tmp_path / 'chrome_profile'
        user_data_dir.mkdir()

        prefs_dir = user_data_dir / 'Default'
        prefs_dir.mkdir()
        prefs_file = prefs_dir / 'Preferences'

        # Write invalid JSON to the Preferences file; the trailing comma
        # makes it unparseable.
        invalid_json = '{ "profile": { "exit_type": "Normal", "exited_cleanly": true, } }'
        prefs_file.write_text(invalid_json, encoding='utf-8')

        custom_options = ChromiumOptions()
        custom_options.add_argument(f'--user-data-dir={user_data_dir}')
        custom_options.browser_preferences = {
            'test_pref': 'new_value',
            'new_pref': 'some_value'
        }
        custom_options.prompt_for_download = False

        with self._patched_dependencies():
            async with Chrome(options=custom_options) as chrome:
                chrome._setup_user_dir()
                assert f'--user-data-dir={user_data_dir}' in chrome.options.arguments

                # The invalid JSON must not abort the setup: the file is
                # expected to be rewritten as valid JSON containing the new
                # preferences.
                with open(prefs_file, 'r', encoding='utf-8') as f:
                    updated_prefs = json.load(f)
                assert updated_prefs['test_pref'] == 'new_value'
                assert updated_prefs['new_pref'] == 'some_value'

                # The original invalid JSON should be backed up
                backup_file = user_data_dir / 'Default' / 'Preferences.backup'
                assert backup_file.exists()
                with open(backup_file, 'r', encoding='utf-8') as f:
                    backup_content = f.read()
                assert backup_content == invalid_json


================================================
FILE: tests/test_browser/test_browser_edge.py
================================================
import platform
from unittest.mock import MagicMock, patch

import pytest

from pydoll.browser.chromium.edge import Edge
from pydoll.browser.managers import ChromiumOptionsManager
from pydoll.browser.options import ChromiumOptions
from pydoll.exceptions import UnsupportedOS, InvalidBrowserPath, InvalidConnectionPort


class TestEdgeInitialization:
    """Tests for Edge class initialization."""

    @pytest.fixture(autouse=True)
    def _patch_edge_dependencies(self):
        """Apply the patch stack shared by every test in this class.

        ``Edge._get_default_binary_location`` is replaced by a mock returning
        ``'/fake/edge'`` and the process, temp-dir, connection and proxy
        manager classes are patched (autospec) at their defining modules.
        The patches stay active until the test using them has finished.
        """
        with patch.multiple(
            Edge,
            _get_default_binary_location=MagicMock(return_value='/fake/edge'),
        ), patch(
            'pydoll.browser.managers.browser_process_manager.BrowserProcessManager',
            autospec=True,
        ), patch(
            'pydoll.browser.managers.temp_dir_manager.TempDirectoryManager',
            autospec=True,
        ), patch(
            'pydoll.connection.connection_handler.ConnectionHandler',
            autospec=True,
        ), patch(
            'pydoll.browser.managers.proxy_manager.ProxyManager',
            autospec=True,
        ):
            yield

    def test_edge_initialization_default_options(self):
        """Test Edge initialization with default options."""
        edge = Edge()

        assert isinstance(edge.options, ChromiumOptions)
        # Without an explicit port, one is picked from this range.
        assert edge._connection_port in range(9223, 9323)

    def test_edge_initialization_custom_options(self):
        """Test Edge initialization with custom options."""
        custom_options = ChromiumOptions()
        custom_options.add_argument('--disable-web-security')
        custom_options.binary_location = '/custom/edge/path'

        edge = Edge(options=custom_options)

        assert edge.options == custom_options
        assert '--disable-web-security' in edge.options.arguments
        assert edge.options.binary_location == '/custom/edge/path'

    def test_edge_initialization_custom_port(self):
        """Test Edge initialization with custom port."""
        custom_port = 9999

        edge = Edge(connection_port=custom_port)

        assert edge._connection_port == custom_port

    def test_edge_initialization_both_custom(self):
        """Test Edge initialization with both custom options and port."""
        custom_options = ChromiumOptions()
        custom_options.add_argument('--headless')
        custom_port = 8888

        edge = Edge(options=custom_options, connection_port=custom_port)

        assert edge.options == custom_options
        assert edge._connection_port == custom_port
        assert '--headless' in edge.options.arguments


class TestEdgeDefaultBinaryLocation:
    """Checks how Edge resolves its default executable per operating system."""

    @pytest.mark.parametrize(
        'os_name, expected_paths',
        [
            (
                'Windows',
                [
                    r'C:\Program Files\Microsoft\Edge\Application\msedge.exe',
                    r'C:\Program Files (x86)\Microsoft\Edge\Application\msedge.exe',
                ]
            ),
            (
                'Linux',
                ['/usr/bin/microsoft-edge']
            ),
            (
                'Darwin',
                ['/Applications/Microsoft Edge.app/Contents/MacOS/Microsoft Edge']
            ),
        ],
    )
    def test_get_default_binary_location_success(self, os_name, expected_paths):
        """Each supported OS hands its candidate list to the path validator."""
        first_candidate = expected_paths[0]

        with patch(
            'pydoll.browser.chromium.edge.validate_browser_paths',
            return_value=first_candidate,
        ) as validator, patch('platform.system', return_value=os_name) as system:
            resolved = Edge._get_default_binary_location()

        system.assert_called_once()
        validator.assert_called_once_with(expected_paths)
        assert resolved == first_candidate

    def test_get_default_binary_location_unsupported_os(self):
        """An OS name without a configured Edge path raises UnsupportedOS."""
        with patch('platform.system', return_value='FreeBSD'):
            with pytest.raises(UnsupportedOS):
                Edge._get_default_binary_location()

    def test_get_default_binary_location_unknown_os(self):
        """An unrecognised OS name raises UnsupportedOS."""
        with patch('platform.system', return_value='UnknownOS'):
            with pytest.raises(UnsupportedOS):
                Edge._get_default_binary_location()

    def test_get_default_binary_location_validation_error(self):
        """A validator failure propagates out of the lookup unchanged."""
        failure = InvalidBrowserPath('Edge executable not found')

        with patch(
            'pydoll.browser.chromium.edge.validate_browser_paths',
            side_effect=failure,
        ), patch('platform.system', return_value='Linux'):
            with pytest.raises(InvalidBrowserPath, match='Edge executable not found'):
                Edge._get_default_binary_location()

    def test_get_default_binary_location_windows_fallback(self):
        """On Windows the validator receives both install paths, in order."""
        x86_install = r'C:\Program Files (x86)\Microsoft\Edge\Application\msedge.exe'

        with patch(
            'pydoll.browser.chromium.edge.validate_browser_paths',
            return_value=x86_install,
        ) as validator, patch('platform.system', return_value='Windows'):
            resolved = Edge._get_default_binary_location()

        validator.assert_called_once_with(
            [
                r'C:\Program Files\Microsoft\Edge\Application\msedge.exe',
                r'C:\Program Files (x86)\Microsoft\Edge\Application\msedge.exe',
            ]
        )
        assert resolved == x86_install

    def test_get_default_binary_location_linux_path(self):
        """On Linux the single candidate is /usr/bin/microsoft-edge."""
        linux_binary = '/usr/bin/microsoft-edge'

        with patch(
            'pydoll.browser.chromium.edge.validate_browser_paths',
            return_value=linux_binary,
        ) as validator, patch('platform.system', return_value='Linux'):
            resolved = Edge._get_default_binary_location()

        validator.assert_called_once_with(['/usr/bin/microsoft-edge'])
        assert resolved == linux_binary

    def test_get_default_binary_location_macos_path(self):
        """On macOS the single candidate is the app-bundle executable."""
        mac_binary = '/Applications/Microsoft Edge.app/Contents/MacOS/Microsoft Edge'

        with patch(
            'pydoll.browser.chromium.edge.validate_browser_paths',
            return_value=mac_binary,
        ) as validator, patch('platform.system', return_value='Darwin'):
            resolved = Edge._get_default_binary_location()

        validator.assert_called_once_with([mac_binary])
        assert resolved == mac_binary


class TestEdgeOptionsManager:
    """Tests for ChromiumOptionsManager integration."""

    @pytest.fixture(autouse=True)
    def _patch_edge_dependencies(self):
        """Apply the patch stack shared by every test in this class.

        ``Edge._get_default_binary_location`` is replaced by a mock returning
        ``'/fake/edge'`` and the process, temp-dir, connection and proxy
        manager classes are patched (autospec) at their defining modules.
        """
        with patch.multiple(
            Edge,
            _get_default_binary_location=MagicMock(return_value='/fake/edge'),
        ), patch(
            'pydoll.browser.managers.browser_process_manager.BrowserProcessManager',
            autospec=True,
        ), patch(
            'pydoll.browser.managers.temp_dir_manager.TempDirectoryManager',
            autospec=True,
        ), patch(
            'pydoll.connection.connection_handler.ConnectionHandler',
            autospec=True,
        ), patch(
            'pydoll.browser.managers.proxy_manager.ProxyManager',
            autospec=True,
        ):
            yield

    def test_options_manager_creation(self):
        """Test options manager creation."""
        custom_options = ChromiumOptions()
        custom_options.add_argument('--no-sandbox')

        edge = Edge(options=custom_options)

        # Verify that options were configured correctly
        assert edge.options == custom_options
        assert '--no-sandbox' in edge.options.arguments

    def test_options_manager_with_none_options(self):
        """Test options manager creation with None options."""
        edge = Edge(options=None)

        # Verify that default options were created
        assert isinstance(edge.options, ChromiumOptions)


class TestEdgeInheritance:
    """Tests to verify correct inheritance from Browser class."""

    @pytest.fixture
    def edge_patches(self):
        """Apply the patch stack needed to instantiate ``Edge`` in isolation.

        Not autouse: ``test_edge_overrides_get_default_binary_location`` must
        see the real ``Edge._get_default_binary_location``, which this
        fixture replaces with a mock returning ``'/fake/edge'``.
        """
        with patch.multiple(
            Edge,
            _get_default_binary_location=MagicMock(return_value='/fake/edge'),
        ), patch(
            'pydoll.browser.managers.browser_process_manager.BrowserProcessManager',
            autospec=True,
        ), patch(
            'pydoll.browser.managers.temp_dir_manager.TempDirectoryManager',
            autospec=True,
        ), patch(
            'pydoll.connection.connection_handler.ConnectionHandler',
            autospec=True,
        ), patch(
            'pydoll.browser.managers.proxy_manager.ProxyManager',
            autospec=True,
        ):
            yield

    @pytest.mark.usefixtures('edge_patches')
    def test_edge_inherits_from_browser(self):
        """Test if Edge correctly inherits from Browser."""
        from pydoll.browser.chromium.base import Browser

        edge = Edge()

        assert isinstance(edge, Browser)
        assert hasattr(edge, 'start')
        assert hasattr(edge, 'stop')
        assert hasattr(edge, 'new_tab')

    def test_edge_overrides_get_default_binary_location(self):
        """Test if Edge overrides the _get_default_binary_location method."""
        # Verify that the method exists and is callable
        assert hasattr(Edge, '_get_default_binary_location')
        assert callable(Edge._get_default_binary_location)

        # Verify that it's different from the base implementation
        from pydoll.browser.chromium.base import Browser
        assert Edge._get_default_binary_location != Browser._get_default_binary_location

    @pytest.mark.usefixtures('edge_patches')
    def test_edge_uses_chromium_options_manager(self):
        """Test if Edge uses ChromiumOptionsManager like Chrome."""
        edge = Edge()

        # Edge should use the same options type as Chrome since it's Chromium-based
        assert isinstance(edge.options, ChromiumOptions)


class TestEdgeEdgeCases:
    """Tests for edge cases and special situations."""

    @pytest.fixture(autouse=True)
    def _patch_edge_dependencies(self):
        """Apply the patch stack shared by every test in this class.

        ``Edge._get_default_binary_location`` is replaced by a mock returning
        ``'/fake/edge'`` and the process, temp-dir, connection and proxy
        manager classes are patched (autospec) at their defining modules.
        """
        with patch.multiple(
            Edge,
            _get_default_binary_location=MagicMock(return_value='/fake/edge'),
        ), patch(
            'pydoll.browser.managers.browser_process_manager.BrowserProcessManager',
            autospec=True,
        ), patch(
            'pydoll.browser.managers.temp_dir_manager.TempDirectoryManager',
            autospec=True,
        ), patch(
            'pydoll.connection.connection_handler.ConnectionHandler',
            autospec=True,
        ), patch(
            'pydoll.browser.managers.proxy_manager.ProxyManager',
            autospec=True,
        ):
            yield

    def test_edge_with_empty_options(self):
        """Test Edge with empty options."""
        empty_options = ChromiumOptions()

        edge = Edge(options=empty_options)

        assert edge.options == empty_options
        # Initialization may add default arguments, so only the container
        # type is checked; the previous ``len(...) >= 0`` could never fail.
        assert isinstance(edge.options.arguments, list)

    def test_edge_with_zero_port(self):
        """Test Edge with zero port (should generate random port since 0 is falsy)."""
        edge = Edge(connection_port=0)

        # Port 0 is falsy, so should generate a random port
        assert edge._connection_port in range(9223, 9323)

    def test_edge_with_negative_port(self):
        """Test Edge with negative port (should raise InvalidConnectionPort)."""
        with pytest.raises(InvalidConnectionPort):
            Edge(connection_port=-1)

    def test_edge_with_edge_specific_arguments(self):
        """Test Edge with Edge-specific command line arguments."""
        custom_options = ChromiumOptions()
        custom_options.add_argument('--enable-features=msEdgeEnhancedSecurity')
        custom_options.add_argument('--edge-webview-enable-builtin-background-extensions')

        edge = Edge(options=custom_options)

        assert '--enable-features=msEdgeEnhancedSecurity' in edge.options.arguments
        assert '--edge-webview-enable-builtin-background-extensions' in edge.options.arguments


class TestEdgeIntegration:
    """Integration tests to verify components working together."""

    @pytest.fixture(autouse=True)
    def _patch_edge_dependencies(self):
        """Apply the patch stack shared by every test in this class.

        ``Edge._get_default_binary_location`` is replaced by a mock returning
        ``'/fake/edge'`` and the process, temp-dir, connection and proxy
        manager classes are patched (autospec) at their defining modules.
        """
        with patch.multiple(
            Edge,
            _get_default_binary_location=MagicMock(return_value='/fake/edge'),
        ), patch(
            'pydoll.browser.managers.browser_process_manager.BrowserProcessManager',
            autospec=True,
        ), patch(
            'pydoll.browser.managers.temp_dir_manager.TempDirectoryManager',
            autospec=True,
        ), patch(
            'pydoll.connection.connection_handler.ConnectionHandler',
            autospec=True,
        ), patch(
            'pydoll.browser.managers.proxy_manager.ProxyManager',
            autospec=True,
        ):
            yield

    def test_edge_full_initialization_flow(self):
        """Test complete Edge initialization flow."""
        custom_options = ChromiumOptions()
        custom_options.add_argument('--disable-gpu')
        custom_options.add_argument('--no-sandbox')
        custom_options.binary_location = '/custom/edge'
        custom_port = 9876

        edge = Edge(options=custom_options, connection_port=custom_port)

        # Verify correct initialization
        assert edge.options == custom_options
        assert edge._connection_port == custom_port
        assert '--disable-gpu' in edge.options.arguments
        assert '--no-sandbox' in edge.options.arguments
        assert edge.options.binary_location == '/custom/edge'

        # Verify that managers were created
        assert edge._browser_process_manager is not None
        assert edge._temp_directory_manager is not None
        assert edge._connection_handler is not None
        assert edge._proxy_manager is not None

    def test_edge_options_initialization_flow(self):
        """Test Edge options initialization flow."""
        # Test with None options (should create default options)
        edge = Edge(options=None)
        assert isinstance(edge.options, ChromiumOptions)

        # Test with custom options
        custom_options = ChromiumOptions()
        custom_options.add_argument('--test-arg')
        edge2 = Edge(options=custom_options)
        assert edge2.options == custom_options
        assert '--test-arg' in edge2.options.arguments

    def test_edge_vs_chrome_compatibility(self):
        """Test that Edge and Chrome use compatible interfaces."""
        from pydoll.browser.chromium.chrome import Chrome

        # Chrome needs its own binary-lookup stub on top of the shared patches.
        with patch.multiple(
            Chrome,
            _get_default_binary_location=MagicMock(return_value='/fake/chrome'),
        ):
            edge = Edge()
            chrome = Chrome()

            # Both should have the same interface
            assert type(edge.options) is type(chrome.options)
            assert hasattr(edge, 'start') and hasattr(chrome, 'start')
            assert hasattr(edge, 'stop') and hasattr(chrome, 'stop')
            assert hasattr(edge, 'new_tab') and hasattr(chrome, 'new_tab')


================================================
FILE: tests/test_browser/test_browser_options.py
================================================
import pytest

from pydoll.browser.interfaces import Options as OptionsInterface
from pydoll.browser.options import ChromiumOptions as Options
from pydoll.constants import PageLoadState
from pydoll.exceptions import (
    ArgumentAlreadyExistsInOptions,
    ArgumentNotFoundInOptions,
    WrongPrefsDict,
)


def test_initial_arguments():
    """A freshly built Options object starts with an empty argument list."""
    fresh = Options()
    assert fresh.arguments == []


def test_initial_binary_location():
    """A freshly built Options object has a falsy binary location."""
    fresh = Options()
    assert not fresh.binary_location


def test_set_binary_location():
    """The binary location reads back exactly as assigned."""
    opts = Options()
    opts.binary_location = '/path/to/browser'
    assert opts.binary_location == '/path/to/browser'


def test_set_start_timeout():
    """The start timeout reads back exactly as assigned."""
    opts = Options()
    opts.start_timeout = 30
    assert opts.start_timeout == 30


def test_initial_page_load_state():
    """The default page load state is ``PageLoadState.COMPLETE``."""
    fresh = Options()
    assert fresh.page_load_state == PageLoadState.COMPLETE


def test_set_page_load_state():
    """The page load state reads back exactly as assigned."""
    opts = Options()
    opts.page_load_state = PageLoadState.INTERACTIVE
    assert opts.page_load_state == PageLoadState.INTERACTIVE


def test_add_argument():
    """Adding one argument makes it the sole entry in ``arguments``."""
    opts = Options()
    opts.add_argument('--headless')
    assert opts.arguments == ['--headless']


def test_add_duplicate_argument():
    """Adding the same argument twice raises ArgumentAlreadyExistsInOptions."""
    opts = Options()
    opts.add_argument('--headless')
    expectation = pytest.raises(
        ArgumentAlreadyExistsInOptions, match='Argument already exists: --headless'
    )
    with expectation:
        opts.add_argument('--headless')

def test_remove_argument():
    """Removing a previously added argument leaves the list empty."""
    opts = Options()
    opts.add_argument('--headless')
    opts.remove_argument('--headless')
    assert opts.arguments == []

def test_remove_argument_not_exists():
    """Removing an argument that was never added raises ArgumentNotFoundInOptions."""
    opts = Options()
    expectation = pytest.raises(
        ArgumentNotFoundInOptions, match='Argument not found: --headless'
    )
    with expectation:
        opts.remove_argument('--headless')

def test_add_multiple_arguments():
    """Arguments are stored in the order they were added."""
    opts = Options()
    opts.add_argument('--headless')
    opts.add_argument('--no-sandbox')
    assert opts.arguments == ['--headless', '--no-sandbox']


def test_set_default_download_directory():
    """The download directory is stored under ``download.default_directory``."""
    opts = Options()
    opts.set_default_download_directory('/tmp/downloads')
    download_prefs = opts.browser_preferences['download']
    assert download_prefs['default_directory'] == '/tmp/downloads'


def test_set_prompt_for_download():
    """Disabling the download prompt shows up in the prefs and the property."""
    opts = Options()
    opts.prompt_for_download = False
    stored = opts.browser_preferences['download']['prompt_for_download']
    assert stored is False
    assert opts.prompt_for_download is False


def test_set_block_popups():
    """Blocking popups stores content-setting value 0 for ``popups``."""
    opts = Options()
    opts.block_popups = True
    content_settings = opts.browser_preferences['profile']['default_content_setting_values']
    assert content_settings['popups'] == 0
    assert opts.block_popups == True


def test_set_password_manager_enabled():
    """Disabling the password manager shows up in the prefs and the property."""
    opts = Options()
    opts.password_manager_enabled = False
    stored = opts.browser_preferences['profile']['password_manager_enabled']
    assert stored is False
    assert opts.password_manager_enabled is False


def test_set_block_notifications():
    """Blocking notifications stores content-setting value 2 for ``notifications``."""
    opts = Options()
    opts.block_notifications = True
    content_settings = opts.browser_preferences['profile']['default_content_setting_values']
    assert content_settings['notifications'] == 2
    assert opts.block_notifications == True


def test_set_allow_automatic_downloads():
    """Allowing automatic downloads stores content-setting value 1."""
    opts = Options()
    opts.allow_automatic_downloads = True
    content_settings = opts.browser_preferences['profile']['default_content_setting_values']
    assert content_settings['automatic_downloads'] == 1
    assert opts.allow_automatic_downloads == True


def test_set_open_pdf_externally():
    """Opening PDFs externally shows up in the prefs and the property."""
    opts = Options()
    opts.open_pdf_externally = True
    stored = opts.browser_preferences['plugins']['always_open_pdf_externally']
    assert stored is True
    assert opts.open_pdf_externally is True


def test_set_accept_languages():
    """The language list is stored under ``intl.accept_languages``."""
    opts = Options()
    opts.set_accept_languages('pt-BR,pt,en-US,en')
    intl_prefs = opts.browser_preferences['intl']
    assert intl_prefs['accept_languages'] == 'pt-BR,pt,en-US,en'


def test_set_multiple_prefs():
    """Setting many preferences together leaves each stored value intact."""
    opts = Options()
    opts.set_default_download_directory('/tmp/all')
    opts.prompt_for_download = False
    opts.block_popups = True
    opts.password_manager_enabled = False
    opts.block_notifications = True
    opts.allow_automatic_downloads = True
    opts.open_pdf_externally = True
    opts.set_accept_languages('pt-BR,pt,en-US,en')

    # Download section
    download = opts.browser_preferences['download']
    assert download['default_directory'] == '/tmp/all'
    assert download['prompt_for_download'] is False

    # Profile section (checked in the same order as the original assertions)
    profile = opts.browser_preferences['profile']
    assert profile['default_content_setting_values']['popups'] == 0
    assert profile['password_manager_enabled'] is False
    assert profile['default_content_setting_values']['notifications'] == 2
    assert profile['default_content_setting_values']['automatic_downloads'] == 1

    # Plugins and internationalisation sections
    assert opts.browser_preferences['plugins']['always_open_pdf_externally'] is True
    assert opts.browser_preferences['intl']['accept_languages'] == 'pt-BR,pt,en-US,en'


def test_dict_prefs():
    """Assigning a dict to ``browser_preferences`` makes its values readable."""
    options = Options()
    options.browser_preferences = {
        "download": {"directory_upgrade": True},
    }
    # Identity check, matching the sibling preference tests: the stored
    # value must be the boolean True, not merely something equal to it.
    assert options.browser_preferences['download']['directory_upgrade'] is True


def test_not_dict_prefs_error():
    """Assigning a non-dict to ``browser_preferences`` raises ``ValueError``."""
    # Build the object outside the ``raises`` block so that only the
    # assignment under test can satisfy the expectation.
    options = Options()
    with pytest.raises(ValueError, match='The experimental options value must be a dict.'):
        options.browser_preferences = ["download", "directory_upgrade"]


def test_wrong_dict_prefs_error():
    """A preferences dict wrapped in a top-level ``'prefs'`` key is rejected."""
    # Build the object outside the ``raises`` block so that only the
    # assignment under test can satisfy the expectation.
    options = Options()
    with pytest.raises(WrongPrefsDict):
        options.browser_preferences = {
            'prefs': {
                "download": {"directory_upgrade": True},
            }
        }

def test_set_arguments():
    """Assigning ``arguments`` directly replaces the stored list."""
    opts = Options()
    opts.arguments = ['--headless']
    assert opts.arguments == ['--headless']

def test_get_pref_path():
    """``_get_pref_path`` returns the value stored at a nested key path."""
    opts = Options()
    opts.set_default_download_directory('/tmp/downloads')
    found = opts._get_pref_path(['download', 'default_directory'])
    assert found == '/tmp/downloads'


def test_get_pref_path_none():
    """``_get_pref_path`` returns ``None`` when the path was never set."""
    fresh = Options()
    found = fresh._get_pref_path(['download', 'default_directory'])
    assert found is None


def test_options_interface_enforcement():
    """The Options interface cannot be instantiated until fully implemented.

    Three cases are exercised: the interface itself, a subclass that
    implements nothing, and a subclass that provides every member used here.
    """

    class MissingEverything(OptionsInterface):
        pass

    class FullyImplemented(OptionsInterface):
        @property
        def arguments(self):
            return []

        @property
        def binary_location(self):
            return ''

        @property
        def start_timeout(self):
            return 0

        def add_argument(self, argument):
            pass

        @property
        def browser_preferences(self):
            return {}

        @property
        def headless(self):
            return False

        @property
        def page_load_state(self):
            return PageLoadState.COMPLETE

        @page_load_state.setter
        def page_load_state(self, state):
            pass

    # The bare interface is rejected.
    with pytest.raises(TypeError):
        OptionsInterface()

    # So is a subclass that leaves everything unimplemented.
    with pytest.raises(TypeError):
        MissingEverything()

    # A complete implementation must instantiate without raising.
    FullyImplemented()

def test_set_headless():
    """Enabling headless mode adds the ``--headless`` argument."""
    opts = Options()
    opts.headless = True
    assert opts.headless is True
    assert opts.arguments == ['--headless']

def test_set_headless_false():
    """Turning headless mode off again removes the ``--headless`` argument."""
    opts = Options()

    # Switch on and confirm the flag is present.
    opts.headless = True
    assert opts.headless is True
    assert opts.arguments == ['--headless']

    # Switch off and confirm the flag is gone.
    opts.headless = False
    assert opts.headless is False
    assert opts.arguments == []

def test_set_headless_true_twice():
    """Enabling headless mode twice keeps a single ``--headless`` argument."""
    opts = Options()
    for _ in range(2):
        opts.headless = True
        assert opts.headless is True
        assert opts.arguments == ['--headless']

def test_set_headless_false_twice():
    """Disabling headless mode twice leaves the argument list empty."""
    opts = Options()
    for _ in range(2):
        opts.headless = False
        assert opts.headless is False
        assert opts.arguments == []

def test_set_webrtc_leak_protection():
    """Enabling WebRTC leak protection adds the IP-handling policy argument."""
    opts = Options()
    opts.webrtc_leak_protection = True
    assert opts.webrtc_leak_protection is True
    assert opts.arguments == ['--force-webrtc-ip-handling-policy=disable_non_proxied_udp']

def test_set_webrtc_leak_protection_false():
    """Turning WebRTC leak protection off again removes the policy argument."""
    opts = Options()

    # Switch on and confirm the flag is present.
    opts.webrtc_leak_protection = True
    assert opts.webrtc_leak_protection is True
    assert opts.arguments == ['--force-webrtc-ip-handling-policy=disable_non_proxied_udp']

    # Switch off and confirm the flag is gone.
    opts.webrtc_leak_protection = False
    assert opts.webrtc_leak_protection is False
    assert opts.arguments == []

def test_set_webrtc_leak_protection_true_twice():
    """Enabling WebRTC leak protection twice keeps a single policy argument."""
    opts = Options()
    for _ in range(2):
        opts.webrtc_leak_protection = True
        assert opts.webrtc_leak_protection is True
        assert opts.arguments == ['--force-webrtc-ip-handling-policy=disable_non_proxied_udp']

def test_set_webrtc_leak_protection_false_twice():
    """Disabling WebRTC leak protection repeatedly keeps the arguments empty."""
    opts = Options()

    for _ in range(2):
        opts.webrtc_leak_protection = False
        assert opts.webrtc_leak_protection is False
        assert opts.arguments == []


================================================
FILE: tests/test_browser/test_browser_tab.py
================================================
import base64
import asyncio
import pytest
import pytest_asyncio
import uuid
from unittest.mock import AsyncMock, MagicMock, Mock, patch, ANY
from pathlib import Path

from pydoll.elements.web_element import WebElement
from pydoll.protocol.runtime.types import CallArgument, SerializationOptions
from pydoll.browser.options import ChromiumOptions

from pydoll.protocol.network.types import ResourceType, RequestMethod
from pydoll.protocol.fetch.types import RequestStage
from pydoll.constants import By, PageLoadState
from pydoll.browser.tab import Tab
from pydoll.utils.bundle import (
    build_asset_filename,
    collect_frame_resources,
    rewrite_css_urls,
)
from pydoll.protocol.page.events import PageEvent
from pydoll.protocol.browser.types import DownloadBehavior
from pydoll.exceptions import DownloadTimeout, InvalidTabInitialization
from pydoll.exceptions import (
    NoDialogPresent,
    PageLoadTimeout,
    IFrameNotFound,
    InvalidIFrame,
    NotAnIFrame,
    InvalidFileExtension,
    WaitElementTimeout,
    NetworkEventsNotEnabled,
    TopLevelTargetRequired,
    InvalidScriptWithElement,
)

@pytest_asyncio.fixture
async def mock_connection_handler():
    """Yield an autospecced ``ConnectionHandler`` instance with async stubs.

    The command/callback methods are replaced by ``AsyncMock`` objects so the
    tests can await them, and ``network_logs`` / ``dialog`` start out empty.
    The patch on ``pydoll.connection.ConnectionHandler`` stays active for as
    long as the fixture is in use.
    """
    async_method_names = (
        'execute_command',
        'register_callback',
        'remove_callback',
        'clear_callbacks',
    )
    with patch('pydoll.connection.ConnectionHandler', autospec=True) as handler_cls:
        instance = handler_cls.return_value
        for method_name in async_method_names:
            setattr(instance, method_name, AsyncMock())
        instance.network_logs = []
        instance.dialog = None
        yield instance


@pytest_asyncio.fixture
async def mock_browser():
    """Return a ``MagicMock`` browser with real options and an awaitable ``close_tab``."""
    fake_browser = MagicMock()
    fake_browser.options = ChromiumOptions()
    fake_browser.close_tab = AsyncMock()
    return fake_browser


@pytest_asyncio.fixture
async def tab(mock_browser, mock_connection_handler):
    """Build a ``Tab`` wired to the mocked browser and connection handler.

    Each invocation gets its own target id (``test-target-`` plus eight random
    hex characters). ``ConnectionHandler`` is patched inside ``pydoll.browser.tab``
    only while the ``Tab`` is being constructed.
    """
    random_suffix = uuid.uuid4().hex[:8]
    with patch('pydoll.browser.tab.ConnectionHandler', return_value=mock_connection_handler):
        return Tab(
            browser=mock_browser,
            connection_port=9222,
            target_id=f'test-target-{random_suffix}',
            browser_context_id='test-context-id',
        )


def assert_mock_called_at_least_once(mock_obj, method_name='execute_command'):
    """
    Assert that ``mock_obj.<method_name>`` has been invoked one or more times.

    Args:
        mock_obj: Object exposing the mocked method as an attribute.
        method_name: Attribute name of the mocked method to inspect.

    Raises:
        AssertionError: If the method was never called.
    """
    target = getattr(mock_obj, method_name)
    # Both checks are kept: the mock's own assertion and the explicit count.
    target.assert_called()
    assert target.call_count >= 1


@pytest.fixture(autouse=True)
def cleanup_tab_registry():
    """Autouse placeholder retained for compatibility after the singleton removal.

    Performs no setup and no teardown.
    """
    yield None


class TestTabInitialization:
    """Construction-time state of ``Tab`` and its boolean event-flag properties."""

    # Public read-only flags; each one is backed by a ``_<name>`` attribute.
    _EVENT_FLAGS = (
        'page_events_enabled',
        'network_events_enabled',
        'fetch_events_enabled',
        'dom_events_enabled',
        'runtime_events_enabled',
        'intercept_file_chooser_dialog_enabled',
    )

    def test_tab_initialization(self, tab, mock_browser):
        """Constructor arguments are stored and every event flag starts falsy."""
        assert tab._browser == mock_browser
        assert tab._connection_port == 9222
        assert tab._target_id.startswith('test-target-')
        assert tab._browser_context_id == 'test-context-id'
        for flag_name in self._EVENT_FLAGS:
            assert not getattr(tab, flag_name)

    def test_tab_init_raises_when_no_identifiers(self, mock_browser):
        """Constructing a ``Tab`` with only a browser raises ``InvalidTabInitialization``."""
        with pytest.raises(InvalidTabInitialization):
            Tab(browser=mock_browser)

    def test_tab_properties(self, tab):
        """Each public flag mirrors the value of its private backing attribute."""
        # Freshly built tab: every flag is exactly False.
        for flag_name in self._EVENT_FLAGS:
            assert getattr(tab, flag_name) is False

        # Flip all the private attributes directly...
        for flag_name in self._EVENT_FLAGS:
            setattr(tab, f'_{flag_name}', True)

        # ...and the public properties must now report True.
        for flag_name in self._EVENT_FLAGS:
            assert getattr(tab, flag_name) is True


class TestTabProperties:
    """Test the awaitable ``Tab`` properties (``current_url``, ``page_source``, ``title``).

    Each test stubs the connection handler's ``execute_command`` response and
    checks the value the property resolves to.
    """

    @pytest.mark.asyncio
    async def test_current_url(self, tab):
        """``current_url`` resolves to the ``value`` carried by the command response."""
        tab._connection_handler.execute_command.return_value = {
            'result': {'result': {'value': 'https://example.com'}}
        }

        url = await tab.current_url

        assert url == 'https://example.com'
        # Use the shared helper (at-least-once semantics) like the sibling classes.
        assert_mock_called_at_least_once(tab._connection_handler)

    @pytest.mark.asyncio
    async def test_page_source(self, tab):
        """``page_source`` resolves to the HTML string carried by the command response."""
        expected_html = '<html><body>Test Content</body></html>'
        tab._connection_handler.execute_command.return_value = {
            'result': {'result': {'value': expected_html}}
        }

        source = await tab.page_source

        assert source == expected_html
        assert_mock_called_at_least_once(tab._connection_handler)

    @pytest.mark.asyncio
    async def test_title(self, tab):
        """``title`` resolves to the ``value`` carried by the command response."""
        tab._connection_handler.execute_command.return_value = {
            'result': {'result': {'value': 'My Page Title'}}
        }

        title = await tab.title

        assert title == 'My Page Title'
        assert_mock_called_at_least_once(tab._connection_handler)

    @pytest.mark.asyncio
    async def test_title_empty(self, tab):
        """``title`` resolves to an empty string when the response has no ``value`` key."""
        tab._connection_handler.execute_command.return_value = {
            'result': {'result': {}}
        }

        title = await tab.title

        assert title == ''


class TestTabEventManagement:
    """Enable/disable toggles for each event domain exposed by ``Tab``.

    Every test checks two things: a command reached the connection handler and
    the matching ``*_enabled`` property reports the new state.
    """

    @pytest.mark.asyncio
    async def test_enable_page_events(self, tab):
        """``enable_page_events`` sends a command and sets the page flag."""
        await tab.enable_page_events()
        assert_mock_called_at_least_once(tab._connection_handler)
        assert tab.page_events_enabled is True

    @pytest.mark.asyncio
    async def test_enable_network_events(self, tab):
        """``enable_network_events`` sends a command and sets the network flag."""
        await tab.enable_network_events()
        assert_mock_called_at_least_once(tab._connection_handler)
        assert tab.network_events_enabled is True

    @pytest.mark.asyncio
    async def test_enable_fetch_events(self, tab):
        """``enable_fetch_events`` with no arguments sends a command and sets the flag."""
        await tab.enable_fetch_events()
        assert_mock_called_at_least_once(tab._connection_handler)
        assert tab.fetch_events_enabled is True

    @pytest.mark.asyncio
    async def test_enable_fetch_events_with_params(self, tab):
        """``enable_fetch_events`` accepts auth, resource-type and stage options."""
        fetch_options = {
            'handle_auth': True,
            'resource_type': ResourceType.DOCUMENT,
            'request_stage': RequestStage.REQUEST,
        }
        await tab.enable_fetch_events(**fetch_options)
        assert_mock_called_at_least_once(tab._connection_handler)
        assert tab.fetch_events_enabled is True

    @pytest.mark.asyncio
    async def test_enable_dom_events(self, tab):
        """``enable_dom_events`` sends a command and sets the DOM flag."""
        await tab.enable_dom_events()
        assert_mock_called_at_least_once(tab._connection_handler)
        assert tab.dom_events_enabled is True

    @pytest.mark.asyncio
    async def test_enable_runtime_events(self, tab):
        """``enable_runtime_events`` sends a command and sets the runtime flag."""
        await tab.enable_runtime_events()
        assert_mock_called_at_least_once(tab._connection_handler)
        assert tab.runtime_events_enabled is True

    @pytest.mark.asyncio
    async def test_enable_intercept_file_chooser_dialog(self, tab):
        """Enabling file-chooser interception sends a command and sets the flag."""
        await tab.enable_intercept_file_chooser_dialog()
        assert_mock_called_at_least_once(tab._connection_handler)
        assert tab.intercept_file_chooser_dialog_enabled is True

    @pytest.mark.asyncio
    async def test_disable_fetch_events(self, tab):
        """``disable_fetch_events`` sends a command and clears a pre-set flag."""
        tab._fetch_events_enabled = True
        await tab.disable_fetch_events()
        assert_mock_called_at_least_once(tab._connection_handler)
        assert tab.fetch_events_enabled is False

    @pytest.mark.asyncio
    async def test_disable_page_events(self, tab):
        """``disable_page_events`` sends a command and clears a pre-set flag."""
        tab._page_events_enabled = True
        await tab.disable_page_events()
        assert_mock_called_at_least_once(tab._connection_handler)
        assert tab.page_events_enabled is False

    @pytest.mark.asyncio
    async def test_disable_network_events(self, tab):
        """``disable_network_events`` sends a command and clears a pre-set flag."""
        tab._network_events_enabled = True
        await tab.disable_network_events()
        assert_mock_called_at_least_once(tab._connection_handler)
        assert tab.network_events_enabled is False

    @pytest.mark.asyncio
    async def test_disable_dom_events(self, tab):
        """``disable_dom_events`` sends a command and clears a pre-set flag."""
        tab._dom_events_enabled = True
        await tab.disable_dom_events()
        assert_mock_called_at_least_once(tab._connection_handler)
        assert tab.dom_events_enabled is False

    @pytest.mark.asyncio
    async def test_disable_runtime_events(self, tab):
        """``disable_runtime_events`` sends a command and clears a pre-set flag."""
        tab._runtime_events_enabled = True
        await tab.disable_runtime_events()
        assert_mock_called_at_least_once(tab._connection_handler)
        assert tab.runtime_events_enabled is False

    @pytest.mark.asyncio
    async def test_disable_intercept_file_chooser_dialog(self, tab):
        """Disabling file-chooser interception sends a command and clears the flag."""
        tab._intercept_file_chooser_dialog_enabled = True
        await tab.disable_intercept_file_chooser_dialog()
        assert_mock_called_at_least_once(tab._connection_handler)
        assert tab.intercept_file_chooser_dialog_enabled is False


class TestTabCookieManagement:
    """Reading, writing and clearing cookies through ``Tab``."""

    @pytest.mark.asyncio
    async def test_get_cookies(self, tab):
        """``get_cookies`` returns the ``cookies`` list from the command response."""
        expected = [{'name': 'test', 'value': 'value', 'domain': 'example.com'}]
        tab._connection_handler.execute_command.return_value = {
            'result': {'cookies': expected}
        }

        assert await tab.get_cookies() == expected
        assert_mock_called_at_least_once(tab._connection_handler)

    @pytest.mark.asyncio
    async def test_get_cookies_uses_storage_commands_with_browser_context_id(
        self, mock_browser, mock_connection_handler
    ):
        """With an explicit ``browser_context_id`` the command is ``Storage.getCookies``.

        The context id must also be forwarded in the command params, which is
        what keeps cookies isolated per browser context.
        """
        expected = [{'name': 'isolated', 'value': 'cookie', 'domain': 'example.com'}]
        mock_connection_handler.execute_command.return_value = {
            'result': {'cookies': expected}
        }

        # The patch is only needed while the Tab is constructed.
        with patch('pydoll.browser.tab.ConnectionHandler', return_value=mock_connection_handler):
            isolated_tab = Tab(
                browser=mock_browser,
                connection_port=9222,
                target_id='test-target-with-context',
                browser_context_id='explicit-context-id',
            )

        fetched = await isolated_tab.get_cookies()
        assert fetched == expected

        # First positional argument of the most recent call is the command dict.
        sent_command = mock_connection_handler.execute_command.call_args.args[0]
        assert sent_command['method'] == 'Storage.getCookies'
        assert sent_command['params']['browserContextId'] == 'explicit-context-id'

    @pytest.mark.asyncio
    async def test_get_cookies_uses_network_commands_without_browser_context_id(
        self, mock_browser, mock_connection_handler
    ):
        """Without a ``browser_context_id`` the command is ``Network.getCookies``.

        This matters for incognito mode (``--incognito`` flag), where
        ``Storage.getCookies`` does not work properly but ``Network.getCookies`` does.
        """
        expected = [{'name': 'incognito', 'value': 'cookie', 'domain': 'example.com'}]
        mock_connection_handler.execute_command.return_value = {
            'result': {'cookies': expected}
        }

        with patch('pydoll.browser.tab.ConnectionHandler', return_value=mock_connection_handler):
            default_tab = Tab(
                browser=mock_browser,
                connection_port=9222,
                target_id='test-target-no-context',
                browser_context_id=None,  # no explicit context (incognito/default mode)
            )

        fetched = await default_tab.get_cookies()
        assert fetched == expected

        sent_command = mock_connection_handler.execute_command.call_args.args[0]
        assert sent_command['method'] == 'Network.getCookies'

    @pytest.mark.asyncio
    async def test_set_cookies(self, tab):
        """Setting a one-element cookie list issues exactly one command."""
        one_cookie = [{'name': 'test', 'value': 'value', 'domain': 'example.com'}]

        await tab.set_cookies(one_cookie)

        assert tab._connection_handler.execute_command.call_count == 1

    @pytest.mark.asyncio
    async def test_delete_all_cookies(self, tab):
        """Clearing all cookies issues exactly one command."""
        await tab.delete_all_cookies()

        assert tab._connection_handler.execute_command.call_count == 1


class TestTabNavigation:
    """``Tab.go_to`` and ``Tab.refresh`` against a scripted connection handler.

    ``execute_command`` is given an ordered list of canned responses, so the
    call-count assertions also pin how many commands each operation issues.
    """

    @staticmethod
    async def _fire_immediately(event_name, callback, temporary=False):
        """Stand-in for ``register_callback`` that invokes the callback at once.

        Returns ``1`` as the fake callback id.
        """
        callback({'method': event_name, 'params': {}})
        return 1

    @pytest.mark.asyncio
    async def test_go_to_new_url(self, tab):
        """Navigating to a different URL issues four commands in total."""
        handler = tab._connection_handler
        handler.execute_command.side_effect = [
            {'result': {'result': {'value': 'https://old-url.com'}}},  # current_url
            {'result': {}},  # Page.enable
            {'result': {'frameId': 'frame-id'}},  # navigate command
            {'result': {}},  # Page.disable
        ]
        handler.register_callback = AsyncMock(side_effect=self._fire_immediately)

        await tab.go_to('https://example.com')

        assert handler.execute_command.call_count == 4

    @pytest.mark.asyncio
    async def test_go_to_same_url(self, tab):
        """Navigating to the current URL (refresh path) also issues four commands."""
        handler = tab._connection_handler
        handler.execute_command.side_effect = [
            {'result': {'result': {'value': 'https://example.com'}}},  # current_url
            {'result': {}},  # Page.enable
            {'result': {}},  # refresh command
            {'result': {}},  # Page.disable
        ]
        handler.register_callback = AsyncMock(side_effect=self._fire_immediately)

        await tab.go_to('https://example.com')

        assert handler.execute_command.call_count == 4

    @pytest.mark.asyncio
    async def test_go_to_timeout(self, tab):
        """``go_to`` raises ``PageLoadTimeout`` when the load callback never fires."""
        handler = tab._connection_handler
        handler.execute_command.side_effect = [
            {'result': {'result': {'value': 'https://old-url.com'}}},  # current_url
            {'result': {}},  # Page.enable
            {'result': {'frameId': 'frame-id'}},  # navigate command
            {'result': {}},  # Page.disable
        ]
        # Registration succeeds but the callback is never invoked, so the wait expires.
        handler.register_callback = AsyncMock(return_value=1)

        with pytest.raises(PageLoadTimeout):
            await tab.go_to('https://example.com', timeout=0.1)

    @pytest.mark.asyncio
    async def test_refresh(self, tab):
        """A plain refresh issues three commands."""
        handler = tab._connection_handler
        handler.execute_command.side_effect = [
            {'result': {}},  # Page.enable
            {'result': {}},  # refresh command
            {'result': {}},  # Page.disable
        ]
        handler.register_callback = AsyncMock(side_effect=self._fire_immediately)

        await tab.refresh()

        assert handler.execute_command.call_count == 3

    @pytest.mark.asyncio
    async def test_refresh_with_params(self, tab):
        """A refresh with cache/script options still issues three commands."""
        handler = tab._connection_handler
        handler.execute_command.side_effect = [
            {'result': {}},  # Page.enable
            {'result': {}},  # refresh command
            {'result': {}},  # Page.disable
        ]
        handler.register_callback = AsyncMock(side_effect=self._fire_immediately)

        await tab.refresh(ignore_cache=True, script_to_evaluate_on_load='console.log("test")')

        assert handler.execute_command.call_count == 3


class TestTabScreenshotAndPDF:
    """``Tab.take_screenshot`` and ``Tab.print_to_pdf`` with mocked I/O."""

    # Base64 payloads handed back by the mocked command responses.
    _PNG_B64 = 'iVBORw0KGgoAAAANSUhEUgAAAAEAAAABCAQAAAC1HAwCAAAAC0lEQVR42mP8/wcAAgAB/edzE+oAAAAASUVORK5CYII='
    _PDF_B64 = 'JVBERi0xLjQKJdPr6eEKMSAwIG9iago8PAovVHlwZSAvQ2F0YWxvZwo+PgplbmRvYmoKdHJhaWxlcgo8PAovUm9vdCAxIDAgUgo+PgpzdGFydHhyZWYKMTgKJSVFT0Y='

    @pytest.mark.asyncio
    async def test_take_screenshot_to_file(self, tab, tmp_path):
        """Saving a screenshot to a path returns ``None``."""
        tab._connection_handler.execute_command.return_value = {
            'result': {'data': self._PNG_B64}
        }
        target = tmp_path / 'screenshot.png'

        # aiofiles.open is used as an async context manager, so stub __aenter__.
        fake_file = AsyncMock()
        fake_file.write = AsyncMock()
        with patch('aiofiles.open') as fake_open:
            fake_open.return_value.__aenter__.return_value = fake_file
            outcome = await tab.take_screenshot(str(target))

        assert outcome is None  # nothing is returned when writing to a file
        assert_mock_called_at_least_once(tab._connection_handler)

    @pytest.mark.asyncio
    async def test_take_screenshot_as_base64(self, tab):
        """With ``as_base64=True`` the raw base64 payload is returned."""
        tab._connection_handler.execute_command.return_value = {
            'result': {'data': self._PNG_B64}
        }

        outcome = await tab.take_screenshot('screenshot.png', as_base64=True)

        assert outcome == self._PNG_B64
        assert_mock_called_at_least_once(tab._connection_handler)

    @pytest.mark.asyncio
    async def test_take_screenshot_beyond_viewport(self, tab):
        """``beyond_viewport=True`` is forwarded as ``captureBeyondViewport``."""
        fake_execute = AsyncMock(return_value={'result': {'data': self._PNG_B64}})

        with patch.object(tab, '_execute_command', fake_execute):
            outcome = await tab.take_screenshot(
                path=None,
                beyond_viewport=True,
                as_base64=True,
            )

        fake_execute.assert_called_once()
        sent_command = fake_execute.call_args.args[0]
        assert sent_command['method'] == 'Page.captureScreenshot'
        assert sent_command['params']['captureBeyondViewport'] is True
        assert outcome == self._PNG_B64

    @pytest.mark.asyncio
    async def test_take_screenshot_in_iframe_raises_top_level_required(self, tab):
        """A response without a ``data`` key raises ``TopLevelTargetRequired``."""
        # Simulates CDP returning no image data for a non top-level target.
        no_image = AsyncMock(return_value={'result': {}})
        with patch.object(tab, '_execute_command', no_image), pytest.raises(
            TopLevelTargetRequired
        ):
            await tab.take_screenshot(path=None, as_base64=True)

    @pytest.mark.asyncio
    async def test_print_to_pdf_to_file(self, tab, tmp_path):
        """Saving a PDF to a path returns ``None``."""
        tab._connection_handler.execute_command.return_value = {
            'result': {'data': self._PDF_B64}
        }
        target = tmp_path / 'document.pdf'

        # aiofiles.open is used as an async context manager, so stub __aenter__.
        fake_file = AsyncMock()
        fake_file.write = AsyncMock()
        with patch('aiofiles.open') as fake_open:
            fake_open.return_value.__aenter__.return_value = fake_file
            outcome = await tab.print_to_pdf(str(target))

        assert outcome is None  # nothing is returned when writing to a file
        assert_mock_called_at_least_once(tab._connection_handler)

    @pytest.mark.asyncio
    async def test_print_to_pdf_as_base64(self, tab):
        """With ``as_base64=True`` the raw base64 PDF payload is returned."""
        tab._connection_handler.execute_command.return_value = {
            'result': {'data': self._PDF_B64}
        }

        outcome = await tab.print_to_pdf(as_base64=True)

        assert outcome == self._PDF_B64
        assert_mock_called_at_least_once(tab._connection_handler)

    @pytest.mark.asyncio
    async def test_print_to_pdf_with_options(self, tab, tmp_path):
        """Layout options are accepted and the file path still yields ``None``."""
        tab._connection_handler.execute_command.return_value = {
            'result': {'data': self._PDF_B64}
        }
        target = tmp_path / 'document.pdf'

        # aiofiles.open is used as an async context manager, so stub __aenter__.
        fake_file = AsyncMock()
        fake_file.write = AsyncMock()
        with patch('aiofiles.open') as fake_open:
            fake_open.return_value.__aenter__.return_value = fake_file
            outcome = await tab.print_to_pdf(
                str(target),
                landscape=True,
                display_header_footer=True,
                print_background=False,
                scale=0.8,
            )

        assert outcome is None
        assert_mock_called_at_least_once(tab._connection_handler)


class TestTabDialogHandling:
    """Dialog inspection and handling, driven by the handler's ``dialog`` attribute."""

    @pytest.mark.asyncio
    async def test_has_dialog_true(self, tab):
        """``has_dialog`` is ``True`` while the handler holds a dialog event."""
        tab._connection_handler.dialog = {'params': {'type': 'alert', 'message': 'Test'}}

        assert await tab.has_dialog() is True

    @pytest.mark.asyncio
    async def test_has_dialog_false(self, tab):
        """``has_dialog`` is ``False`` when the handler's dialog is ``None``."""
        tab._connection_handler.dialog = None

        assert await tab.has_dialog() is False

    @pytest.mark.asyncio
    async def test_get_dialog_message_success(self, tab):
        """``get_dialog_message`` returns the ``message`` from the dialog params."""
        tab._connection_handler.dialog = {'params': {'message': 'Test message'}}

        text = await tab.get_dialog_message()

        assert text == 'Test message'

    @pytest.mark.asyncio
    async def test_get_dialog_message_no_dialog(self, tab):
        """``get_dialog_message`` raises ``NoDialogPresent`` without a dialog."""
        tab._connection_handler.dialog = None

        with pytest.raises(NoDialogPresent):
            await tab.get_dialog_message()

    @pytest.mark.asyncio
    async def test_handle_dialog_accept(self, tab):
        """Accepting an alert dialog sends a command to the handler."""
        tab._connection_handler.dialog = {'params': {'type': 'alert'}}

        await tab.handle_dialog(accept=True)

        assert_mock_called_at_least_once(tab._connection_handler)

    @pytest.mark.asyncio
    async def test_handle_dialog_dismiss(self, tab):
        """Dismissing a confirm dialog sends a command to the handler."""
        tab._connection_handler.dialog = {'params': {'type': 'confirm'}}

        await tab.handle_dialog(accept=False)

        assert_mock_called_at_least_once(tab._connection_handler)

    @pytest.mark.asyncio
    async def test_handle_dialog_with_prompt_text(self, tab):
        """Accepting a prompt dialog with text sends a command to the handler."""
        tab._connection_handler.dialog = {'params': {'type': 'prompt'}}

        await tab.handle_dialog(accept=True, prompt_text='Test input')

        assert_mock_called_at_least_once(tab._connection_handler)

    @pytest.mark.asyncio
    async def test_handle_dialog_no_dialog(self, tab):
        """``handle_dialog`` raises ``NoDialogPresent`` without a dialog."""
        tab._connection_handler.dialog = None

        with pytest.raises(NoDialogPresent):
            await tab.handle_dialog(accept=True)


class TestTabScriptExecution:
    """Test Tab script execution methods.

    The first six tests are smoke tests: they only verify that a command was
    dispatched to the connection handler for a given script shape. They do not
    inspect the command payload or the returned value.
    """

    @pytest.mark.asyncio
    async def test_execute_script_simple(self, tab):
        """A simple ``return`` script results in a dispatched command."""
        tab._connection_handler.execute_command.return_value = {
            'result': {'result': {'value': 'Test Result'}}
        }

        await tab.execute_script('return "Test Result"')

        assert_mock_called_at_least_once(tab._connection_handler)

    @pytest.mark.asyncio
    async def test_execute_script_return_outside_function(self, tab):
        """A script with a top-level ``return`` results in a dispatched command."""
        tab._connection_handler.execute_command.return_value = {
            'result': {'result': {'value': 'Wrapped result'}}
        }

        # Top-level return: only dispatch is asserted, not how the script is wrapped.
        await tab.execute_script('return document.title')

        assert_mock_called_at_least_once(tab._connection_handler)

    @pytest.mark.asyncio
    async def test_execute_script_return_inside_function(self, tab):
        """A script whose ``return`` lives inside a function results in a dispatched command."""
        tab._connection_handler.execute_command.return_value = {
            'result': {'result': {'value': 'Function result'}}
        }

        # Return inside a function body: only dispatch is asserted.
        script = '''
        function getTitle() {
            return document.title;
        }
        getTitle();
        '''
        await tab.execute_script(script)

        assert_mock_called_at_least_once(tab._connection_handler)

    @pytest.mark.asyncio
    async def test_execute_script_no_return_statement(self, tab):
        """A script without any ``return`` results in a dispatched command."""
        tab._connection_handler.execute_command.return_value = {
            'result': {'result': {'value': None}}
        }

        await tab.execute_script('console.log("Hello World")')

        assert_mock_called_at_least_once(tab._connection_handler)

    @pytest.mark.asyncio
    async def test_execute_script_with_comments_and_strings(self, tab):
        """A script with ``return`` inside comments and strings results in a dispatched command."""
        tab._connection_handler.execute_command.return_value = {
            'result': {'result': {'value': 'Test with comments'}}
        }

        # 'return' appears in a line comment, a string and a block comment
        # before the real return statement.
        script = '''
        // This comment has return in it
        var message = "This string has return in it";
        /* This block comment also has return */
        return "actual return";
        '''
        await tab.execute_script(script)

        assert_mock_called_at_least_once(tab._connection_handler)

    @pytest.mark.asyncio
    async def test_execute_script_already_wrapped_function(self, tab):
        """A script that is already a function expression results in a dispatched command."""
        tab._connection_handler.execute_command.return_value = {
            'result': {'result': {'value': 'Already wrapped'}}
        }

        script = 'function() { console.log("test"); return "done"; }'
        await tab.execute_script(script)

        assert_mock_called_at_least_once(tab._connection_handler)

    @pytest.mark.asyncio
    async def test_execute_script_with_webelement_deprecation_warning(self, tab):
        """Passing ``element=`` warns and delegates to ``WebElement.execute_script``.

        With no optional arguments given, every forwarded keyword is ``None``.
        """
        mock_element = Mock(spec=WebElement)
        mock_element.execute_script.return_value = {'result': {'value': 'element result'}}

        with pytest.warns(DeprecationWarning, match="Passing a WebElement to Tab.execute_script\\(\\) is deprecated"):
            result = await tab.execute_script('return this.tagName', element=mock_element)

        mock_element.execute_script.assert_called_once_with(
            'return this.tagName',
            arguments=None,
            silent=None,
            return_by_value=None,
            generate_preview=None,
            user_gesture=None,
            await_promise=None,
            execution_context_id=None,
            object_group=None,
            throw_on_side_effect=None,
            unique_context_id=None,
            serialization_options=None,
        )

        assert result == {'result': {'value': 'element result'}}

    @pytest.mark.asyncio
    async def test_execute_script_with_webelement_all_parameters(self, tab):
        """Every optional argument is forwarded unchanged to the element's ``execute_script``."""
        mock_element = Mock(spec=WebElement)
        mock_element.execute_script.return_value = {'result': {'value': 'element result'}}

        arguments = [CallArgument(value="test")]
        serialization_options = SerializationOptions(serialization="deep")

        with pytest.warns(DeprecationWarning):
            result = await tab.execute_script(
                'return this.tagName',
                element=mock_element,
                arguments=arguments,
                silent=True,
                return_by_value=True,
                generate_preview=True,
                user_gesture=True,
                await_promise=True,
                execution_context_id=123,
                object_group="test_group",
                throw_on_side_effect=True,
                unique_context_id="unique_123",
                serialization_options=serialization_options,
            )

        mock_element.execute_script.assert_called_once_with(
            'return this.tagName',
            arguments=arguments,
            silent=True,
            return_by_value=True,
            generate_preview=True,
            user_gesture=True,
            await_promise=True,
            execution_context_id=123,
            object_group="test_group",
            throw_on_side_effect=True,
            unique_context_id="unique_123",
            serialization_options=serialization_options,
        )

        assert result == {'result': {'value': 'element result'}}

    @pytest.mark.parametrize('response', [
        {},
        {'result': 'not a dict'},
        {'result': {}},
        {'result': {'result': 'not a dict'}},
        {'result': {'result': {'type': 'string', 'subtype': 'error', 'className': 'ReferenceError', 'description': 'argument is not defined'}}},
        {'result': {'result': {'type': 'object', 'subtype': 'not_error', 'className': 'ReferenceError', 'description': 'argument is not defined'}}},
        {'result': {'result': {'type': 'object', 'subtype': 'error', 'className': 'TypeError', 'description': 'argument is not defined'}}},
        {'result': {'result': {'type': 'object', 'subtype': 'error', 'className': 'ReferenceError', 'description': 'some other error'}}},
        {'result': {'result': {'type': 'object', 'subtype': 'error', 'className': 'ReferenceError', 'description': ''}}},
        {'result': {'result': {'type': 'object', 'subtype': 'error', 'className': 'ReferenceError'}}},
    ])
    def test_validate_argument_error_early_returns(self, tab, response):
        """``_validate_argument_error`` does not raise for malformed or non-matching responses.

        Each case breaks one condition: a missing or non-dict level, a wrong
        ``type``, ``subtype`` or ``className``, or a missing, empty or
        unrelated ``description``.
        """
        tab._validate_argument_error(response)

    @pytest.mark.parametrize('description', [
        'argument is not defined',
        'Error: argument is not defined at line 1',
    ])
    def test_validate_argument_error_raises_on_match(self, tab, description):
        """``_validate_argument_error`` raises ``InvalidScriptWithElement`` when all conditions match.

        The second case shows the phrase is matched inside a longer description.
        """
        response = {
            'result': {
                'result': {
                    'type': 'object',
                    'subtype': 'error',
                    'className': 'ReferenceError',
                    'description': description,
                }
            }
        }
        with pytest.raises(InvalidScriptWithElement, match='Script contains "argument" but no element was provided'):
            tab._validate_argument_error(response)

    @pytest.mark.asyncio
    async def test_execute_script_triggers_validation(self, tab):
        """``execute_script`` raises ``InvalidScriptWithElement`` for an "argument is not defined" error response."""
        tab._connection_handler.execute_command.return_value = {
            'result': {
                'result': {
                    'type': 'object',
                    'subtype': 'error',
                    'className': 'ReferenceError',
                    'description': 'argument is not defined'
                }
            }
        }
        with pytest.raises(InvalidScriptWithElement, match='Script contains "argument" but no element was provided'):
            await tab.execute_script('argument.click()')


class TestTabEventCallbacks:
    """Registration and removal of event callbacks through Tab."""

    @pytest.mark.asyncio
    async def test_on_callback_registration(self, tab):
        """Tab.on returns the id handed back by the handler's register_callback."""
        expected_id = 123
        tab._connection_handler.register_callback.return_value = expected_id

        async def noop_listener(event):
            pass

        returned_id = await tab.on('Page.loadEventFired', noop_listener)

        assert returned_id == expected_id
        assert_mock_called_at_least_once(tab._connection_handler, 'register_callback')

    @pytest.mark.asyncio
    async def test_on_temporary_callback(self, tab):
        """Tab.on with temporary=True forwards the flag to register_callback."""
        expected_id = 456
        register_callback = tab._connection_handler.register_callback
        register_callback.return_value = expected_id

        async def noop_listener(event):
            pass

        returned_id = await tab.on(
            'Page.loadEventFired', noop_listener, temporary=True
        )

        assert returned_id == expected_id
        # The wrapped callback itself is opaque here, hence ANY.
        tab._connection_handler.register_callback.assert_called_with(
            'Page.loadEventFired', ANY, True
        )
        assert tab._connection_handler.register_callback.call_count >= 1

    @pytest.mark.asyncio
    async def test_remove_callback_success(self, tab):
        """remove_callback passes the id to the handler and returns its True result."""
        remove_callback = tab._connection_handler.remove_callback
        remove_callback.return_value = True

        removed = await tab.remove_callback(123)

        tab._connection_handler.remove_callback.assert_called_with(123)
        assert removed is True

    @pytest.mark.asyncio
    async def test_remove_callback_false(self, tab):
        """remove_callback returns False when the handler reports False."""
        remove_callback = tab._connection_handler.remove_callback
        remove_callback.return_value = False

        removed = await tab.remove_callback(999)

        tab._connection_handler.remove_callback.assert_called_with(999)
        assert removed is False


class TestTabFileChooser:
    """Test Tab file chooser functionality."""

    async def _assert_interception_lifecycle(self, tab, files):
        """Enter and leave ``expect_file_chooser(files)`` with its collaborators mocked.

        Args:
            tab: The Tab under test.
            files: Value passed straight to ``tab.expect_file_chooser``.

        Asserts that ``enable_page_events``, ``enable_intercept_file_chooser_dialog``
        and ``disable_intercept_file_chooser_dialog`` are each awaited exactly once.
        """
        # Set initial state to False so the enable methods get called.
        tab._page_events_enabled = False
        tab._intercept_file_chooser_dialog_enabled = False

        def mark_interception_enabled():
            # Mirror the flag change the mocked-out enable call would make.
            tab._intercept_file_chooser_dialog_enabled = True

        mock_enable_page_events = AsyncMock()
        mock_enable_intercept = AsyncMock(side_effect=mark_interception_enabled)
        mock_disable_intercept = AsyncMock()
        mock_on = AsyncMock()

        with patch.object(tab, 'enable_page_events', mock_enable_page_events), \
             patch.object(tab, 'enable_intercept_file_chooser_dialog', mock_enable_intercept), \
             patch.object(tab, 'disable_intercept_file_chooser_dialog', mock_disable_intercept), \
             patch.object(tab, 'on', mock_on):
            async with tab.expect_file_chooser(files):
                pass

        # All three are AsyncMocks, so check that they were awaited, not merely called.
        mock_enable_page_events.assert_awaited_once()
        mock_enable_intercept.assert_awaited_once()
        mock_disable_intercept.assert_awaited_once()

    async def _test_event_handler_with_files(
        self, tab, files, expected_files, backend_node_id, mode='selectMultiple'
    ):
        """Run the real file-chooser event handler and verify the command it sends.

        Args:
            tab: The Tab under test.
            files: Value passed straight to ``tab.expect_file_chooser``.
            expected_files: List expected in the command's ``params['files']``.
            backend_node_id: ``backendNodeId`` placed in the fake event and
                expected back in the command.
            mode: ``mode`` field of the fake ``Page.fileChooserOpened`` event.
        """
        from pydoll.protocol.page.events import FileChooserOpenedEvent, PageEvent

        # Mock execute_command to capture the call
        tab._execute_command = AsyncMock()

        mock_event: FileChooserOpenedEvent = {
            'method': 'Page.fileChooserOpened',
            'params': {
                'frameId': 'test-frame-id',
                'mode': mode,
                'backendNodeId': backend_node_id,
            },
        }

        # Capture the real event handler that expect_file_chooser registers.
        captured_handler = None

        async def mock_on(event_name, handler, temporary=False):
            nonlocal captured_handler
            if event_name == PageEvent.FILE_CHOOSER_OPENED:
                captured_handler = handler
            return 123

        with patch.object(tab, 'enable_page_events', AsyncMock()), \
             patch.object(tab, 'enable_intercept_file_chooser_dialog', AsyncMock()), \
             patch.object(tab, 'disable_intercept_file_chooser_dialog', AsyncMock()), \
             patch.object(tab, 'disable_page_events', AsyncMock()), \
             patch.object(tab, 'on', mock_on):
            async with tab.expect_file_chooser(files):
                # Execute the captured real handler
                assert captured_handler is not None
                await captured_handler(mock_event)

        # Verify the command was called correctly
        tab._execute_command.assert_called_once()
        call_args = tab._execute_command.call_args[0][0]
        assert call_args['method'] == 'DOM.setFileInputFiles'
        assert call_args['params']['files'] == expected_files
        assert call_args['params']['backendNodeId'] == backend_node_id

    @pytest.mark.asyncio
    async def test_expect_file_chooser_single_file(self, tab):
        """Test expect_file_chooser with single file."""
        tab._connection_handler.register_callback.return_value = 123

        await self._assert_interception_lifecycle(tab, 'test.txt')

    @pytest.mark.asyncio
    async def test_expect_file_chooser_multiple_files(self, tab):
        """Test expect_file_chooser with multiple files."""
        tab._connection_handler.register_callback.return_value = 456

        files = ['file1.txt', 'file2.txt', 'file3.txt']

        await self._assert_interception_lifecycle(tab, files)

    @pytest.mark.asyncio
    async def test_expect_file_chooser_with_path_objects(self, tab):
        """Test expect_file_chooser with Path objects."""
        tab._connection_handler.register_callback.return_value = 789

        files = [Path('file1.txt'), Path('file2.txt')]

        await self._assert_interception_lifecycle(tab, files)

    @pytest.mark.asyncio
    async def test_expect_file_chooser_event_handler_single_file(self, tab):
        """Test the real event_handler function with single file."""
        await self._test_event_handler_with_files(
            tab, 'test.txt', ['test.txt'], 12345, mode='selectSingle'
        )

    @pytest.mark.asyncio
    async def test_expect_file_chooser_event_handler_multiple_files(self, tab):
        """Test the real event_handler function with multiple files."""
        files = ['file1.txt', 'file2.pdf', 'file3.jpg']
        expected_files = ['file1.txt', 'file2.pdf', 'file3.jpg']

        await self._test_event_handler_with_files(tab, files, expected_files, 67890)

    @pytest.mark.asyncio
    async def test_expect_file_chooser_event_handler_path_objects(self, tab):
        """Test the real event_handler function with Path objects."""
        files = [Path('documents/file1.txt'), Path('images/file2.jpg')]
        expected_files = [str(file) for file in files]

        await self._test_event_handler_with_files(tab, files, expected_files, 54321)

    @pytest.mark.asyncio
    async def test_expect_file_chooser_event_handler_single_path_object(self, tab):
        """Test the real event_handler function with single Path object."""
        files = Path('documents/important.pdf')
        expected_files = [str(files)]

        await self._test_event_handler_with_files(tab, files, expected_files, 98765)

    @pytest.mark.asyncio
    async def test_expect_file_chooser_event_handler_empty_list(self, tab):
        """Test the real event_handler function with empty file list."""
        files = []
        expected_files = []

        await self._test_event_handler_with_files(tab, files, expected_files, 11111)


class TestTabCloudflareBypass:
    """Tests covering Tab's Cloudflare captcha bypass helpers."""

    @pytest.mark.asyncio
    async def test_enable_auto_solve_cloudflare_captcha(self, tab):
        """Enabling auto-solve turns on page events and stores the callback id."""
        expected_id = 999
        tab._connection_handler.register_callback.return_value = expected_id

        with patch.object(tab, 'enable_page_events', AsyncMock()) as page_events_stub:
            await tab.enable_auto_solve_cloudflare_captcha()

        page_events_stub.assert_called_once()
        assert_mock_called_at_least_once(tab._connection_handler, 'register_callback')
        assert tab._cloudflare_captcha_callback_id == expected_id

    @pytest.mark.asyncio
    async def test_enable_auto_solve_cloudflare_captcha_with_params(self, tab):
        """Enabling auto-solve with time_to_wait_captcha behaves like the default call."""
        expected_id = 888
        tab._connection_handler.register_callback.return_value = expected_id

        with patch.object(tab, 'enable_page_events', AsyncMock()) as page_events_stub:
            await tab.enable_auto_solve_cloudflare_captcha(time_to_wait_captcha=10)

        page_events_stub.assert_called_once()
        assert_mock_called_at_least_once(tab._connection_handler, 'register_callback')
        assert tab._cloudflare_captcha_callback_id == expected_id

    @pytest.mark.asyncio
    async def test_disable_auto_solve_cloudflare_captcha(self, tab):
        """Disabling auto-solve removes the previously stored callback id."""
        stored_id = 777
        tab._cloudflare_captcha_callback_id = stored_id
        tab._connection_handler.remove_callback.return_value = True

        await tab.disable_auto_solve_cloudflare_captcha()

        tab._connection_handler.remove_callback.assert_called_with(stored_id)

    @pytest.mark.asyncio
    async def test_expect_and_bypass_cloudflare_captcha(self, tab):
        """The context manager enables/disables page events and drops its callback."""
        fake_event = MagicMock()
        fake_event.wait = AsyncMock()

        expected_id = 666
        tab._connection_handler.register_callback.return_value = expected_id

        enable_stub = AsyncMock()
        disable_stub = AsyncMock()

        patch_enable = patch.object(tab, 'enable_page_events', enable_stub)
        patch_disable = patch.object(tab, 'disable_page_events', disable_stub)
        patch_event = patch('asyncio.Event', return_value=fake_event)

        with patch_enable, patch_disable, patch_event:
            async with tab.expect_and_bypass_cloudflare_captcha():
                pass

        enable_stub.assert_called_once()
        disable_stub.assert_called_once()
        assert_mock_called_at_least_once(tab._connection_handler, 'register_callback')
        tab._connection_handler.remove_callback.assert_called_with(expected_id)

    @pytest.mark.asyncio
    async def test_bypass_cloudflare_with_shadow_root_traversal(self, tab):
        """_bypass_cloudflare walks shadow root -> iframe -> body -> inner shadow -> checkbox."""
        # Build the chain of fakes from the outermost shadow root inwards.
        outer_shadow = AsyncMock()
        iframe = AsyncMock()
        body = AsyncMock()
        inner_shadow = AsyncMock()
        checkbox = AsyncMock()

        outer_shadow.query = AsyncMock(return_value=iframe)
        iframe.find = AsyncMock(return_value=body)
        body.get_shadow_root = AsyncMock(return_value=inner_shadow)
        inner_shadow.query = AsyncMock(return_value=checkbox)

        locate_shadow_root = AsyncMock(return_value=outer_shadow)

        with patch.object(tab, '_find_cloudflare_shadow_root', locate_shadow_root):
            await tab._bypass_cloudflare({})

        locate_shadow_root.assert_called_once_with(timeout=5)
        outer_shadow.query.assert_called_once()
        iframe.find.assert_called_once()
        body.get_shadow_root.assert_called_once()
        inner_shadow.query.assert_called_once()
        checkbox.click.assert_called_once()

    @pytest.mark.asyncio
    async def test_bypass_cloudflare_no_shadow_root_found(self, tab):
        """_bypass_cloudflare must not propagate a WaitElementTimeout from the lookup."""
        locate_shadow_root = AsyncMock(side_effect=WaitElementTimeout('Timed out'))

        with patch.object(tab, '_find_cloudflare_shadow_root', locate_shadow_root):
            # No pytest.raises here: the call is expected to return normally.
            await tab._bypass_cloudflare({})

        locate_shadow_root.assert_called_once()

    @pytest.mark.asyncio
    async def test_bypass_cloudflare_custom_selector_emits_deprecation(self, tab):
        """Passing custom_selector to enable_auto_solve emits a DeprecationWarning."""
        tab._connection_handler.register_callback.return_value = 111

        patch_enable = patch.object(tab, 'enable_page_events', AsyncMock())
        expect_warning = pytest.warns(
            DeprecationWarning, match='custom_selector is deprecated'
        )

        with patch_enable, expect_warning:
            await tab.enable_auto_solve_cloudflare_captcha(
                custom_selector=(By.ID, 'custom-captcha'),
            )

    @pytest.mark.asyncio
    async def test_time_before_click_emits_deprecation(self, tab):
        """Passing time_before_click to enable_auto_solve emits a DeprecationWarning."""
        tab._connection_handler.register_callback.return_value = 112

        patch_enable = patch.object(tab, 'enable_page_events', AsyncMock())
        expect_warning = pytest.warns(
            DeprecationWarning, match='time_before_click is deprecated'
        )

        with patch_enable, expect_warning:
            await tab.enable_auto_solve_cloudflare_captcha(time_before_click=3)

    @pytest.mark.asyncio
    async def test_expect_bypass_time_before_click_emits_deprecation(self, tab):
        """expect_and_bypass with time_before_click emits a DeprecationWarning."""
        fake_event = MagicMock()
        fake_event.wait = AsyncMock()

        tab._connection_handler.register_callback.return_value = 223

        patch_enable = patch.object(tab, 'enable_page_events', AsyncMock())
        patch_disable = patch.object(tab, 'disable_page_events', AsyncMock())
        patch_event = patch('asyncio.Event', return_value=fake_event)
        expect_warning = pytest.warns(
            DeprecationWarning, match='time_before_click is deprecated'
        )

        with patch_enable, patch_disable, patch_event, expect_warning:
            async with tab.expect_and_bypass_cloudflare_captcha(time_before_click=2):
                pass

    @pytest.mark.asyncio
    async def test_expect_bypass_custom_selector_emits_deprecation(self, tab):
        """expect_and_bypass with custom_selector emits a DeprecationWarning."""
        fake_event = MagicMock()
        fake_event.wait = AsyncMock()

        tab._connection_handler.register_callback.return_value = 222

        patch_enable = patch.object(tab, 'enable_page_events', AsyncMock())
        patch_disable = patch.object(tab, 'disable_page_events', AsyncMock())
        patch_event = patch('asyncio.Event', return_value=fake_event)
        expect_warning = pytest.warns(
            DeprecationWarning, match='custom_selector is deprecated'
        )

        with patch_enable, patch_disable, patch_event, expect_warning:
            async with tab.expect_and_bypass_cloudflare_captcha(
                custom_selector=(By.ID, 'old-sel'),
            ):
                pass

    @pytest.mark.asyncio
    async def test_find_cloudflare_shadow_root_polls_until_found(self, tab):
        """_find_cloudflare_shadow_root keeps polling until a Cloudflare shadow root shows up."""

        class FakeShadowRoot:
            """Minimal stand-in exposing an awaitable ``inner_html`` property."""

            def __init__(self, markup):
                self._markup = markup

            @property
            async def inner_html(self):
                return self._markup

        unrelated_root = FakeShadowRoot('<div>other content</div>')
        cloudflare_root = FakeShadowRoot(
            '<iframe src="https://challenges.cloudflare.com/cdn-cgi/"></iframe>'
        )

        polls = 0

        async def fake_find_shadow_roots(deep=False):
            # First poll: only the unrelated root; later polls include the CF one.
            nonlocal polls
            polls += 1
            if polls > 1:
                return [unrelated_root, cloudflare_root]
            return [unrelated_root]

        patch_find = patch.object(
            tab, 'find_shadow_roots', side_effect=fake_find_shadow_roots
        )
        patch_sleep = patch('asyncio.sleep', AsyncMock())

        with patch_find, patch_sleep:
            found = await tab._find_cloudflare_shadow_root(timeout=10)

        assert found is cloudflare_root
        assert polls == 2

    @pytest.mark.asyncio
    async def test_find_cloudflare_shadow_root_timeout(self, tab):
        """_find_cloudflare_shadow_root raises WaitElementTimeout once the clock passes the timeout."""

        class FakeShadowRoot:
            """Shadow root whose content never looks like a Cloudflare challenge."""

            @property
            async def inner_html(self):
                return '<div>other content</div>'

        unrelated_root = FakeShadowRoot()
        find_stub = AsyncMock(return_value=[unrelated_root])

        # Fake clock: the final reading jumps far beyond the 5 second timeout.
        clock_readings = iter([0, 0.5, 1.0, 100.0])

        def fake_time():
            return next(clock_readings)

        fake_loop = MagicMock()
        fake_loop.time = fake_time

        patch_find = patch.object(tab, 'find_shadow_roots', find_stub)
        patch_loop = patch('asyncio.get_event_loop', return_value=fake_loop)
        patch_sleep = patch('asyncio.sleep', AsyncMock())

        with patch_find, patch_loop, patch_sleep:
            with pytest.raises(WaitElementTimeout, match='Timed out'):
                await tab._find_cloudflare_shadow_root(timeout=5)


class TestTabDownload:
    """Tests for Tab.expect_download context manager."""

    @staticmethod
    def _will_begin_event(guid, url, suggested_filename):
        """Build a DOWNLOAD_WILL_BEGIN event payload for frame 'frame-1'."""
        return {
            'method': PageEvent.DOWNLOAD_WILL_BEGIN,
            'params': {
                'frameId': 'frame-1',
                'guid': guid,
                'url': url,
                'suggestedFilename': suggested_filename,
            },
        }

    @staticmethod
    def _completed_progress_event(guid, size, file_path=None):
        """Build a 'completed' DOWNLOAD_PROGRESS payload; filePath is added only when given."""
        params = {
            'guid': guid,
            'totalBytes': size,
            'receivedBytes': size,
            'state': 'completed',
        }
        if file_path is not None:
            params['filePath'] = file_path
        return {'method': PageEvent.DOWNLOAD_PROGRESS, 'params': params}

    @staticmethod
    def _recording_on(will_begin_id, progress_id):
        """Return ``(handlers, fake_on)``; fake_on stores each handler by event name."""
        handlers = {}

        async def fake_on(event_name, handler, temporary=False):
            handlers[event_name] = handler
            if event_name == PageEvent.DOWNLOAD_WILL_BEGIN:
                return will_begin_id
            return progress_id

        return handlers, fake_on

    @pytest.mark.asyncio
    async def test_expect_download_keeps_file_when_path_provided(self, tab, tmp_path):
        """With keep_file_at set, the download resolves to the suggested filename in that directory."""
        download_dir = tmp_path / "dl"
        tab._browser.set_download_behavior = AsyncMock()

        # Capture the registered callbacks so the test can fire them by hand.
        handlers, fake_on = self._recording_on(100, 101)

        with patch.object(tab, 'on', fake_on):
            async with tab.expect_download(keep_file_at=str(download_dir)) as download:
                await handlers[PageEvent.DOWNLOAD_WILL_BEGIN](
                    self._will_begin_event(
                        'guid-1', 'https://example.com/file.txt', 'file.txt'
                    )
                )
                # Completed without filePath (fallback to the suggested name).
                await handlers[PageEvent.DOWNLOAD_PROGRESS](
                    self._completed_progress_event('guid-1', 10)
                )

                # Materialize the expected file so it can be read back.
                expected_path = download_dir / 'file.txt'
                expected_path.parent.mkdir(parents=True, exist_ok=True)
                expected_path.write_bytes(b'content')

                payload = await download.read_bytes()
                assert payload == b'content'
                assert str(download.file_path).endswith('file.txt')

        # Ensure behavior reset called
        tab._browser.set_download_behavior.assert_awaited()

    @pytest.mark.asyncio
    async def test_expect_download_timeout_raises(self, tab, tmp_path):
        """A download that begins but never completes raises DownloadTimeout."""
        tab._browser.set_download_behavior = AsyncMock()

        handlers, fake_on = self._recording_on(200, 201)

        with patch.object(tab, 'on', fake_on):
            with pytest.raises(DownloadTimeout):
                async with tab.expect_download(keep_file_at=str(tmp_path), timeout=0.01):
                    # Fire willBegin only; the completed event is never sent.
                    await handlers[PageEvent.DOWNLOAD_WILL_BEGIN](
                        self._will_begin_event(
                            'guid-2', 'https://example.com/slow.bin', 'slow.bin'
                        )
                    )
                    await asyncio.sleep(0.02)

    @pytest.mark.asyncio
    async def test_expect_download_cleans_temp_directory(self, tab, tmp_path):
        """With keep_file_at=None the downloaded file no longer exists after the context exits."""
        tab._browser.set_download_behavior = AsyncMock()
        handlers, fake_on = self._recording_on(300, 301)

        with patch.object(tab, 'on', fake_on):
            # keep_file_at=None makes expect_download pick its own directory.
            async with tab.expect_download(keep_file_at=None) as download:
                await handlers[PageEvent.DOWNLOAD_WILL_BEGIN](
                    self._will_begin_event(
                        'guid-3', 'https://example.com/tmp.txt', 'tmp.txt'
                    )
                )
                await handlers[PageEvent.DOWNLOAD_PROGRESS](
                    self._completed_progress_event('guid-3', 3)
                )

                # Create the expected file inside the dynamically chosen dir
                assert download.file_path is not None
                file_path = Path(download.file_path)
                file_path.parent.mkdir(parents=True, exist_ok=True)
                file_path.write_bytes(b'abc')

                encoded = await download.read_base64()
                assert encoded == base64.b64encode(b'abc').decode('ascii')

            # The directory name is random, so only check that the file is gone.
            assert not file_path.exists()

    @pytest.mark.asyncio
    async def test_expect_download_ignores_progress_with_different_guid(self, tab, tmp_path):
        """Progress events for another guid leave the tracked download unfinished."""
        tab._browser.set_download_behavior = AsyncMock()

        handlers, fake_on = self._recording_on(400, 401)

        with patch.object(tab, 'on', fake_on):
            async with tab.expect_download(keep_file_at=str(tmp_path)) as download:
                await handlers[PageEvent.DOWNLOAD_WILL_BEGIN](
                    self._will_begin_event(
                        'guid-x', 'https://example.com/file.bin', 'file.bin'
                    )
                )

                # Wrong guid should be ignored and not mark as done
                await handlers[PageEvent.DOWNLOAD_PROGRESS](
                    self._completed_progress_event('wrong-guid', 1)
                )

                # Still not finished
                assert download.file_path is None

                # Correct guid completes
                await handlers[PageEvent.DOWNLOAD_PROGRESS](
                    self._completed_progress_event(
                        'guid-x', 10, file_path=str(tmp_path / 'file.bin')
                    )
                )

                await download.wait_finished()

    @pytest.mark.asyncio
    async def test_expect_download_page_events_auto_enable_disable(self, tab, tmp_path):
        """When page events are disabled, expect_download should enable and then disable them."""
        tab._browser.set_download_behavior = AsyncMock()
        tab._page_events_enabled = False

        enable_page_events = AsyncMock()
        disable_page_events = AsyncMock()

        handlers, fake_on = self._recording_on(500, 501)

        patch_enable = patch.object(tab, 'enable_page_events', enable_page_events)
        patch_disable = patch.object(tab, 'disable_page_events', disable_page_events)
        patch_on = patch.object(tab, 'on', fake_on)

        with patch_enable, patch_disable, patch_on:
            async with tab.expect_download(keep_file_at=str(tmp_path)):
                await handlers[PageEvent.DOWNLOAD_WILL_BEGIN](
                    self._will_begin_event(
                        'guid-y', 'https://example.com/auto.bin', 'auto.bin'
                    )
                )
                await handlers[PageEvent.DOWNLOAD_PROGRESS](
                    self._completed_progress_event(
                        'guid-y', 2, file_path=str(tmp_path / 'auto.bin')
                    )
                )

        enable_page_events.assert_awaited_once()
        disable_page_events.assert_awaited_once()

    @pytest.mark.asyncio
    async def test_expect_download_keeps_page_events_enabled_when_already_enabled(self, tab, tmp_path):
        """When page events already enabled, expect_download should not disable them on exit."""
        tab._browser.set_download_behavior = AsyncMock()
        tab._page_events_enabled = True

        enable_page_events = AsyncMock()
        disable_page_events = AsyncMock()

        handlers, fake_on = self._recording_on(600, 601)

        patch_enable = patch.object(tab, 'enable_page_events', enable_page_events)
        patch_disable = patch.object(tab, 'disable_page_events', disable_page_events)
        patch_on = patch.object(tab, 'on', fake_on)

        with patch_enable, patch_disable, patch_on:
            async with tab.expect_download(keep_file_at=str(tmp_path)):
                await handlers[PageEvent.DOWNLOAD_WILL_BEGIN](
                    self._will_begin_event(
                        'guid-z', 'https://example.com/enabled.bin', 'enabled.bin'
                    )
                )
                await handlers[PageEvent.DOWNLOAD_PROGRESS](
                    self._completed_progress_event(
                        'guid-z', 2, file_path=str(tmp_path / 'enabled.bin')
                    )
                )

        enable_page_events.assert_not_awaited()
        disable_page_events.assert_not_awaited()


class TestTabFrameHandling:
    """Exercise ``Tab.get_frame``, which every test expects to emit a DeprecationWarning."""

    @staticmethod
    def _iframe_element(src, object_id=None):
        """Build a MagicMock that poses as an ``<iframe>`` element.

        Args:
            src: Value returned by the mock's ``get_attribute``.
            object_id: When given, assigned to ``_object_id``; otherwise the
                attribute is left as MagicMock's auto-generated child.
        """
        element = MagicMock()
        element.tag_name = 'iframe'
        element.get_attribute.return_value = src
        if object_id is not None:
            element._object_id = object_id
        return element

    @pytest.mark.asyncio
    async def test_get_frame_success(self, tab, mock_browser):
        """get_frame returns a Tab when a browser target matches the iframe URL."""
        iframe_url = 'https://example.com/iframe'
        iframe = self._iframe_element(iframe_url, object_id='iframe-object-id')
        mock_browser.get_targets = AsyncMock(
            return_value=[{'targetId': 'iframe-target-id', 'url': iframe_url}]
        )

        with pytest.warns(DeprecationWarning):
            frame = await tab.get_frame(iframe)

        assert isinstance(frame, Tab)
        mock_browser.get_targets.assert_called_once()

    @pytest.mark.asyncio
    async def test_get_frame_uses_cache_on_subsequent_calls(self, tab, mock_browser):
        """Two get_frame calls for the same iframe yield the same cached Tab."""
        frame_url = 'https://example.com/iframe'
        iframe = self._iframe_element(frame_url)
        mock_browser.get_targets = AsyncMock(
            return_value=[{'targetId': 'iframe-target-id', 'url': frame_url, 'type': 'page'}]
        )
        # Start from an empty registry so the first call has to populate it.
        tab._browser._tabs_opened = {}

        resolved = []
        with patch('pydoll.browser.tab.ConnectionHandler', autospec=True):
            for _ in range(2):
                with pytest.warns(DeprecationWarning):
                    resolved.append(await tab.get_frame(iframe))

        first, second = resolved
        assert isinstance(first, Tab)
        assert first is second
        assert tab._browser._tabs_opened['iframe-target-id'] is first

    @pytest.mark.asyncio
    async def test_get_frame_not_iframe(self, tab):
        """get_frame raises NotAnIFrame for an element whose tag is not iframe."""
        not_an_iframe = MagicMock()
        not_an_iframe.tag_name = 'div'

        with pytest.warns(DeprecationWarning), pytest.raises(NotAnIFrame):
            await tab.get_frame(not_an_iframe)

    @pytest.mark.asyncio
    async def test_get_frame_no_frame_id(self, tab, mock_browser):
        """get_frame raises IFrameNotFound when the browser reports no targets."""
        iframe = self._iframe_element(
            'https://example.com/iframe', object_id='iframe-object-id'
        )
        mock_browser.get_targets = AsyncMock(return_value=[])

        with pytest.warns(DeprecationWarning), pytest.raises(IFrameNotFound):
            await tab.get_frame(iframe)


class TestTabUtilityMethods:
    """Test Tab utility and helper methods."""

    @staticmethod
    async def _fire_immediately(event_name, callback, temporary=False):
        """Fake ``register_callback`` that invokes ``callback`` straight away.

        Installed as an ``AsyncMock`` side effect so the code under test
        receives its awaited event during registration. Returns 1 as a dummy
        callback id.
        """
        callback({'method': event_name, 'params': {}})
        return 1

    @pytest.mark.asyncio
    async def test_bring_to_front(self, tab):
        """Test bringing the tab to front sends the correct command."""
        with patch.object(tab, '_execute_command', AsyncMock()) as mock_execute:
            await tab.bring_to_front()

            mock_execute.assert_called_once()
            command = mock_execute.call_args[0][0]
            assert command['method'] == 'Page.bringToFront'

    @pytest.mark.asyncio
    async def test_close(self, tab, mock_browser):
        """Test closing the tab sends exactly one Page.close command."""
        with patch.object(tab, '_execute_command', AsyncMock()) as mock_execute:
            await tab.close()

            mock_execute.assert_called_once()
            # Check the command itself, not just that something was sent,
            # mirroring test_bring_to_front.
            command = mock_execute.call_args[0][0]
            assert command['method'] == 'Page.close'

    @pytest.mark.asyncio
    async def test_wait_page_load_complete(self, tab):
        """Test _wait_page_load waits for LOAD_EVENT_FIRED via CDP events."""
        tab._connection_handler.execute_command.return_value = {'result': {}}
        tab._connection_handler.register_callback = AsyncMock(
            side_effect=self._fire_immediately
        )

        async with tab._wait_page_load():
            pass

        tab._connection_handler.register_callback.assert_called_once()
        call_args = tab._connection_handler.register_callback.call_args
        assert call_args[0][0] == PageEvent.LOAD_EVENT_FIRED

    @pytest.mark.asyncio
    async def test_wait_page_load_interactive(self, tab):
        """Test _wait_page_load waits for DOM_CONTENT_EVENT_FIRED when
        page_load_state is INTERACTIVE."""
        tab._browser.options.page_load_state = PageLoadState.INTERACTIVE
        tab._connection_handler.execute_command.return_value = {'result': {}}
        tab._connection_handler.register_callback = AsyncMock(
            side_effect=self._fire_immediately
        )

        async with tab._wait_page_load():
            pass

        tab._connection_handler.register_callback.assert_called_once()
        call_args = tab._connection_handler.register_callback.call_args
        assert call_args[0][0] == PageEvent.DOM_CONTENT_EVENT_FIRED

    @pytest.mark.asyncio
    async def test_wait_page_load_timeout(self, tab):
        """Test _wait_page_load raises PageLoadTimeout on timeout."""
        tab._connection_handler.execute_command.return_value = {'result': {}}
        # The callback is registered but never fired, so the wait must time out.
        tab._connection_handler.register_callback = AsyncMock(return_value=1)

        with pytest.raises(PageLoadTimeout):
            async with tab._wait_page_load(timeout=0.1):
                pass

    @pytest.mark.asyncio
    async def test_wait_page_load_cleans_up_page_events(self, tab):
        """Test _wait_page_load enables/disables page events when needed."""
        assert tab._page_events_enabled is False
        tab._connection_handler.execute_command.return_value = {'result': {}}
        tab._connection_handler.register_callback = AsyncMock(
            side_effect=self._fire_immediately
        )

        async with tab._wait_page_load():
            assert tab._page_events_enabled is True

        assert tab._page_events_enabled is False

    @pytest.mark.asyncio
    async def test_refresh_if_url_not_changed_same_url(self, tab):
        """Test _refresh_if_url_not_changed with same URL."""
        tab._connection_handler.execute_command.side_effect = [
            {'result': {'result': {'value': 'https://example.com'}}},  # current_url call
            {'result': {}},  # Page.enable
            {'result': {}},  # refresh call
            {'result': {}},  # Page.disable
        ]
        tab._connection_handler.register_callback = AsyncMock(
            side_effect=self._fire_immediately
        )

        result = await tab._refresh_if_url_not_changed('https://example.com')

        assert result is True
        assert tab._connection_handler.execute_command.call_count == 4

    @pytest.mark.asyncio
    async def test_refresh_if_url_not_changed_different_url(self, tab):
        """Test _refresh_if_url_not_changed with different URL."""
        tab._connection_handler.execute_command.return_value = {
            'result': {'result': {'value': 'https://different.com'}}
        }

        result = await tab._refresh_if_url_not_changed('https://example.com')

        assert result is False
        assert_mock_called_at_least_once(tab._connection_handler)


class TestTabRequestManagement:
    """Check the Fetch commands built by continue/fail/fulfill_request on Tab."""

    @staticmethod
    def _last_command(tab):
        """Assert a command was sent and return the most recent one.

        The command is the first positional argument of the last recorded
        ``execute_command`` call on the tab's connection handler.
        """
        assert_mock_called_at_least_once(tab._connection_handler)
        recorded_calls = tab._connection_handler.execute_command.call_args_list
        return recorded_calls[-1].args[0]

    @staticmethod
    def _b64(text):
        """Return ``text`` (UTF-8) base64-encoded as a str."""
        return base64.b64encode(text.encode('utf-8')).decode('utf-8')

    @pytest.mark.asyncio
    async def test_continue_request(self, tab):
        """continue_request with only a request id leaves every optional param unset."""
        request_id = 'test_request_123'

        await tab.continue_request(request_id)

        command = self._last_command(tab)
        assert command['method'] == 'Fetch.continueRequest'
        params = command['params']
        assert params['requestId'] == request_id
        for optional in ('url', 'method', 'postData', 'headers', 'interceptResponse'):
            assert params.get(optional) is None

    @pytest.mark.asyncio
    async def test_fail_request(self, tab):
        """fail_request forwards the request id and error reason."""
        from pydoll.protocol.network.types import ErrorReason

        request_id = 'test_request_456'
        reason = ErrorReason.FAILED

        await tab.fail_request(request_id, reason)

        command = self._last_command(tab)
        assert command['method'] == 'Fetch.failRequest'
        assert command['params']['requestId'] == request_id
        assert command['params']['errorReason'] == reason

    @pytest.mark.asyncio
    async def test_fulfill_request(self, tab):
        """fulfill_request with id and status only leaves optional params unset."""
        request_id = 'test_request_789'
        status = 200

        await tab.fulfill_request(request_id, status)

        command = self._last_command(tab)
        assert command['method'] == 'Fetch.fulfillRequest'
        params = command['params']
        assert params['requestId'] == request_id
        assert params['responseCode'] == status
        for optional in ('responseHeaders', 'body', 'responsePhrase'):
            assert params.get(optional) is None

    @pytest.mark.asyncio
    async def test_continue_request_with_all_params(self, tab):
        """continue_request maps every keyword argument onto its CDP param."""
        from pydoll.protocol.network.types import RequestMethod

        expected = {
            'requestId': 'test_request_456',
            'url': 'https://modified-example.com',
            'method': RequestMethod.POST,
            'postData': 'modified_data=test',
            'headers': [{'name': 'Authorization', 'value': 'Bearer token123'}],
            'interceptResponse': True,
        }

        await tab.continue_request(
            request_id=expected['requestId'],
            url=expected['url'],
            method=expected['method'],
            post_data=expected['postData'],
            headers=expected['headers'],
            intercept_response=expected['interceptResponse'],
        )

        params = self._last_command(tab)['params']
        for key, value in expected.items():
            assert params[key] == value

    @pytest.mark.asyncio
    async def test_continue_request_with_different_id(self, tab):
        """continue_request passes an arbitrary request id through unchanged."""
        request_id = 'another_request_id_xyz'

        await tab.continue_request(request_id)

        assert self._last_command(tab)['params']['requestId'] == request_id

    @pytest.mark.asyncio
    async def test_fail_request_with_different_error(self, tab):
        """fail_request passes a non-default error reason through unchanged."""
        from pydoll.protocol.network.types import ErrorReason

        reason = ErrorReason.ABORTED

        await tab.fail_request('test_request_error', reason)

        assert self._last_command(tab)['params']['errorReason'] == reason

    @pytest.mark.asyncio
    async def test_fulfill_request_with_all_params(self, tab):
        """fulfill_request maps every keyword argument onto its CDP param."""
        expected = {
            'requestId': 'test_request_complete',
            'responseCode': 200,
            'responseHeaders': [{'name': 'Content-Type', 'value': 'application/json'}],
            'body': self._b64('{"status": "success", "data": "test"}'),
            'responsePhrase': 'OK',
        }

        await tab.fulfill_request(
            request_id=expected['requestId'],
            response_code=expected['responseCode'],
            response_headers=expected['responseHeaders'],
            body=expected['body'],
            response_phrase=expected['responsePhrase'],
        )

        params = self._last_command(tab)['params']
        for key, value in expected.items():
            assert params[key] == value

    @pytest.mark.asyncio
    async def test_fulfill_request_with_different_status_code(self, tab):
        """fulfill_request accepts positional args and a non-200 status."""
        status = 404
        headers = [{'name': 'Content-Type', 'value': 'text/html'}]
        encoded_body = self._b64('<html><body><h1>404 - Not Found</h1></body></html>')

        await tab.fulfill_request('test_request_404', status, headers, encoded_body)

        params = self._last_command(tab)['params']
        assert params['responseCode'] == status
        assert params['responseHeaders'] == headers
        assert params['body'] == encoded_body

    @pytest.mark.asyncio
    async def test_fulfill_request_empty_headers(self, tab):
        """fulfill_request keeps an empty header list as an empty list."""
        headers = []
        encoded_body = self._b64('{"message": "success"}')

        await tab.fulfill_request('test_request_empty_headers', 200, headers, encoded_body)

        params = self._last_command(tab)['params']
        assert params['responseHeaders'] == []
        assert params['body'] == encoded_body


class TestTabEdgeCases:
    """Error paths and miscellaneous attribute access on Tab."""

    @pytest.mark.asyncio
    async def test_take_screenshot_invalid_extension(self, tab):
        """take_screenshot rejects a path with a ``.txt`` extension."""
        unsupported_path = 'screenshot.txt'
        with pytest.raises(InvalidFileExtension):
            await tab.take_screenshot(unsupported_path)

    @pytest.mark.asyncio
    async def test_print_to_pdf_with_invalid_path(self, tab):
        """print_to_pdf raises ValueError when no path is given and as_base64=False."""
        # Canned base64 payload returned by the mocked command.
        pdf_payload = 'JVBERi0xLjQKJdPr6eEKMSAwIG9iago8PAovVHlwZSAvQ2F0YWxvZwo+PgplbmRvYmoKdHJhaWxlcgo8PAovUm9vdCAxIDAgUgo+PgpzdGFydHhyZWYKMTgKJSVFT0Y='
        tab._connection_handler.execute_command.return_value = {
            'result': {'data': pdf_payload}
        }

        expected_message = 'path is required when as_base64=False'
        with pytest.raises(ValueError, match=expected_message):
            await tab.print_to_pdf(as_base64=False)

    @pytest.mark.asyncio
    async def test_network_logs_property(self, tab):
        """network_logs set on the connection handler can be read back.

        NOTE(review): this only round-trips a value through
        ``tab._connection_handler``; no Tab method or property is called.
        """
        stored = [{'request': {'url': 'https://example.com'}}]
        tab._connection_handler.network_logs = stored

        assert tab._connection_handler.network_logs == stored

    @pytest.mark.asyncio
    async def test_dialog_property(self, tab):
        """dialog set on the connection handler can be read back.

        NOTE(review): this only round-trips a value through
        ``tab._connection_handler``; no Tab method or property is called.
        """
        stored = {'type': 'alert', 'message': 'Test message'}
        tab._connection_handler.dialog = stored

        assert tab._connection_handler.dialog == stored


class TestTabNetworkMethods:
    """Cover get_network_response_body and get_network_logs on Tab."""

    @staticmethod
    def _event(method, request_id, url):
        """Build one network log entry carrying a request URL and a request id."""
        return {
            'method': method,
            'params': {
                'request': {'url': url},
                'requestId': request_id,
            },
        }

    @pytest.mark.asyncio
    async def test_get_network_response_body_success(self, tab):
        """With network events enabled, the body from the command result is returned."""
        body = '<html><body>Response content</body></html>'
        tab._network_events_enabled = True
        tab._connection_handler.execute_command.return_value = {'result': {'body': body}}

        fetched = await tab.get_network_response_body('test_request_123')

        assert fetched == body
        assert_mock_called_at_least_once(tab._connection_handler)

    @pytest.mark.asyncio
    async def test_get_network_response_body_events_not_enabled(self, tab):
        """With network events disabled, the call raises and sends no command."""
        tab._network_events_enabled = False

        with pytest.raises(NetworkEventsNotEnabled) as exc_info:
            await tab.get_network_response_body('test_request_123')

        message = str(exc_info.value)
        assert message == 'Network events must be enabled to get response body'
        tab._connection_handler.execute_command.assert_not_called()

    @pytest.mark.asyncio
    async def test_get_network_logs_success_no_filter(self, tab):
        """Without a filter, every stored log entry is returned."""
        tab._network_events_enabled = True
        stored_logs = [
            self._event(
                'Network.requestWillBeSent', 'req_1', 'https://example.com/api/data'
            ),
            self._event(
                'Network.responseReceived', 'req_2', 'https://example.com/static/style.css'
            ),
        ]
        tab._connection_handler.network_logs = stored_logs

        result = await tab.get_network_logs()

        assert result == stored_logs
        assert len(result) == 2

    @pytest.mark.asyncio
    async def test_get_network_logs_success_with_filter(self, tab):
        """Only entries whose request URL contains the filter text are returned."""
        tab._network_events_enabled = True
        tab._connection_handler.network_logs = [
            self._event(
                'Network.requestWillBeSent', 'req_1', 'https://example.com/api/data'
            ),
            self._event(
                'Network.responseReceived', 'req_2', 'https://example.com/static/style.css'
            ),
            self._event(
                'Network.requestWillBeSent', 'req_3', 'https://api.example.com/users'
            ),
        ]

        result = await tab.get_network_logs(filter='api')

        # Both URLs containing 'api' are expected, in their stored order.
        matched_urls = [entry['params']['request']['url'] for entry in result]
        assert matched_urls == [
            'https://example.com/api/data',
            'https://api.example.com/users',
        ]

    @pytest.mark.asyncio
    async def test_get_network_logs_empty_filter_result(self, tab):
        """A filter that matches no URL yields an empty list."""
        tab._network_events_enabled = True
        tab._connection_handler.network_logs = [
            self._event(
                'Network.requestWillBeSent', 'req_1', 'https://example.com/static/style.css'
            ),
        ]

        result = await tab.get_network_logs(filter='nonexistent')

        assert result == []

    @pytest.mark.asyncio
    async def test_get_network_logs_events_not_enabled(self, tab):
        """With network events disabled, get_network_logs raises."""
        tab._network_events_enabled = False

        with pytest.raises(NetworkEventsNotEnabled) as exc_info:
            await tab.get_network_logs()

        message = str(exc_info.value)
        assert message == 'Network events must be enabled to get network logs'

    @pytest.mark.asyncio
    async def test_get_network_logs_missing_request_params(self, tab):
        """Entries without a request URL are skipped when filtering, not fatal."""
        tab._network_events_enabled = True
        # First entry has no 'request' key at all.
        without_request = {
            'method': 'Network.requestWillBeSent',
            'params': {'requestId': 'req_1'},
        }
        # Second entry has a 'request' object but no 'url' inside it.
        with_empty_request = {
            'method': 'Network.responseReceived',
            'params': {'request': {}, 'requestId': 'req_2'},
        }
        tab._connection_handler.network_logs = [without_request, with_empty_request]

        result = await tab.get_network_logs(filter='example')

        assert result == []


class TestTabSaveBundle:
    """Tests for Tab.save_bundle() page bundle export.

    Each async test swaps ``tab._connection_handler.execute_command`` for an
    ``AsyncMock`` whose ``side_effect`` lists the CDP replies in the order the
    test expects them to be consumed: the resource tree, the document
    content, then one reply per resource that is fetched.
    """

    @pytest.fixture(autouse=True)
    def _enable_page_events(self, tab):
        """Pre-enable page events so save_bundle skips enable/disable calls."""
        tab._page_events_enabled = True

    @staticmethod
    def _tree_response(frame_tree):
        """Wrap ``frame_tree`` in the reply shape used for the resource-tree call."""
        return {'result': {'frameTree': frame_tree}}

    @staticmethod
    def _content_response(content, base64_encoded=False):
        """Build a successful resource-content reply carrying ``content``."""
        return {'result': {'content': content, 'base64Encoded': base64_encoded}}

    @staticmethod
    def _open_bundle(zip_path):
        """Open the written bundle for reading; intended for use in a ``with`` block."""
        import zipfile

        return zipfile.ZipFile(zip_path)

    def _make_frame_tree(
        self,
        frame_id='F1',
        page_url='https://example.com/',
        resources=None,
        child_frames=None,
    ):
        """Build one frame-tree node for the mocked resource-tree reply.

        Args:
            frame_id: Value stored under ``frame.id``.
            page_url: Value stored under ``frame.url``.
            resources: Resource dicts for this frame; ``None`` becomes ``[]``.
            child_frames: Optional nested frame-tree nodes; the
                ``childFrames`` key is only added when this is non-empty.

        Returns:
            A dict with ``frame`` and ``resources`` keys, plus ``childFrames``
            when child frames were supplied.
        """
        tree = {
            'frame': {
                'id': frame_id,
                'url': page_url,
                'loaderId': 'L1',
                'domainAndRegistry': 'example.com',
                'securityOrigin': 'https://example.com',
                'mimeType': 'text/html',
                'secureContextType': 'Secure',
                'crossOriginIsolatedContextType': 'NotIsolated',
                'gatedAPIFeatures': [],
            },
            'resources': resources or [],
        }
        if child_frames:
            tree['childFrames'] = child_frames
        return tree

    def _make_resource(self, url, rtype='Stylesheet', mime='text/css',
                       failed=False, canceled=False):
        """Build one resource dict for a frame tree.

        The ``failed`` / ``canceled`` keys are only present when the matching
        argument is true.
        """
        res = {'url': url, 'type': rtype, 'mimeType': mime}
        if failed:
            res['failed'] = True
        if canceled:
            res['canceled'] = True
        return res

    @pytest.mark.asyncio
    async def test_save_bundle_invalid_extension(self, tab):
        """A target path that does not end in .zip is rejected."""
        with pytest.raises(InvalidFileExtension, match=r'\.zip'):
            await tab.save_bundle('output.tar.gz')

    @pytest.mark.asyncio
    async def test_save_bundle_separate_assets(self, tab, tmp_path):
        """Default mode writes index.html plus separate asset files."""
        css_url = 'https://example.com/style.css'
        js_url = 'https://example.com/app.js'
        frame_tree = self._make_frame_tree(resources=[
            self._make_resource(css_url, 'Stylesheet', 'text/css'),
            self._make_resource(js_url, 'Script', 'text/javascript'),
        ])
        html_content = (
            '<html><head>'
            f'<link rel="stylesheet" href="{css_url}">'
            f'<script src="{js_url}"></script>'
            '</head><body>Hello</body></html>'
        )
        tab._connection_handler.execute_command = AsyncMock(side_effect=[
            self._tree_response(frame_tree),
            self._content_response(html_content),
            self._content_response('body { color: red; }'),
            self._content_response('console.log("hi");'),
        ])

        zip_path = tmp_path / 'bundle.zip'
        await tab.save_bundle(str(zip_path))

        assert zip_path.exists()
        with self._open_bundle(zip_path) as zf:
            names = zf.namelist()
            assert 'index.html' in names
            assert any('style.css' in n for n in names)
            assert any('app.js' in n for n in names)
            index = zf.read('index.html').decode('utf-8')
            # The document must point at the local copies, not the remote URL.
            assert 'assets/' in index
            assert css_url not in index

    @pytest.mark.asyncio
    async def test_save_bundle_inline_assets(self, tab, tmp_path):
        """inline_assets=True yields a lone index.html with embedded assets."""
        css_url = 'https://example.com/style.css'
        js_url = 'https://example.com/app.js'
        img_url = 'https://example.com/logo.png'
        frame_tree = self._make_frame_tree(resources=[
            self._make_resource(css_url, 'Stylesheet', 'text/css'),
            self._make_resource(js_url, 'Script', 'text/javascript'),
            self._make_resource(img_url, 'Image', 'image/png'),
        ])
        html_content = (
            '<html><head>'
            f'<link rel="stylesheet" href="{css_url}">'
            f'<script src="{js_url}"></script>'
            '</head><body>'
            f'<img src="{img_url}">'
            '</body></html>'
        )
        img_b64 = base64.b64encode(b'\x89PNG').decode()
        tab._connection_handler.execute_command = AsyncMock(side_effect=[
            self._tree_response(frame_tree),
            self._content_response(html_content),
            self._content_response('body { color: red; }'),
            self._content_response('console.log("hi");'),
            self._content_response(img_b64, base64_encoded=True),
        ])

        zip_path = tmp_path / 'bundle.zip'
        await tab.save_bundle(str(zip_path), inline_assets=True)

        with self._open_bundle(zip_path) as zf:
            assert zf.namelist() == ['index.html']
            index = zf.read('index.html').decode('utf-8')
            assert '<style>' in index
            assert '<script>' in index
            assert 'data:image/png;base64,' in index

    @pytest.mark.asyncio
    async def test_save_bundle_skips_failed_resources(self, tab, tmp_path):
        """Resources flagged as failed are never requested."""
        frame_tree = self._make_frame_tree(resources=[
            self._make_resource('https://example.com/ok.css', 'Stylesheet', 'text/css'),
            self._make_resource('https://example.com/bad.css', 'Stylesheet', 'text/css',
                                failed=True),
        ])
        tab._connection_handler.execute_command = AsyncMock(side_effect=[
            self._tree_response(frame_tree),
            self._content_response('<html><head></head><body></body></html>'),
            self._content_response('body{}'),
        ])

        zip_path = tmp_path / 'bundle.zip'
        await tab.save_bundle(str(zip_path))

        # Only 3 calls: getResourceTree, getResourceContent(doc), getResourceContent(ok.css)
        assert tab._connection_handler.execute_command.call_count == 3

    @pytest.mark.asyncio
    async def test_save_bundle_handles_fetch_exceptions(self, tab, tmp_path):
        """An exception while fetching a resource does not abort the bundle."""
        frame_tree = self._make_frame_tree(resources=[
            self._make_resource('https://example.com/style.css', 'Stylesheet', 'text/css'),
        ])
        tab._connection_handler.execute_command = AsyncMock(side_effect=[
            self._tree_response(frame_tree),
            self._content_response('<html><body></body></html>'),
            # An exception instance in side_effect is raised by the mock.
            RuntimeError('fetch failed'),
        ])

        zip_path = tmp_path / 'bundle.zip'
        await tab.save_bundle(str(zip_path))

        with self._open_bundle(zip_path) as zf:
            names = zf.namelist()
            assert 'index.html' in names
            assert not any(n.startswith('assets/') for n in names)

    @pytest.mark.asyncio
    async def test_save_bundle_handles_cdp_error_responses(self, tab, tmp_path):
        """CDP returns {'error': ...} instead of {'result': ...} for some resources."""
        frame_tree = self._make_frame_tree(resources=[
            self._make_resource('https://example.com/style.css', 'Stylesheet', 'text/css'),
        ])
        tab._connection_handler.execute_command = AsyncMock(side_effect=[
            self._tree_response(frame_tree),
            self._content_response('<html><body></body></html>'),
            {'error': {'code': -32000, 'message': 'No resource with given URL'}},
        ])

        zip_path = tmp_path / 'bundle.zip'
        await tab.save_bundle(str(zip_path))

        with self._open_bundle(zip_path) as zf:
            names = zf.namelist()
            assert 'index.html' in names
            assert not any(n.startswith('assets/') for n in names)

    @pytest.mark.asyncio
    async def test_save_bundle_empty_resources(self, tab, tmp_path):
        """With no resources the bundle holds just the unmodified document."""
        frame_tree = self._make_frame_tree(resources=[])
        html = '<html><body>Hello</body></html>'
        tab._connection_handler.execute_command = AsyncMock(side_effect=[
            self._tree_response(frame_tree),
            self._content_response(html),
        ])

        zip_path = tmp_path / 'bundle.zip'
        await tab.save_bundle(str(zip_path))

        with self._open_bundle(zip_path) as zf:
            assert zf.namelist() == ['index.html']
            assert zf.read('index.html').decode() == html

    @pytest.mark.asyncio
    async def test_save_bundle_base64_encoded_resource(self, tab, tmp_path):
        """A base64-encoded reply is decoded before being stored as an asset."""
        img_url = 'https://example.com/image.png'
        frame_tree = self._make_frame_tree(resources=[
            self._make_resource(img_url, 'Image', 'image/png'),
        ])
        html = f'<html><body><img src="{img_url}"></body></html>'
        img_bytes = b'\x89PNG\r\n\x1a\n' + b'\x00' * 16
        img_b64 = base64.b64encode(img_bytes).decode()
        tab._connection_handler.execute_command = AsyncMock(side_effect=[
            self._tree_response(frame_tree),
            self._content_response(html),
            self._content_response(img_b64, base64_encoded=True),
        ])

        zip_path = tmp_path / 'bundle.zip'
        await tab.save_bundle(str(zip_path))

        with self._open_bundle(zip_path) as zf:
            asset_names = [n for n in zf.namelist() if n.startswith('assets/')]
            assert len(asset_names) == 1
            assert zf.read(asset_names[0]) == img_bytes

    @pytest.mark.asyncio
    async def test_save_bundle_css_url_rewriting(self, tab, tmp_path):
        """A stylesheet that references a bundled font is stored in the archive."""
        css_url = 'https://example.com/css/style.css'
        font_url = 'https://example.com/css/font.woff2'
        frame_tree = self._make_frame_tree(resources=[
            self._make_resource(css_url, 'Stylesheet', 'text/css'),
            self._make_resource(font_url, 'Font', 'font/woff2'),
        ])
        html = f'<html><head><link rel="stylesheet" href="{css_url}"></head><body></body></html>'
        font_bytes = b'woff2data'
        tab._connection_handler.execute_command = AsyncMock(side_effect=[
            self._tree_response(frame_tree),
            self._content_response(html),
            self._content_response('body { font-family: url("font.woff2"); }'),
            self._content_response(base64.b64encode(font_bytes).decode(), base64_encoded=True),
        ])

        zip_path = tmp_path / 'bundle.zip'
        await tab.save_bundle(str(zip_path))

        with self._open_bundle(zip_path) as zf:
            css_files = [n for n in zf.namelist() if n.endswith('.css')]
            assert len(css_files) == 1
            css_data = zf.read(css_files[0]).decode('utf-8')
            # CSS url() should reference the font's local filename.
            # NOTE(review): both assertions below also hold for the untouched
            # input CSS, so they do not prove the url() was rewritten. Tighten
            # them once the exact rewritten form is confirmed against
            # save_bundle's implementation.
            assert 'font.woff2' not in css_data or 'assets/' not in css_data
            assert 'url("' in css_data

    @pytest.mark.asyncio
    async def test_save_bundle_child_frames(self, tab, tmp_path):
        """Resources of nested frames are bundled alongside the parent's."""
        child_frame_tree = self._make_frame_tree(
            frame_id='F2',
            page_url='https://example.com/child.html',
            resources=[
                self._make_resource('https://example.com/child.css', 'Stylesheet', 'text/css'),
            ],
        )
        frame_tree = self._make_frame_tree(
            resources=[
                self._make_resource('https://example.com/main.css', 'Stylesheet', 'text/css'),
            ],
            child_frames=[child_frame_tree],
        )
        tab._connection_handler.execute_command = AsyncMock(side_effect=[
            self._tree_response(frame_tree),
            self._content_response('<html><body></body></html>'),
            self._content_response('body{}'),
            self._content_response('p{}'),
        ])

        zip_path = tmp_path / 'bundle.zip'
        await tab.save_bundle(str(zip_path))

        with self._open_bundle(zip_path) as zf:
            asset_names = [n for n in zf.namelist() if n.startswith('assets/')]
            assert len(asset_names) == 2

    @pytest.mark.asyncio
    async def test_save_bundle_skips_data_urls(self, tab, tmp_path):
        """Resources whose URL is a data: URI are never requested."""
        frame_tree = self._make_frame_tree(resources=[
            self._make_resource('data:image/png;base64,abc', 'Image', 'image/png'),
            self._make_resource('https://example.com/real.css', 'Stylesheet', 'text/css'),
        ])
        tab._connection_handler.execute_command = AsyncMock(side_effect=[
            self._tree_response(frame_tree),
            self._content_response('<html><body></body></html>'),
            self._content_response('body{}'),
        ])

        zip_path = tmp_path / 'bundle.zip'
        await tab.save_bundle(str(zip_path))

        # Only 3 calls: tree, doc content, real.css — data: URL was skipped
        assert tab._connection_handler.execute_command.call_count == 3

    def test_collect_frame_resources_recursive(self):
        """collect_frame_resources walks child frames after the parent frame."""
        child = {
            'frame': {'id': 'F2', 'url': 'https://example.com/child',
                      'loaderId': 'L2', 'domainAndRegistry': '', 'securityOrigin': '',
                      'mimeType': 'text/html', 'secureContextType': 'Secure',
                      'crossOriginIsolatedContextType': 'NotIsolated',
                      'gatedAPIFeatures': []},
            'resources': [
                {'url': 'https://example.com/c.css', 'type': 'Stylesheet', 'mimeType': 'text/css'},
            ],
        }
        parent = {
            'frame': {'id': 'F1', 'url': 'https://example.com/',
                      'loaderId': 'L1', 'domainAndRegistry': '', 'securityOrigin': '',
                      'mimeType': 'text/html', 'secureContextType': 'Secure',
                      'crossOriginIsolatedContextType': 'NotIsolated',
                      'gatedAPIFeatures': []},
            'resources': [
                {'url': 'https://example.com/p.css', 'type': 'Stylesheet', 'mimeType': 'text/css'},
            ],
            'childFrames': [child],
        }
        result = collect_frame_resources(parent)
        assert len(result) == 2
        # The first element of each collected item is the owning frame id.
        assert result[0][0] == 'F1'
        assert result[1][0] == 'F2'

    def test_build_asset_filename(self):
        """The filename is a zero-padded index joined to the URL's basename."""
        name = build_asset_filename(
            'https://example.com/css/style.css', 'text/css', 0
        )
        assert name == '0000_style.css'

    def test_build_asset_filename_no_extension(self):
        """A basename without an extension gets one matching the MIME type."""
        name = build_asset_filename(
            'https://example.com/api/image', 'image/png', 5
        )
        assert name == '0005_image.png'

    def test_build_asset_filename_no_path(self):
        """A URL with an empty path falls back to the 'resource' basename."""
        name = build_asset_filename(
            'https://example.com/', 'text/css', 1
        )
        assert name == '0001_resource.css'

    def test_rewrite_css_urls(self):
        """An absolute url() found in the asset map is replaced by its filename."""
        asset_map = {
            'https://example.com/fonts/bold.woff2': (
                '0001_bold.woff2', b'data', 'font/woff2', 'Font'
            ),
        }
        css = 'body { font: url("https://example.com/fonts/bold.woff2"); }'
        result = rewrite_css_urls(
            css, 'https://example.com/css/style.css', asset_map
        )
        assert '0001_bold.woff2' in result

    def test_rewrite_css_urls_relative(self):
        """A relative url() is resolved against the stylesheet URL before lookup."""
        asset_map = {
            'https://example.com/css/bg.png': (
                '0002_bg.png', b'data', 'image/png', 'Image'
            ),
        }
        css = 'div { background: url("bg.png"); }'
        result = rewrite_css_urls(
            css, 'https://example.com/css/style.css', asset_map
        )
        assert '0002_bg.png' in result

    def test_rewrite_css_urls_skips_data_uris(self):
        """data: URIs inside url() are left in the output."""
        css = 'div { background: url("data:image/png;base64,abc"); }'
        result = rewrite_css_urls(css, 'https://example.com/style.css', {})
        assert 'data:image/png;base64,abc' in result

    @pytest.mark.asyncio
    async def test_save_bundle_js_fallback_when_resource_content_fails(self, tab, tmp_path):
        """When getResourceContent fails for the document, fall back to JS."""
        frame_tree = self._make_frame_tree(resources=[])
        html = '<html><body>Fallback</body></html>'

        # Replies keyed by 1-based call number; any later call receives {}.
        replies = {
            # getResourceTree succeeds
            1: self._tree_response(frame_tree),
            # getResourceContent for document fails (no 'result' key)
            2: {'error': {'code': -32000, 'message': 'No resource'}},
            # execute_script fallback
            3: {'result': {'result': {'value': html}}},
        }
        call_count = 0

        async def side_effect(*args, **kwargs):
            nonlocal call_count
            call_count += 1
            return replies.get(call_count, {})

        tab._connection_handler.execute_command = AsyncMock(side_effect=side_effect)

        zip_path = tmp_path / 'bundle.zip'
        await tab.save_bundle(str(zip_path))

        with self._open_bundle(zip_path) as zf:
            assert zf.read('index.html').decode() == html

================================================
FILE: tests/test_browser/test_har_recorder.py
================================================
"""Tests for pydoll.browser.requests.har_recorder module."""

import json
import pytest
import pytest_asyncio
from pathlib import Path
from unittest.mock import AsyncMock, Mock, patch

from pydoll.browser.requests.har_recorder import HarRecorder, HarCapture
from pydoll.browser.requests.request import Request
from pydoll.protocol.network.events import NetworkEvent


@pytest_asyncio.fixture
async def mock_tab():
    """Provide a Mock standing in for a Tab, with its async methods stubbed."""
    stub = Mock()
    stub.network_events_enabled = False

    # Awaitable stubs with no configured behaviour.
    for method_name in (
        'enable_network_events',
        'disable_network_events',
        'remove_callback',
        'clear_callbacks',
    ):
        setattr(stub, method_name, AsyncMock())

    # Each registration returns the current length of on.call_args_list.
    stub.on = AsyncMock(side_effect=lambda *a, **kw: len(stub.on.call_args_list))

    # Canned reply for any command issued through the tab: an empty, non-base64 body.
    empty_body_reply = {'result': {'body': '', 'base64Encoded': False}}
    stub._execute_command = AsyncMock(return_value=empty_body_reply)
    return stub


@pytest_asyncio.fixture
async def recorder(mock_tab):
    """Provide a HarRecorder built on top of the mocked tab."""
    har_recorder = HarRecorder(mock_tab)
    return har_recorder


@pytest_asyncio.fixture
async def request_instance(mock_tab):
    """Provide a Request built on top of the mocked tab."""
    request = Request(mock_tab)
    return request


def _make_request_will_be_sent_event(
    request_id='req-1',
    url='https://example.com',
    method='GET',
    wall_time=1700000000.0,
    resource_type='Document',
    redirect_response=None,
):
    """Build a requestWillBeSent CDP event dict.

    ``redirectResponse`` is only added to the params when a truthy
    ``redirect_response`` is supplied.
    """
    request = {
        'url': url,
        'method': method,
        'headers': {'User-Agent': 'TestBrowser'},
    }
    params = {
        'requestId': request_id,
        'request': request,
        'wallTime': wall_time,
        'timestamp': 12345.0,
        'type': resource_type,
        'loaderId': 'loader-1',
        'documentURL': url,
        'initiator': {'type': 'other'},
        'redirectHasExtraInfo': False,
    }
    if redirect_response:
        params['redirectResponse'] = redirect_response
    return {'method': NetworkEvent.REQUEST_WILL_BE_SENT, 'params': params}


def _make_request_extra_info_event(request_id='req-1'):
    """Build a requestWillBeSentExtraInfo CDP event dict for ``request_id``."""
    params = {
        'requestId': request_id,
        'headers': {'Cookie': 'session=abc123'},
        'associatedCookies': [],
        'connectTiming': {'requestTime': 12345.0},
    }
    return {
        'method': NetworkEvent.REQUEST_WILL_BE_SENT_EXTRA_INFO,
        'params': params,
    }


def _make_response_received_event(
    request_id='req-1',
    status=200,
    status_text='OK',
    mime_type='text/html',
    protocol='h2',
    timing=None,
    remote_ip='93.184.216.34',
):
    """Build a responseReceived CDP event dict.

    ``protocol``, ``timing`` and ``remoteIPAddress`` are only included in the
    response when the matching argument is truthy.
    """
    response = {
        'url': 'https://example.com',
        'status': status,
        'statusText': status_text,
        'headers': {'Content-Type': 'text/html'},
        'mimeType': mime_type,
        'charset': 'utf-8',
        'connectionReused': False,
        'connectionId': 42,
        'encodedDataLength': 1234,
        'securityState': 'secure',
    }

    # Optional fields, appended in a fixed order when provided.
    optional_fields = (
        ('protocol', protocol),
        ('timing', timing),
        ('remoteIPAddress', remote_ip),
    )
    for key, value in optional_fields:
        if value:
            response[key] = value

    params = {
        'requestId': request_id,
        'loaderId': 'loader-1',
        'timestamp': 12346.0,
        'type': 'Document',
        'response': response,
        'hasExtraInfo': True,
    }
    return {'method': NetworkEvent.RESPONSE_RECEIVED, 'params': params}


def _make_response_extra_info_event(request_id='req-1'):
    """Build a responseReceivedExtraInfo CDP event dict for ``request_id``."""
    extra_headers = {'Content-Type': 'text/html', 'Set-Cookie': 'id=val'}
    params = {
        'requestId': request_id,
        'headers': extra_headers,
        'blockedCookies': [],
        'resourceIPAddressSpace': 'Public',
        'statusCode': 200,
    }
    return {
        'method': NetworkEvent.RESPONSE_RECEIVED_EXTRA_INFO,
        'params': params,
    }


def _make_data_received_event(request_id='req-1', encoded_data_length=500):
    """Build a dataReceived CDP event dict.

    The same ``encoded_data_length`` value is used for both ``dataLength``
    and ``encodedDataLength``.
    """
    params = {
        'requestId': request_id,
        'timestamp': 12346.5,
        'dataLength': encoded_data_length,
        'encodedDataLength': encoded_data_length,
    }
    return {'method': NetworkEvent.DATA_RECEIVED, 'params': params}


def _make_loading_finished_event(request_id='req-1', encoded_data_length=1234):
    """Build a loadingFinished CDP event dict.

    ``encoded_data_length`` is converted to ``float`` before being stored.
    """
    params = {
        'requestId': request_id,
        'timestamp': 12347.0,
        'encodedDataLength': float(encoded_data_length),
    }
    return {'method': NetworkEvent.LOADING_FINISHED, 'params': params}


def _make_loading_failed_event(
    request_id='req-1', error_text='net::ERR_FAILED', canceled=False
):
    """Build a loadingFailed CDP event dict with the given error text and cancel flag."""
    params = {
        'requestId': request_id,
        'timestamp': 12347.0,
        'type': 'Document',
        'errorText': error_text,
        'canceled': canceled,
    }
    return {'method': NetworkEvent.LOADING_FAILED, 'params': params}


class TestHarRecorderStart:
    """Test HarRecorder.start()."""

    @pytest.mark.asyncio
    async def test_start_registers_seven_callbacks(self, recorder, mock_tab):
        """start() calls tab.on exactly seven times."""
        await recorder.start()
        registrations = mock_tab.on.call_count
        assert registrations == 7

    @pytest.mark.asyncio
    async def test_start_stores_callback_ids(self, recorder, mock_tab):
        """start() keeps one callback id per registration."""
        await recorder.start()
        stored_ids = recorder._callback_ids
        assert len(stored_ids) == 7

    @pytest.mark.asyncio
    async def test_start_enables_network_events_if_not_enabled(self, recorder, mock_tab):
        """With network events off, start() enables them and records that it did."""
        mock_tab.network_events_enabled = False

        await recorder.start()

        mock_tab.enable_network_events.assert_called_once()
        assert recorder._network_was_enabled is True

    @pytest.mark.asyncio
    async def test_start_skips_network_enable_if_already_enabled(self, recorder, mock_tab):
        """With network events already on, start() leaves them untouched."""
        mock_tab.network_events_enabled = True

        await recorder.start()

        mock_tab.enable_network_events.assert_not_called()
        assert recorder._network_was_enabled is False

    @pytest.mark.asyncio
    async def test_start_registers_correct_events(self, recorder, mock_tab):
        """start() subscribes to each of the seven expected network events."""
        await recorder.start()

        # The event name is the first positional argument of every tab.on call.
        subscribed = [call.args[0] for call in mock_tab.on.call_args_list]
        expected_events = (
            NetworkEvent.REQUEST_WILL_BE_SENT,
            NetworkEvent.REQUEST_WILL_BE_SENT_EXTRA_INFO,
            NetworkEvent.RESPONSE_RECEIVED,
            NetworkEvent.RESPONSE_RECEIVED_EXTRA_INFO,
            NetworkEvent.DATA_RECEIVED,
            NetworkEvent.LOADING_FINISHED,
            NetworkEvent.LOADING_FAILED,
        )
        for event_name in expected_events:
            assert event_name in subscribed

    @pytest.mark.asyncio
    async def test_start_sets_start_time(self, recorder, mock_tab):
        """_start_time is None before start() and populated afterwards."""
        assert recorder._start_time is None

        await recorder.start()

        assert recorder._start_time is not None


class TestHarRecorderStop:
    """Test HarRecorder.stop()."""

    @pytest.mark.asyncio
    async def test_stop_removes_all_callbacks(self, recorder, mock_tab):
        """stop() calls tab.remove_callback seven times after a start()."""
        await recorder.start()
        await recorder.stop()

        removals = mock_tab.remove_callback.call_count
        assert removals == 7

    @pytest.mark.asyncio
    async def test_stop_clears_callback_ids(self, recorder, mock_tab):
        """stop() leaves the stored callback id list empty."""
        await recorder.start()
        await recorder.stop()

        assert recorder._callback_ids == []

    @pytest.mark.asyncio
    async def test_stop_disables_network_events_if_we_enabled(self, recorder, mock_tab):
        """Network events that were off before start() are disabled again by stop()."""
        mock_tab.network_events_enabled = False

        await recorder.start()
        await recorder.stop()

        mock_tab.disable_network_events.assert_called_once()

    @pytest.mark.asyncio
    async def test_stop_does_not_disable_network_events_if_not_ours(self, recorder, mock_tab):
        """Network events that were already on before start() stay on after stop()."""
        mock_tab.network_events_enabled = True

        await recorder.start()
        await recorder.stop()

        mock_tab.disable_network_events.assert_not_called()

    @pytest.mark.asyncio
    async def test_stop_flushes_pending_entries(self, recorder, mock_tab):
        """A request still pending at stop() becomes an entry and leaves the pending map."""
        unfinished_request = {
            'url': 'https://example.com',
            'method': 'GET',
            'request_headers': {},
            'wall_time': 1700000000.0,
        }

        await recorder.start()
        recorder._pending['req-1'] = unfinished_request
        await recorder.stop()

        assert len(recorder._entries) == 1
        assert recorder._pending == {}


class TestHarRecorderEventHandlers:
    """Test individual event handler methods."""

    @pytest.mark.asyncio
    async def test_request_will_be_sent_creates_pending(self, recorder):
        """A requestWillBeSent event is tracked as pending under its request id."""
        recorder._on_request_will_be_sent(_make_request_will_be_sent_event())

        assert 'req-1' in recorder._pending
        tracked = recorder._pending['req-1']
        assert tracked['url'] == 'https://example.com'
        assert tracked['method'] == 'GET'

    @pytest.mark.asyncio
    async def test_request_extra_info_merges_headers(self, recorder):
        """Extra-info request headers are stored on the matching pending request."""
        recorder._on_request_will_be_sent(_make_request_will_be_sent_event())
        recorder._on_request_extra_info(_make_request_extra_info_event())

        tracked = recorder._pending['req-1']
        assert 'request_headers_extra' in tracked
        assert tracked['request_headers_extra']['Cookie'] == 'session=abc123'

    @pytest.mark.asyncio
    async def test_request_extra_info_skips_unknown_request(self, recorder):
        """Extra info for an untracked request id does not create a pending entry."""
        orphan_event = _make_request_extra_info_event('unknown-req')
        recorder._on_request_extra_info(orphan_event)

        assert 'unknown-req' not in recorder._pending

    @pytest.mark.asyncio
    async def test_response_received_stores_data(self, recorder):
        """Response metadata is copied onto the pending request."""
        recorder._on_request_will_be_sent(_make_request_will_be_sent_event())
        recorder._on_response_received(_make_response_received_event())

        tracked = recorder._pending['req-1']
        assert tracked['status'] == 200
        assert tracked['status_text'] == 'OK'
        assert tracked['mime_type'] == 'text/html'
        assert tracked['protocol'] == 'h2'
        assert tracked['remote_ip'] == '93.184.216.34'

    @pytest.mark.asyncio
    async def test_response_received_skips_unknown_request(self, recorder):
        """A response for an untracked request id does not create a pending entry."""
        orphan_event = _make_response_received_event('unknown-req')
        recorder._on_response_received(orphan_event)

        assert 'unknown-req' not in recorder._pending

    @pytest.mark.asyncio
    async def test_response_extra_info_merges_headers(self, recorder):
        """Extra-info response headers are stored on the matching pending request."""
        recorder._on_request_will_be_sent(_make_request_will_be_sent_event())
        recorder._on_response_extra_info(_make_response_extra_info_event())

        tracked = recorder._pending['req-1']
        assert 'response_headers_extra' in tracked

    @pytest.mark.asyncio
    async def test_loading_finished_creates_entry(self, recorder, mock_tab):
        """loadingFinished turns the pending request into a finished entry."""
        import asyncio

        recorder._on_request_will_be_sent(_make_request_will_be_sent_event())
        recorder._on_response_received(_make_response_received_event())
        recorder._on_loading_finished(_make_loading_finished_event())

        # Wait for the background task to complete
        background_tasks = recorder._body_tasks
        if background_tasks:
            await asyncio.gather(*background_tasks, return_exceptions=True)

        assert len(recorder._entries) == 1
        assert 'req-1' not in recorder._pending
        finished = recorder._entries[0]
        assert finished['request']['url'] == 'https://example.com'
        assert finished['response']['status'] == 200

    @pytest.mark.asyncio
    async def test_loading_finished_skips_unknown_request(self, recorder):
        """loadingFinished for an untracked request id produces no entry."""
        orphan_event = _make_loading_finished_event('unknown-req')
        recorder._on_loading_finished(orphan_event)

        assert len(recorder._entries) == 0

    @pytest.mark.asyncio
    async def test_loading_failed_creates_entry(self, recorder):
        """loadingFailed yields an entry with status 0 and the error text as status text."""
        recorder._on_request_will_be_sent(_make_request_will_be_sent_event())
        recorder._on_loading_failed(_make_loading_failed_event())

        assert len(recorder._entries) == 1
        assert 'req-1' not in recorder._pending
        failed_response = recorder._entries[0]['response']
        assert failed_response['status'] == 0
        assert failed_response['statusText'] == 'net::ERR_FAILED'

    @pytest.mark.asyncio
    async def test_loading_failed_skips_unknown_request(self, recorder):
        """loadingFailed for an untracked request id produces no entry."""
        orphan_event = _make_loading_failed_event('unknown-req')
        recorder._on_loading_failed(orphan_event)

        assert len(recorder._entries) == 0

    @pytest.mark.asyncio
    async def test_redirect_handling(self, recorder, mock_tab):
        """A redirect closes the original hop as an entry and keeps the id pending."""
        redirect_response = {
            'url': 'https://example.com',
            'status': 301,
            'statusText': 'Moved Permanently',
            'headers': {'Location': 'https://www.example.com'},
            'mimeType': 'text/html',
            'charset': 'utf-8',
            'connectionReused': False,
            'connectionId': 42,
            'encodedDataLength': 200,
            'securityState': 'secure',
        }

        # Initial request, then a second event for the same id carrying the 301.
        initial_hop = _make_request_will_be_sent_event(request_id='req-1')
        redirected_hop = _make_request_will_be_sent_event(
            request_id='req-1',
            url='https://www.example.com',
            redirect_response=redirect_response,
        )
        recorder._on_request_will_be_sent(initial_hop)
        recorder._on_request_will_be_sent(redirected_hop)

        # First entry is the redirect
        assert len(recorder._entries) == 1
        assert recorder._entries[0]['response']['status'] == 301

        # req-1 still pending for the final URL
        assert 'req-1' in recorder._pending
        assert recorder._pending['req-1']['url'] == 'https://www.example.com'


class TestHarRecorderHelpers:
    """Exercise HarRecorder's static conversion and timing helpers."""

    @staticmethod
    def _timing_with_connection():
        """Return a fresh timing payload that has DNS, connect and SSL phases."""
        return {
            'requestTime': 12345.0,
            'proxyStart': -1,
            'proxyEnd': -1,
            'dnsStart': 0.5,
            'dnsEnd': 5.0,
            'connectStart': 5.0,
            'connectEnd': 50.0,
            'sslStart': 10.0,
            'sslEnd': 45.0,
            'workerStart': -1,
            'workerReady': -1,
            'workerFetchStart': -1,
            'workerRespondWithSettled': -1,
            'sendStart': 50.0,
            'sendEnd': 51.0,
            'pushStart': 0,
            'pushEnd': 0,
            'receiveHeadersStart': 100.0,
            'receiveHeadersEnd': 105.0,
        }

    def test_headers_dict_to_list(self):
        """Each header becomes one ``{'name', 'value'}`` pair."""
        converted = HarRecorder._headers_dict_to_list(
            {'Content-Type': 'text/html', 'Accept': '*/*'}
        )
        assert len(converted) == 2
        for expected_pair in (
            {'name': 'Content-Type', 'value': 'text/html'},
            {'name': 'Accept', 'value': '*/*'},
        ):
            assert expected_pair in converted

    def test_headers_dict_to_list_empty(self):
        """An empty header mapping converts to an empty list."""
        assert HarRecorder._headers_dict_to_list({}) == []

    def test_parse_query_string(self):
        """Both query parameters are extracted from the URL."""
        params = HarRecorder._parse_query_string('https://example.com/search?q=test&page=1')
        assert len(params) == 2
        seen_names = [param['name'] for param in params]
        for wanted in ('q', 'page'):
            assert wanted in seen_names

    def test_parse_query_string_no_query(self):
        """A URL without a query string yields no parameters."""
        assert HarRecorder._parse_query_string('https://example.com') == []

    def test_parse_query_string_empty_values(self):
        """A parameter with a blank value is kept with an empty string value."""
        params = HarRecorder._parse_query_string('https://example.com?flag=')
        assert len(params) == 1
        only_param = params[0]
        assert only_param['name'] == 'flag'
        assert only_param['value'] == ''

    def test_wall_time_to_iso(self):
        """An epoch value is rendered as a UTC-marked ISO date string."""
        iso_text = HarRecorder._wall_time_to_iso(1700000000.0)
        assert '2023-11-14' in iso_text
        assert '+00:00' in iso_text or 'Z' in iso_text

    def test_wall_time_to_iso_zero(self):
        """A zero wall time still produces an ISO-looking timestamp."""
        iso_text = HarRecorder._wall_time_to_iso(0)
        # Should return current time ISO string
        assert 'T' in iso_text

    def test_build_har_timings_none(self):
        """Without timing data, connection phases are -1 and the rest are 0."""
        timings = HarRecorder._build_har_timings(None)
        for phase in ('blocked', 'dns', 'connect', 'ssl'):
            assert timings[phase] == -1
        for phase in ('send', 'wait', 'receive'):
            assert timings[phase] == 0

    def test_build_har_timings_with_data(self):
        """Phase durations are the differences between the start/end markers."""
        timings = HarRecorder._build_har_timings(self._timing_with_connection())
        expected_phases = {
            'dns': 4.5,
            'connect': 45.0,
            'ssl': 35.0,
            'send': 1.0,
            'wait': 49.0,
            # receive defaults to 0 when no receive_ms is provided
            'receive': 0,
        }
        for phase, expected in expected_phases.items():
            assert timings[phase] == expected

    def test_build_har_timings_with_receive_ms(self):
        """An explicit ``receive_ms`` is reported as the receive phase."""
        # Providing receive_ms overrides any header-based calculation
        timings = HarRecorder._build_har_timings(
            self._timing_with_connection(), receive_ms=250.5
        )
        assert timings['receive'] == 250.5
        assert timings['dns'] == 4.5
        assert timings['send'] == 1.0

    def test_build_har_timings_no_ssl(self):
        """Connection phases reported as -1 by the browser stay -1 in the HAR."""
        reused_connection_timing = {
            'requestTime': 12345.0,
            'proxyStart': -1,
            'proxyEnd': -1,
            'dnsStart': -1,
            'dnsEnd': -1,
            'connectStart': -1,
            'connectEnd': -1,
            'sslStart': -1,
            'sslEnd': -1,
            'workerStart': -1,
            'workerReady': -1,
            'workerFetchStart': -1,
            'workerRespondWithSettled': -1,
            'sendStart': 10.0,
            'sendEnd': 11.0,
            'pushStart': 0,
            'pushEnd': 0,
            'receiveHeadersStart': 50.0,
            'receiveHeadersEnd': 55.0,
        }
        timings = HarRecorder._build_har_timings(reused_connection_timing, receive_ms=500.0)
        expected_phases = {
            'dns': -1,
            'connect': -1,
            'ssl': -1,
            'send': 1.0,
            'wait': 39.0,
            'receive': 500.0,
        }
        for phase, expected in expected_phases.items():
            assert timings[phase] == expected


class TestHarRecorderBuildEntry:
    """Check how ``_build_entry`` maps pending request state to a HAR entry."""

    @pytest.mark.asyncio
    async def test_build_entry_basic(self, recorder):
        """Method, URL and status are carried over to the entry."""
        state = {
            'url': 'https://example.com',
            'method': 'GET',
            'request_headers': {'User-Agent': 'Test'},
            'wall_time': 1700000000.0,
            'status': 200,
            'status_text': 'OK',
            'response_headers': {'Content-Type': 'text/html'},
            'mime_type': 'text/html',
            'protocol': 'h2',
        }
        built = recorder._build_entry(state)
        har_request = built['request']
        assert har_request['method'] == 'GET'
        assert har_request['url'] == 'https://example.com'
        assert built['response']['status'] == 200

    @pytest.mark.asyncio
    async def test_build_entry_with_post_data(self, recorder):
        """Post data appears as ``postData`` and drives the request bodySize."""
        payload = '{"key": "value"}'
        state = {
            'url': 'https://example.com/api',
            'method': 'POST',
            'request_headers': {'Content-Type': 'application/json'},
            'post_data': payload,
            'wall_time': 1700000000.0,
            'status': 201,
            'status_text': 'Created',
            'response_headers': {},
            'mime_type': 'application/json',
            'protocol': 'h2',
        }
        har_request = recorder._build_entry(state)['request']
        assert 'postData' in har_request
        assert har_request['postData']['text'] == payload
        assert har_request['postData']['mimeType'] == 'application/json'
        assert har_request['bodySize'] == len(payload)

    @pytest.mark.asyncio
    async def test_build_entry_with_response_body(self, recorder):
        """A plain-text body is stored as-is, with no ``encoding`` key."""
        state = {
            'url': 'https://example.com',
            'method': 'GET',
            'request_headers': {},
            'wall_time': 1700000000.0,
            'status': 200,
            'status_text': 'OK',
            'response_headers': {},
            'mime_type': 'text/html',
            'protocol': 'h2',
            'response_body': '<html></html>',
            'response_body_base64': False,
        }
        content = recorder._build_entry(state)['response']['content']
        assert content['text'] == '<html></html>'
        assert 'encoding' not in content

    @pytest.mark.asyncio
    async def test_build_entry_with_base64_body(self, recorder):
        """A base64-flagged body is marked with ``encoding == 'base64'``."""
        state = {
            'url': 'https://example.com/image.png',
            'method': 'GET',
            'request_headers': {},
            'wall_time': 1700000000.0,
            'status': 200,
            'status_text': 'OK',
            'response_headers': {},
            'mime_type': 'image/png',
            'protocol': 'h2',
            'response_body': 'iVBORw0KGgo=',
            'response_body_base64': True,
        }
        content = recorder._build_entry(state)['response']['content']
        assert content['encoding'] == 'base64'

    @pytest.mark.asyncio
    async def test_build_entry_with_server_ip(self, recorder):
        """``remote_ip`` is exposed as the entry's ``serverIPAddress``."""
        server_ip = '93.184.216.34'
        state = {
            'url': 'https://example.com',
            'method': 'GET',
            'request_headers': {},
            'wall_time': 1700000000.0,
            'status': 200,
            'status_text': 'OK',
            'response_headers': {},
            'mime_type': 'text/html',
            'remote_ip': server_ip,
        }
        built = recorder._build_entry(state)
        assert built['serverIPAddress'] == server_ip

    @pytest.mark.asyncio
    async def test_build_entry_with_resource_type(self, recorder):
        """``resource_type`` is exposed as the custom ``_resourceType`` field."""
        state = {
            'url': 'https://example.com/style.css',
            'method': 'GET',
            'request_headers': {},
            'wall_time': 1700000000.0,
            'status': 200,
            'status_text': 'OK',
            'response_headers': {},
            'mime_type': 'text/css',
            'resource_type': 'Stylesheet',
        }
        built = recorder._build_entry(state)
        assert built['_resourceType'] == 'Stylesheet'

    @pytest.mark.asyncio
    async def test_build_entry_uses_extra_headers_when_available(self, recorder):
        """Headers only present in the ``*_extra`` maps show up in the entry."""
        state = {
            'url': 'https://example.com',
            'method': 'GET',
            'request_headers': {'User-Agent': 'original'},
            'request_headers_extra': {'User-Agent': 'actual', 'Cookie': 'x=1'},
            'response_headers': {'Content-Type': 'text/html'},
            'response_headers_extra': {'Content-Type': 'text/html', 'Set-Cookie': 'y=2'},
            'wall_time': 1700000000.0,
            'status': 200,
            'status_text': 'OK',
            'mime_type': 'text/html',
        }
        built = recorder._build_entry(state)

        sent_names = [header['name'] for header in built['request']['headers']]
        assert 'Cookie' in sent_names

        received_names = [header['name'] for header in built['response']['headers']]
        assert 'Set-Cookie' in received_names


class TestHarCapture:
    """Cover the user-facing HarCapture wrapper: entries, export and saving."""

    @staticmethod
    def _sample_entry(request, response):
        """Build a minimal entry dict with the given request/response parts."""
        return {
            'startedDateTime': '2023-01-01T00:00:00+00:00',
            'time': 100.0,
            'request': request,
            'response': response,
            'timings': {},
        }

    @pytest.mark.asyncio
    async def test_entries_returns_copy(self, recorder):
        """Mutating the list returned by ``entries`` must not affect the capture."""
        recorder._entries.append(self._sample_entry({}, {}))
        capture = HarCapture(recorder)

        snapshot = capture.entries
        assert len(snapshot) == 1
        snapshot.clear()
        # Original entries should not be affected
        assert len(capture.entries) == 1

    @pytest.mark.asyncio
    async def test_to_dict_structure(self, recorder):
        """The exported dict has the HAR 1.2 ``log`` skeleton."""
        log = HarCapture(recorder).to_dict()
        assert 'log' in log
        log = log['log']
        assert log['version'] == '1.2'
        assert log['creator']['name'] == 'pydoll'
        for list_field in ('pages', 'entries'):
            assert isinstance(log[list_field], list)

    @pytest.mark.asyncio
    async def test_to_dict_includes_entries(self, recorder):
        """Recorded entries are included in the exported dict."""
        recorder._entries.append(
            self._sample_entry(
                {'method': 'GET', 'url': 'https://example.com'},
                {'status': 200},
            )
        )
        exported = HarCapture(recorder).to_dict()
        assert len(exported['log']['entries']) == 1

    @pytest.mark.asyncio
    async def test_save_writes_json_file(self, recorder, tmp_path):
        """``save`` writes a JSON document that round-trips through ``json``."""
        recorder._entries.append(
            self._sample_entry(
                {'method': 'GET', 'url': 'https://example.com'},
                {'status': 200},
            )
        )
        target = tmp_path / 'test.har'
        HarCapture(recorder).save(target)

        assert target.exists()
        loaded = json.loads(target.read_text())
        assert loaded['log']['version'] == '1.2'
        assert len(loaded['log']['entries']) == 1

    @pytest.mark.asyncio
    async def test_save_with_string_path(self, recorder, tmp_path):
        """``save`` accepts a plain string path."""
        target = str(tmp_path / 'test.har')
        HarCapture(recorder).save(target)
        assert Path(target).exists()

    @pytest.mark.asyncio
    async def test_save_creates_parent_directories(self, recorder, tmp_path):
        """``save`` succeeds when the parent directories do not exist yet."""
        nested_target = tmp_path / 'sub' / 'dir' / 'test.har'
        HarCapture(recorder).save(nested_target)
        assert nested_target.exists()


class TestRequestRecord:
    """Cover the ``Request.record()`` async context manager."""

    # Number of tab callbacks these tests expect one recording session to
    # register on entry and remove on exit.
    _CALLBACK_COUNT = 7

    @pytest.mark.asyncio
    async def test_record_yields_har_recording(self, request_instance):
        """The context manager yields a HarCapture object."""
        async with request_instance.record() as capture:
            assert isinstance(capture, HarCapture)

    @pytest.mark.asyncio
    async def test_record_enables_network_events(self, request_instance, mock_tab):
        """Network events are enabled once when they were off beforehand."""
        mock_tab.network_events_enabled = False
        async with request_instance.record():
            pass
        mock_tab.enable_network_events.assert_called_once()

    @pytest.mark.asyncio
    async def test_record_registers_and_removes_callbacks(self, request_instance, mock_tab):
        """Callbacks are registered inside the block and removed after it."""
        async with request_instance.record():
            assert mock_tab.on.call_count == self._CALLBACK_COUNT
        assert mock_tab.remove_callback.call_count == self._CALLBACK_COUNT

    @pytest.mark.asyncio
    async def test_record_cleans_up_on_exception(self, request_instance, mock_tab):
        """An exception in the block propagates but callbacks are still removed."""
        with pytest.raises(ValueError, match='test error'):
            async with request_instance.record():
                raise ValueError('test error')
        # Cleanup should still happen
        assert mock_tab.remove_callback.call_count == self._CALLBACK_COUNT

    @pytest.mark.asyncio
    async def test_record_disables_network_events_if_enabled_by_recorder(
        self, request_instance, mock_tab
    ):
        """Network events the recorder turned on are turned off again on exit."""
        mock_tab.network_events_enabled = False
        async with request_instance.record():
            pass
        mock_tab.disable_network_events.assert_called_once()

    @pytest.mark.asyncio
    async def test_record_does_not_disable_network_events_if_already_enabled(
        self, request_instance, mock_tab
    ):
        """Network events that were already on are left on after recording."""
        mock_tab.network_events_enabled = True
        async with request_instance.record():
            pass
        mock_tab.disable_network_events.assert_not_called()


class TestResourceTypeFiltering:
    """Cover the ``resource_types`` filter applied by HarRecorder."""

    @staticmethod
    def _request_event(url, resource_type):
        """Build a requestWillBeSent-style event for request id ``req1``."""
        return {
            'params': {
                'requestId': 'req1',
                'request': {'url': url, 'method': 'GET', 'headers': {}},
                'wallTime': 1000.0,
                'timestamp': 100.0,
                'type': resource_type,
            }
        }

    @pytest.mark.asyncio
    async def test_filter_skips_non_matching_types(self, mock_tab):
        """A Document request is not tracked when only FETCH is allowed."""
        from pydoll.protocol.network.types import ResourceType

        fetch_only = HarRecorder(mock_tab, resource_types=[ResourceType.FETCH])
        await fetch_only.start()

        fetch_only._on_request_will_be_sent(
            self._request_event('https://example.com', 'Document')
        )
        assert 'req1' not in fetch_only._pending

    @pytest.mark.asyncio
    async def test_filter_accepts_matching_types(self, mock_tab):
        """A Fetch request is tracked when FETCH is allowed."""
        from pydoll.protocol.network.types import ResourceType

        fetch_only = HarRecorder(mock_tab, resource_types=[ResourceType.FETCH])
        await fetch_only.start()

        fetch_only._on_request_will_be_sent(
            self._request_event('https://example.com/api', 'Fetch')
        )
        assert 'req1' in fetch_only._pending

    @pytest.mark.asyncio
    async def test_no_filter_accepts_all(self, mock_tab):
        """Without a filter, a Document request is tracked."""
        unfiltered = HarRecorder(mock_tab)
        await unfiltered.start()

        unfiltered._on_request_will_be_sent(
            self._request_event('https://example.com', 'Document')
        )
        assert 'req1' in unfiltered._pending

    @pytest.mark.asyncio
    async def test_record_passes_resource_types(self, request_instance, mock_tab):
        """``record`` accepts ``resource_types`` and still yields a HarCapture."""
        from pydoll.protocol.network.types import ResourceType

        wanted_types = [ResourceType.XHR, ResourceType.FETCH]
        async with request_instance.record(resource_types=wanted_types) as capture:
            assert isinstance(capture, HarCapture)


class TestHarRecorderFetchResponseBody:
    """Cover ``_fetch_response_body`` for text, base64 and failing commands."""

    @pytest.mark.asyncio
    async def test_fetch_response_body_success(self, recorder, mock_tab):
        """A text body is returned together with a False base64 flag."""
        command_result = {'body': '<html>Hello</html>', 'base64Encoded': False}
        mock_tab._execute_command.return_value = {'result': command_result}

        text, encoded = await recorder._fetch_response_body('req-1')
        assert text == '<html>Hello</html>'
        assert encoded is False

    @pytest.mark.asyncio
    async def test_fetch_response_body_base64(self, recorder, mock_tab):
        """A base64 body is returned unchanged with a True base64 flag."""
        command_result = {'body': 'aW1hZ2VkYXRh', 'base64Encoded': True}
        mock_tab._execute_command.return_value = {'result': command_result}

        text, encoded = await recorder._fetch_response_body('req-1')
        assert text == 'aW1hZ2VkYXRh'
        assert encoded is True

    @pytest.mark.asyncio
    async def test_fetch_response_body_failure(self, recorder, mock_tab):
        """When the command raises, an empty non-base64 body is returned."""
        mock_tab._execute_command.side_effect = Exception('Network error')

        text, encoded = await recorder._fetch_response_body('req-1')
        assert text == ''
        assert encoded is False


class TestHarRecorderEndToEnd:
    """Drive the recorder through complete request lifecycles."""

    @pytest.mark.asyncio
    async def test_full_request_lifecycle(self, recorder, mock_tab):
        """One request going through every event yields one complete entry."""
        import asyncio

        mock_tab._execute_command.return_value = {
            'result': {'body': '<html>Test</html>', 'base64Encoded': False}
        }

        # Simulate a full request lifecycle
        recorder._on_request_will_be_sent(_make_request_will_be_sent_event())
        recorder._on_request_extra_info(_make_request_extra_info_event())
        recorder._on_response_received(_make_response_received_event())
        recorder._on_response_extra_info(_make_response_extra_info_event())
        recorder._on_loading_finished(_make_loading_finished_event())

        # Wait for async body fetch
        if recorder._body_tasks:
            await asyncio.gather(*recorder._body_tasks, return_exceptions=True)

        assert len(recorder._entries) == 1
        recorded = recorder._entries[0]
        har_request = recorded['request']
        har_response = recorded['response']
        assert har_request['method'] == 'GET'
        assert har_request['url'] == 'https://example.com'
        assert har_response['status'] == 200
        assert har_response['content']['text'] == '<html>Test</html>'
        assert recorded['_resourceType'] == 'Document'
        assert recorded['serverIPAddress'] == '93.184.216.34'
        # Extra headers should be preferred
        sent_headers = {header['name']: header['value'] for header in har_request['headers']}
        assert 'Cookie' in sent_headers

    @pytest.mark.asyncio
    async def test_multiple_concurrent_requests(self, recorder, mock_tab):
        """Two interleaved requests each end up as their own entry."""
        import asyncio

        mock_tab._execute_command.return_value = {
            'result': {'body': '', 'base64Encoded': False}
        }

        # Two concurrent requests, advanced through each stage in lockstep.
        in_flight = (
            ('req-1', 'https://example.com/a'),
            ('req-2', 'https://example.com/b'),
        )
        for request_id, url in in_flight:
            recorder._on_request_will_be_sent(_make_request_will_be_sent_event(request_id, url))
        for request_id, _ in in_flight:
            recorder._on_response_received(_make_response_received_event(request_id))
        for request_id, _ in in_flight:
            recorder._on_loading_finished(_make_loading_finished_event(request_id))

        if recorder._body_tasks:
            await asyncio.gather(*recorder._body_tasks, return_exceptions=True)

        assert len(recorder._entries) == 2
        recorded_urls = [item['request']['url'] for item in recorder._entries]
        assert 'https://example.com/a' in recorded_urls
        assert 'https://example.com/b' in recorded_urls


class TestHarRecorderCookieParsing:
    """Cover parsing of ``Cookie`` and ``Set-Cookie`` header values."""

    def test_parse_request_cookies(self):
        """Every ``name=value`` pair in a Cookie header becomes one cookie."""
        cookies = HarRecorder._parse_request_cookies(
            {'Cookie': 'session=abc123; user=john; theme=dark'}
        )
        assert len(cookies) == 3
        cookie_names = [cookie['name'] for cookie in cookies]
        for wanted in ('session', 'user', 'theme'):
            assert wanted in cookie_names

    def test_parse_request_cookies_empty(self):
        """No headers means no request cookies."""
        assert HarRecorder._parse_request_cookies({}) == []

    def test_parse_request_cookies_lowercase_header(self):
        """A lowercase ``cookie`` header name is parsed as well."""
        cookies = HarRecorder._parse_request_cookies({'cookie': 'token=xyz'})
        assert len(cookies) == 1
        assert cookies[0]['name'] == 'token'

    def test_parse_response_cookies(self):
        """Name, value, path and the HttpOnly/Secure flags are extracted."""
        cookies = HarRecorder._parse_response_cookies(
            {'Set-Cookie': 'id=val; Path=/; HttpOnly; Secure'}
        )
        assert len(cookies) == 1
        parsed = cookies[0]
        assert parsed['name'] == 'id'
        assert parsed['value'] == 'val'
        assert parsed.get('httpOnly') is True
        assert parsed.get('secure') is True
        assert parsed.get('path') == '/'

    def test_parse_response_cookies_multiple(self):
        """Newline-separated Set-Cookie values are parsed as separate cookies."""
        cookies = HarRecorder._parse_response_cookies(
            {'Set-Cookie': 'a=1; Path=/\nb=2; Domain=.example.com'}
        )
        assert len(cookies) == 2
        cookie_names = [cookie['name'] for cookie in cookies]
        for wanted in ('a', 'b'):
            assert wanted in cookie_names

    def test_parse_response_cookies_empty(self):
        """No headers means no response cookies."""
        assert HarRecorder._parse_response_cookies({}) == []

    def test_parse_response_cookies_with_domain(self):
        """Domain and Path attributes are exposed on the parsed cookie."""
        cookies = HarRecorder._parse_response_cookies(
            {'Set-Cookie': 'sess=abc; Domain=.example.com; Path=/api'}
        )
        assert len(cookies) == 1
        parsed = cookies[0]
        assert parsed.get('domain') == '.example.com'
        assert parsed.get('path') == '/api'


class TestHarRecorderBodySizes:
    """Cover the size fields produced by ``_build_entry``."""

    @pytest.mark.asyncio
    async def test_response_body_size_uses_data_received_bytes(self, recorder):
        """bodySize should come from dataReceived chunks, not transfer_size."""
        state = {
            'url': 'https://example.com',
            'method': 'GET',
            'request_headers': {},
            'wall_time': 1700000000.0,
            'status': 200,
            'status_text': 'OK',
            'response_headers': {},
            'mime_type': 'text/html',
            'response_body': '<html>Hello</html>',
            'response_body_base64': False,
            'body_bytes': 3200,
        }
        har_response = recorder._build_entry(state)['response']
        assert har_response['bodySize'] == 3200

    @pytest.mark.asyncio
    async def test_response_body_size_unknown_returns_negative_one(self, recorder):
        """bodySize should be -1 when no dataReceived data is available."""
        state = {
            'url': 'https://example.com',
            'method': 'GET',
            'request_headers': {},
            'wall_time': 1700000000.0,
            'status': 200,
            'status_text': 'OK',
            'response_headers': {},
            'mime_type': 'text/html',
        }
        har_response = recorder._build_entry(state)['response']
        assert har_response['bodySize'] == -1

    @pytest.mark.asyncio
    async def test_response_body_size_304_is_zero(self, recorder):
        """For 304 (cache hit), bodySize must be 0 per HAR spec."""
        state = {
            'url': 'https://example.com',
            'method': 'GET',
            'request_headers': {},
            'wall_time': 1700000000.0,
            'status': 304,
            'status_text': 'Not Modified',
            'response_headers': {},
            'mime_type': 'text/html',
            'body_bytes': 100,
        }
        har_response = recorder._build_entry(state)['response']
        assert har_response['bodySize'] == 0

    @pytest.mark.asyncio
    async def test_content_size_base64_decoded(self, recorder):
        """content.size for a base64 body is the length of the decoded bytes."""
        import base64

        raw_bytes = b'binary data here'
        state = {
            'url': 'https://example.com/img.png',
            'method': 'GET',
            'request_headers': {},
            'wall_time': 1700000000.0,
            'status': 200,
            'status_text': 'OK',
            'response_headers': {},
            'mime_type': 'image/png',
            'response_body': base64.b64encode(raw_bytes).decode(),
            'response_body_base64': True,
        }
        content = recorder._build_entry(state)['response']['content']
        assert content['size'] == len(raw_bytes)
        assert content['encoding'] == 'base64'

    @pytest.mark.asyncio
    async def test_request_body_size_bytes(self, recorder):
        """Request bodySize counts UTF-8 bytes rather than characters."""
        payload = '{"emoji": "\u2764"}'
        state = {
            'url': 'https://example.com/api',
            'method': 'POST',
            'request_headers': {'Content-Type': 'application/json'},
            'post_data': payload,
            'wall_time': 1700000000.0,
            'status': 200,
            'status_text': 'OK',
            'response_headers': {},
            'mime_type': 'application/json',
        }
        har_request = recorder._build_entry(state)['request']
        # UTF-8 encoded size, not len(str)
        utf8_length = len(payload.encode('utf-8'))
        assert har_request['bodySize'] == utf8_length


class TestHarRecorderCacheField:
    """Check that built entries carry a ``cache`` field."""

    @pytest.mark.asyncio
    async def test_entry_has_cache_field(self, recorder):
        """A built entry has a ``cache`` key holding an empty dict."""
        state = {
            'url': 'https://example.com',
            'method': 'GET',
            'request_headers': {},
            'wall_time': 1700000000.0,
            'status': 200,
            'status_text': 'OK',
            'response_headers': {},
            'mime_type': 'text/html',
        }
        built = recorder._build_entry(state)
        assert 'cache' in built
        assert built['cache'] == {}


class TestHarRecorderCookiesInEntries:
    """Check that entry cookie lists are derived from the recorded headers."""

    @pytest.mark.asyncio
    async def test_request_cookies_from_cookie_header(self, recorder):
        """Cookies in the request ``Cookie`` header appear in request.cookies."""
        state = {
            'url': 'https://example.com',
            'method': 'GET',
            'request_headers': {'Cookie': 'session=abc; user=john'},
            'wall_time': 1700000000.0,
            'status': 200,
            'status_text': 'OK',
            'response_headers': {},
            'mime_type': 'text/html',
        }
        sent_cookies = recorder._build_entry(state)['request']['cookies']
        assert len(sent_cookies) == 2
        cookie_names = [cookie['name'] for cookie in sent_cookies]
        for wanted in ('session', 'user'):
            assert wanted in cookie_names

    @pytest.mark.asyncio
    async def test_response_cookies_from_set_cookie(self, recorder):
        """A ``Set-Cookie`` response header appears in response.cookies."""
        state = {
            'url': 'https://example.com',
            'method': 'GET',
            'request_headers': {},
            'wall_time': 1700000000.0,
            'status': 200,
            'status_text': 'OK',
            'response_headers': {'Set-Cookie': 'id=val; HttpOnly'},
            'mime_type': 'text/html',
        }
        set_cookies = recorder._build_entry(state)['response']['cookies']
        assert len(set_cookies) == 1
        first_cookie = set_cookies[0]
        assert first_cookie['name'] == 'id'
        assert first_cookie.get('httpOnly') is True


class TestHarRecorderDataReceived:
    """Cover Network.dataReceived bookkeeping used for response bodySize."""

    def test_data_received_accumulates_bytes(self, recorder):
        """Chunks for the same request id are summed."""
        for chunk_size in (500, 300):
            recorder._on_data_received(_make_data_received_event('req-1', chunk_size))
        assert recorder._data_received_sizes['req-1'] == 800

    def test_data_received_separate_requests(self, recorder):
        """Chunks for different request ids are tracked independently."""
        chunks_by_request = (('req-1', 500), ('req-2', 700))
        for request_id, chunk_size in chunks_by_request:
            recorder._on_data_received(_make_data_received_event(request_id, chunk_size))
        for request_id, chunk_size in chunks_by_request:
            assert recorder._data_received_sizes[request_id] == chunk_size

    @pytest.mark.asyncio
    async def test_loading_finished_consumes_data_received(self, recorder, mock_tab):
        """loadingFinished drops the byte counter and uses it as bodySize."""
        import asyncio

        recorder._on_request_will_be_sent(_make_request_will_be_sent_event())
        recorder._on_response_received(_make_response_received_event())
        for chunk_size in (1000, 500):
            recorder._on_data_received(_make_data_received_event('req-1', chunk_size))
        recorder._on_loading_finished(_make_loading_finished_event())

        # Let any scheduled body-fetch tasks complete before inspecting entries.
        if recorder._body_tasks:
            await asyncio.gather(*recorder._body_tasks, return_exceptions=True)

        assert 'req-1' not in recorder._data_received_sizes
        assert len(recorder._entries) == 1
        assert recorder._entries[0]['response']['bodySize'] == 1500

    def test_loading_failed_cleans_up_data_received(self, recorder):
        """loadingFailed also drops the byte counter for the request."""
        recorder._on_request_will_be_sent(_make_request_will_be_sent_event())
        recorder._on_data_received(_make_data_received_event('req-1', 200))
        recorder._on_loading_failed(_make_loading_failed_event())
        assert 'req-1' not in recorder._data_received_sizes


class TestHarRecorderExtraStatusCode:
    """Test that responseReceivedExtraInfo statusCode overrides responseReceived status."""

    @pytest.mark.asyncio
    async def test_extra_status_code_overrides_response_status(self, recorder, mock_tab):
        """For cached requests, extraInfo statusCode (304) should win over responseReceived (200)."""
        import asyncio

        recorder._on_request_will_be_sent(_make_request_will_be_sent_event())
        recorder._on_response_received(_make_response_received_event(status=200))

        # extraInfo says the real status is 304
        extra_params = {
            'requestId': 'req-1',
            'headers': {'Content-Type': 'text/html'},
            'blockedCookies': [],
            'resourceIPAddressSpace': 'Public',
            'statusCode': 304,
        }
        recorder._on_response_extra_info(
            {
                'method': NetworkEvent.RESPONSE_RECEIVED_EXTRA_INFO,
                'params': extra_params,
            }
        )
        recorder._on_loading_finished(_make_loading_finished_event())

        if recorder._body_tasks:
            await asyncio.gather(*recorder._body_tasks, return_exceptions=True)

        assert len(recorder._entries) == 1
        har_response = recorder._entries[0]['response']
        assert har_response['status'] == 304
        assert har_response['bodySize'] == 0

    @pytest.mark.asyncio
    async def test_normal_status_when_no_extra(self, recorder, mock_tab):
        """Without an extraInfo event, the responseReceived status is kept."""
        import asyncio

        recorder._on_request_will_be_sent(_make_request_will_be_sent_event())
        recorder._on_response_received(_make_response_received_event(status=200))
        recorder._on_loading_finished(_make_loading_finished_event())

        if recorder._body_tasks:
            await asyncio.gather(*recorder._body_tasks, return_exceptions=True)

        har_response = recorder._entries[0]['response']
        assert har_response['status'] == 200


class TestHarRecorderReceiveTiming:
    """Checks on how the 'receive' timing of an entry is derived."""

    @pytest.mark.asyncio
    async def test_receive_from_monotonic_timestamps(self, recorder, mock_tab):
        """receive = (loadingFinished.timestamp - responseReceived.timestamp) * 1000."""
        import asyncio

        recorder._on_request_will_be_sent(_make_request_will_be_sent_event())
        # The response helper is expected to supply timestamp=12346.0 ...
        recorder._on_response_received(_make_response_received_event())
        # ... and the loading-finished helper timestamp=12347.0.
        recorder._on_loading_finished(_make_loading_finished_event())

        outstanding = recorder._body_tasks
        if outstanding:
            await asyncio.gather(*outstanding, return_exceptions=True)

        # One second between the two timestamps -> 1000 ms.
        receive_ms = recorder._entries[0]['timings']['receive']
        assert receive_ms == 1000.0

    def test_receive_fallback_zero_without_timestamps(self, recorder):
        """With no response/finished timestamps in the pending data, receive is 0."""
        pending = dict(
            url='https://example.com',
            method='GET',
            request_headers={},
            wall_time=1700000000.0,
            status=200,
            status_text='OK',
            response_headers={},
            mime_type='text/html',
        )

        built = recorder._build_entry(pending)

        assert built['timings']['receive'] == 0


class TestHarRecorderEntryTimeSslExclusion:
    """Test that entry.time excludes ssl from sum (connect includes it)."""

    def test_entry_time_excludes_ssl(self, recorder):
        """entry['time'] equals the sum of the phases without adding ssl a second time."""
        timing = {
            'requestTime': 12345.0,
            'proxyStart': -1,
            'proxyEnd': -1,
            'dnsStart': 0.5,
            'dnsEnd': 5.0,
            'connectStart': 5.0,
            'connectEnd': 50.0,
            'sslStart': 10.0,
            'sslEnd': 45.0,
            'workerStart': -1,
            'workerReady': -1,
            'workerFetchStart': -1,
            'workerRespondWithSettled': -1,
            'sendStart': 50.0,
            'sendEnd': 51.0,
            'pushStart': 0,
            'pushEnd': 0,
            'receiveHeadersStart': 100.0,
            'receiveHeadersEnd': 105.0,
        }
        pending = {
            'url': 'https://example.com',
            'method': 'GET',
            'request_headers': {},
            'wall_time': 1700000000.0,
            'status': 200,
            'status_text': 'OK',
            'response_headers': {},
            'mime_type': 'text/html',
            'timing': timing,
            'response_timestamp': 12346.0,
            'finished_timestamp': 12346.5,
        }
        entry = recorder._build_entry(pending)
        timings = entry['timings']
        # ssl=35.0, connect=45.0 (connect includes ssl time)
        # entry.time should NOT include ssl separately
        expected = (
            timings['blocked']
            + timings['dns']
            + timings['connect']
            + timings['send']
            + timings['wait']
            + timings['receive']
        )
        assert entry['time'] == round(expected, 2)
        # Verify ssl is NOT counted in total: the ssl phase is non-zero, so a
        # total that added it on top of connect would differ from entry['time'].
        assert timings['ssl'] == 35.0
        assert entry['time'] != round(expected + timings['ssl'], 2)


class TestHarRecorderEntryOrdering:
    """Entries exposed by a capture come back ordered by startedDateTime."""

    @pytest.mark.asyncio
    async def test_entries_sorted_by_started_date_time(self, recorder):
        """Entries appended out of order are returned earliest-first."""

        def _entry(started, elapsed, url):
            # Minimal entry dict carrying only the fields this test populates.
            return {
                'startedDateTime': started,
                'time': elapsed,
                'request': {'method': 'GET', 'url': url},
                'response': {'status': 200},
                'cache': {},
                'timings': {},
            }

        earlier_url = 'https://example.com/first'
        later_url = 'https://example.com/second'

        # Deliberately append the later request before the earlier one.
        recorder._entries.append(_entry('2023-11-14T12:00:02+00:00', 100.0, later_url))
        recorder._entries.append(_entry('2023-11-14T12:00:01+00:00', 50.0, earlier_url))
        capture = HarCapture(recorder)

        # The entries property must be sorted.
        via_property = capture.entries
        assert via_property[0]['request']['url'] == earlier_url
        assert via_property[1]['request']['url'] == later_url

        # The serialized HAR must be sorted as well.
        via_dict = capture.to_dict()['log']['entries']
        assert via_dict[0]['request']['url'] == earlier_url
        assert via_dict[1]['request']['url'] == later_url


class TestHarRecorderBodySizeFallback:
    """Test bodySize fallback to content_size when body_bytes is 0.

    These tests only call ``recorder._build_entry`` and never await anything,
    so they are plain synchronous tests rather than asyncio-marked coroutines.
    """

    def test_body_size_falls_back_to_content_size(self, recorder):
        """When body_bytes=0 but content exists (e.g. file://), use content_size."""
        body = '<html>Hello World</html>'
        pending = {
            'url': 'file:///page.html',
            'method': 'GET',
            'request_headers': {},
            'wall_time': 1700000000.0,
            'status': 200,
            'status_text': 'OK',
            'response_headers': {},
            'mime_type': 'text/html',
            'response_body': body,
            'response_body_base64': False,
            'body_bytes': 0,
        }
        entry = recorder._build_entry(pending)
        # Size is measured on the UTF-8 encoded body, not on the character count.
        expected_size = len(body.encode('utf-8'))
        assert entry['response']['bodySize'] == expected_size
        assert entry['response']['content']['size'] == expected_size

    def test_body_size_negative_one_when_no_body_and_no_bytes(self, recorder):
        """When body_bytes=-1 and no content, bodySize should be -1."""
        pending = {
            'url': 'https://example.com',
            'method': 'GET',
            'request_headers': {},
            'wall_time': 1700000000.0,
            'status': 200,
            'status_text': 'OK',
            'response_headers': {},
            'mime_type': 'text/html',
            'body_bytes': -1,
        }
        entry = recorder._build_entry(pending)
        assert entry['response']['bodySize'] == -1


class TestHarRecorderHttpVersionNormalization:
    """Expected outputs of HarRecorder._normalize_http_version for various protocols."""

    def test_h2_stays_lowercase(self):
        """'h2' is returned unchanged."""
        normalized = HarRecorder._normalize_http_version('h2')
        assert normalized == 'h2'

    def test_h3_stays_lowercase(self):
        """'h3' is returned unchanged."""
        normalized = HarRecorder._normalize_http_version('h3')
        assert normalized == 'h3'

    def test_http_1_1_uppercased(self):
        """'http/1.1' becomes 'HTTP/1.1'."""
        normalized = HarRecorder._normalize_http_version('http/1.1')
        assert normalized == 'HTTP/1.1'

    def test_http_1_0_uppercased(self):
        """'http/1.0' becomes 'HTTP/1.0'."""
        normalized = HarRecorder._normalize_http_version('http/1.0')
        assert normalized == 'HTTP/1.0'

    def test_already_uppercase(self):
        """An already upper-case 'HTTP/1.1' is returned as is."""
        normalized = HarRecorder._normalize_http_version('HTTP/1.1')
        assert normalized == 'HTTP/1.1'

    def test_file_protocol_returns_empty(self):
        """'file' maps to the empty string."""
        normalized = HarRecorder._normalize_http_version('file')
        assert normalized == ''

    def test_empty_string(self):
        """The empty string maps to the empty string."""
        normalized = HarRecorder._normalize_http_version('')
        assert normalized == ''

    def test_unknown_protocol_returns_empty(self):
        """An unrecognised protocol such as 'blob' maps to the empty string."""
        normalized = HarRecorder._normalize_http_version('blob')
        assert normalized == ''

    def test_entry_uses_normalized_version(self, recorder):
        """Both request and response httpVersion of a built entry are normalized."""
        pending = dict(
            url='https://example.com',
            method='GET',
            request_headers={},
            wall_time=1700000000.0,
            status=200,
            status_text='OK',
            response_headers={},
            mime_type='text/html',
            protocol='http/1.1',
        )

        built = recorder._build_entry(pending)

        for side in ('request', 'response'):
            assert built[side]['httpVersion'] == 'HTTP/1.1'


================================================
FILE: tests/test_browser/test_requests_request.py
================================================
"""
Tests for pydoll.browser.requests.request module.
"""

import json
import pytest
import pytest_asyncio
from unittest.mock import AsyncMock, Mock, patch
from urllib.parse import urlencode

from pydoll.browser.requests.request import Request
from pydoll.browser.requests.response import Response
from pydoll.exceptions import HTTPError
from pydoll.protocol.fetch.types import HeaderEntry
from pydoll.protocol.network.events import NetworkEvent
from pydoll.protocol.network.types import CookieParam


@pytest_asyncio.fixture
async def mock_tab():
    """Create a Mock tab whose event and command hooks are AsyncMock instances."""
    fake_tab = Mock()

    def _registration_count(*_args, **_kwargs):
        # Value handed back by on(): the number of on() calls recorded so far.
        return len(fake_tab.on.call_args_list)

    fake_tab.network_events_enabled = False
    awaitable_hooks = (
        'enable_network_events',
        'disable_network_events',
        'remove_callback',
        '_execute_command',
    )
    for hook_name in awaitable_hooks:
        setattr(fake_tab, hook_name, AsyncMock())
    fake_tab.on = AsyncMock(side_effect=_registration_count)
    return fake_tab


@pytest_asyncio.fixture
async def request_instance(mock_tab):
    """Provide a Request built on top of the mocked tab fixture."""
    instance = Request(mock_tab)
    return instance


class TestRequestInitialization:
    """State of a freshly constructed Request."""

    def test_request_initialization(self, mock_tab):
        """A new Request stores the tab and starts with no recorded network activity."""
        created = Request(mock_tab)

        assert created.tab == mock_tab
        assert created._network_events_enabled is False
        # Both event buffers start out as empty lists.
        assert created._requests_sent == []
        assert created._requests_received == []

    def test_request_initialization_preserves_tab_reference(self, mock_tab):
        """The stored tab is the very object passed in, not a copy."""
        created = Request(mock_tab)

        assert created.tab is mock_tab


class TestRequestMethods:
    """Each HTTP verb helper must delegate to Request.request with the right arguments."""

    @pytest.mark.asyncio
    async def test_get_method(self, request_instance):
        """get() forwards 'GET', the URL and the params keyword."""
        endpoint = 'https://example.com'
        with patch.object(
            request_instance, 'request', new_callable=AsyncMock, return_value=Mock()
        ) as request_spy:
            await request_instance.get(endpoint, params={'q': 'test'})

            request_spy.assert_called_once_with('GET', endpoint, params={'q': 'test'})

    @pytest.mark.asyncio
    async def test_post_method(self, request_instance):
        """post() forwards 'POST', the URL and both data and json keywords."""
        endpoint = 'https://example.com'
        with patch.object(
            request_instance, 'request', new_callable=AsyncMock, return_value=Mock()
        ) as request_spy:
            await request_instance.post(
                endpoint,
                data={'key': 'value'},
                json={'json_key': 'json_value'},
            )

            request_spy.assert_called_once_with(
                'POST',
                endpoint,
                data={'key': 'value'},
                json={'json_key': 'json_value'},
            )

    @pytest.mark.asyncio
    async def test_put_method(self, request_instance):
        """put() forwards 'PUT' with data defaulting to None when only json is given."""
        endpoint = 'https://example.com'
        with patch.object(
            request_instance, 'request', new_callable=AsyncMock, return_value=Mock()
        ) as request_spy:
            await request_instance.put(endpoint, json={'update': 'data'})

            request_spy.assert_called_once_with(
                'PUT', endpoint, data=None, json={'update': 'data'}
            )

    @pytest.mark.asyncio
    async def test_patch_method(self, request_instance):
        """patch() forwards 'PATCH' with json defaulting to None when only data is given."""
        endpoint = 'https://example.com'
        with patch.object(
            request_instance, 'request', new_callable=AsyncMock, return_value=Mock()
        ) as request_spy:
            await request_instance.patch(endpoint, data='patch_data')

            request_spy.assert_called_once_with(
                'PATCH', endpoint, data='patch_data', json=None
            )

    @pytest.mark.asyncio
    async def test_delete_method(self, request_instance):
        """delete() forwards just 'DELETE' and the URL."""
        endpoint = 'https://example.com'
        with patch.object(
            request_instance, 'request', new_callable=AsyncMock, return_value=Mock()
        ) as request_spy:
            await request_instance.delete(endpoint)

            request_spy.assert_called_once_with('DELETE', endpoint)

    @pytest.mark.asyncio
    async def test_head_method(self, request_instance):
        """head() forwards just 'HEAD' and the URL."""
        endpoint = 'https://example.com'
        with patch.object(
            request_instance, 'request', new_callable=AsyncMock, return_value=Mock()
        ) as request_spy:
            await request_instance.head(endpoint)

            request_spy.assert_called_once_with('HEAD', endpoint)

    @pytest.mark.asyncio
    async def test_options_method(self, request_instance):
        """options() forwards just 'OPTIONS' and the URL."""
        endpoint = 'https://example.com'
        with patch.object(
            request_instance, 'request', new_callable=AsyncMock, return_value=Mock()
        ) as request_spy:
            await request_instance.options(endpoint)

            request_spy.assert_called_once_with('OPTIONS', endpoint)


class TestRequestMainMethod:
    """Behaviour of Request.request() with its collaborators mocked out."""

    @pytest.mark.asyncio
    async def test_request_success_flow(self, request_instance, mock_tab):
        """A well-formed command result is turned into a populated Response."""
        fetch_value = {
            'status': 200,
            'content': [72, 101, 108, 108, 111],  # "Hello" as bytes
            'text': 'Hello',
            'json': {'message': 'success'},
            'url': 'https://example.com'
        }
        # The tab's command result nests the payload under result -> result -> value.
        mock_tab._execute_command.return_value = {'result': {'result': {'value': fetch_value}}}

        received_headers = [HeaderEntry(name='Content-Type', value='application/json')]
        sent_headers = [HeaderEntry(name='User-Agent', value='Test-Agent')]
        set_cookies = [CookieParam(name='session', value='abc123')]

        with patch.object(
                 request_instance, '_extract_received_headers', return_value=received_headers
             ), \
             patch.object(
                 request_instance, '_extract_sent_headers', return_value=sent_headers
             ), \
             patch.object(
                 request_instance, '_extract_set_cookies', return_value=set_cookies
             ):
            outcome = await request_instance.request('GET', 'https://example.com')

            assert isinstance(outcome, Response)
            assert outcome.status_code == 200
            assert outcome.text == 'Hello'
            assert outcome.json() == {'message': 'success'}
            assert outcome.url == 'https://example.com'

    @pytest.mark.asyncio
    async def test_request_with_params(self, request_instance):
        """Query params are handed to _build_url_with_params together with the URL."""
        empty_result = {'result': {'result': {'value': {}}}}

        with patch.object(
                 request_instance, '_build_url_with_params',
                 return_value='https://example.com?q=test',
             ) as url_builder, \
             patch.object(request_instance, '_execute_fetch_request', return_value=empty_result), \
             patch.object(request_instance, '_extract_received_headers', return_value=[]), \
             patch.object(request_instance, '_extract_sent_headers', return_value=[]), \
             patch.object(request_instance, '_extract_set_cookies', return_value=[]), \
             patch.object(request_instance, '_build_response', return_value=Mock()), \
             patch.object(request_instance, '_clear_callbacks'):
            await request_instance.request('GET', 'https://example.com', params={'q': 'test'})

            url_builder.assert_called_once_with('https://example.com', {'q': 'test'})

    @pytest.mark.asyncio
    async def test_request_with_json_data(self, request_instance):
        """A json payload is passed to _build_request_options in the third position."""
        empty_result = {'result': {'result': {'value': {}}}}
        json_data = {'key': 'value'}

        with patch.object(request_instance, '_build_request_options') as options_builder, \
             patch.object(request_instance, '_execute_fetch_request', return_value=empty_result), \
             patch.object(request_instance, '_extract_received_headers', return_value=[]), \
             patch.object(request_instance, '_extract_sent_headers', return_value=[]), \
             patch.object(request_instance, '_extract_set_cookies', return_value=[]), \
             patch.object(request_instance, '_build_response', return_value=Mock()), \
             patch.object(request_instance, '_clear_callbacks'):
            await request_instance.request('POST', 'https://example.com', json=json_data)

            options_builder.assert_called_once_with(
                'POST', None, json_data, None
            )

    @pytest.mark.asyncio
    async def test_request_failure_raises_http_error(self, request_instance, mock_tab):
        """An exception from the tab command surfaces as HTTPError with a prefixed message."""
        mock_tab._execute_command.side_effect = Exception("Network error")

        with pytest.raises(HTTPError, match="Request failed: Network error"):
            await request_instance.request('GET', 'https://example.com')

    @pytest.mark.asyncio
    async def test_request_always_clears_callbacks(self, request_instance, mock_tab):
        """_clear_callbacks runs exactly once even when the request fails."""
        mock_tab._execute_command.side_effect = Exception("Network error")

        with patch.object(request_instance, '_clear_callbacks') as cleanup_spy:
            with pytest.raises(HTTPError):
                await request_instance.request('GET', 'https://example.com')

            cleanup_spy.assert_called_once()


class TestRequestHelperMethods:
    """Unit tests for the private helpers Request uses to assemble a fetch call."""

    def test_build_url_with_params_no_params(self, request_instance):
        """With params=None the URL comes back untouched."""
        base = 'https://example.com'

        assert request_instance._build_url_with_params(base, None) == base

    def test_build_url_with_params_simple(self, request_instance):
        """Each parameter shows up as key=value after a '?'."""
        built = request_instance._build_url_with_params(
            'https://example.com', {'q': 'test', 'page': '1'}
        )

        for fragment in ('https://example.com?', 'q=test', 'page=1'):
            assert fragment in built

    def test_build_url_with_params_existing_query(self, request_instance):
        """Parameters already in the URL are kept next to the new ones."""
        built = request_instance._build_url_with_params(
            'https://example.com?existing=param', {'new': 'value'}
        )

        for fragment in ('existing=param', 'new=value'):
            assert fragment in built

    def test_build_request_options_basic(self, request_instance):
        """With no headers or body the options carry the method and empty headers."""
        built = request_instance._build_request_options(
            'GET', None, None, None
        )

        assert built['method'] == 'GET'
        assert built['headers'] == {}

    def test_build_request_options_with_headers(self, request_instance):
        """Header entries are converted through _convert_header_entries_to_dict."""
        headers = [HeaderEntry(name='Authorization', value='Bearer token')]

        with patch.object(
            request_instance,
            '_convert_header_entries_to_dict',
            return_value={'Authorization': 'Bearer token'},
        ) as converter:
            built = request_instance._build_request_options(
                'POST', headers, None, None
            )

            assert built['headers'] == {'Authorization': 'Bearer token'}
            converter.assert_called_once_with(headers)

    def test_handle_json_options(self, request_instance):
        """JSON payloads are serialized into the body and tagged application/json."""
        json_data = {'key': 'value'}
        options = {'headers': {}}

        request_instance._handle_json_options(options, json_data)

        assert options['body'] == json.dumps(json_data)
        assert options['headers']['Content-Type'] == 'application/json'

    def test_handle_data_options_form_data(self, request_instance):
        """Dict data is url-encoded and tagged as a form submission."""
        data = {'key': 'value', 'key2': 'value2'}
        options = {'headers': {}}

        request_instance._handle_data_options(options, data)

        assert options['body'] == urlencode(data, doseq=True)
        assert options['headers']['Content-Type'] == 'application/x-www-form-urlencoded'

    def test_handle_data_options_raw_data(self, request_instance):
        """String data is used as the body verbatim and no Content-Type is added."""
        data = 'raw string data'
        options = {'headers': {}}

        request_instance._handle_data_options(options, data)

        assert options['body'] == data
        assert 'Content-Type' not in options['headers']

    def test_convert_header_entries_to_dict(self, request_instance):
        """A list of name/value entries collapses into a name -> value mapping."""
        entries = [
            HeaderEntry(name='Content-Type', value='application/json'),
            HeaderEntry(name='Authorization', value='Bearer token')
        ]

        converted = request_instance._convert_header_entries_to_dict(entries)

        assert converted == {
            'Content-Type': 'application/json',
            'Authorization': 'Bearer token'
        }

    def test_convert_dict_to_header_entries(self, request_instance):
        """A mapping expands into one name/value entry per header."""
        headers_dict = {
            'Content-Type': 'application/json',
            'Authorization': 'Bearer token'
        }

        entries = request_instance._convert_dict_to_header_entries(headers_dict)

        assert len(entries) == 2
        # Every entry must expose both expected keys.
        assert all('name' in entry and 'value' in entry for entry in entries)
        round_tripped = {entry['name']: entry['value'] for entry in entries}
        assert round_tripped == headers_dict


class TestRequestCallbackManagement:
    """Registration and teardown of the network-event callbacks used by Request."""

    @pytest.mark.asyncio
    async def test_register_callbacks_enables_network_events(self, request_instance, mock_tab):
        """If the tab has network events off, registering turns them on and records it."""
        mock_tab.network_events_enabled = False

        await request_instance._register_callbacks()

        mock_tab.enable_network_events.assert_called_once()
        assert request_instance._network_events_enabled is True

    @pytest.mark.asyncio
    async def test_register_callbacks_skips_if_already_enabled(self, request_instance, mock_tab):
        """If the tab already has network events on, registering does not enable them again."""
        mock_tab.network_events_enabled = True

        await request_instance._register_callbacks()

        mock_tab.enable_network_events.assert_not_called()
        assert request_instance._network_events_enabled is False

    @pytest.mark.asyncio
    async def test_register_callbacks_subscribes_to_events(self, request_instance, mock_tab):
        """Exactly the four request/response events are subscribed through tab.on()."""
        wanted = [
            NetworkEvent.REQUEST_WILL_BE_SENT,
            NetworkEvent.REQUEST_WILL_BE_SENT_EXTRA_INFO,
            NetworkEvent.RESPONSE_RECEIVED,
            NetworkEvent.RESPONSE_RECEIVED_EXTRA_INFO
        ]

        await request_instance._register_callbacks()

        assert mock_tab.on.call_count == len(wanted)
        # First positional argument of each on() call is the event name.
        subscribed = [recorded.args[0] for recorded in mock_tab.on.call_args_list]
        assert all(event in subscribed for event in wanted)

    @pytest.mark.asyncio
    async def test_clear_callbacks_disables_network_events(self, request_instance, mock_tab):
        """Clearing removes every callback and disables events the request had enabled."""
        request_instance._callback_ids = [10, 11, 12, 13]
        request_instance._network_events_enabled = True

        await request_instance._clear_callbacks()

        mock_tab.disable_network_events.assert_called_once()
        assert mock_tab.remove_callback.call_count == 4
        assert request_instance._network_events_enabled is False
        assert request_instance._callback_ids == []

    @pytest.mark.asyncio
    async def test_clear_callbacks_skips_disable_if_not_enabled(self, request_instance, mock_tab):
        """Clearing still removes callbacks but leaves events alone if the request never enabled them."""
        request_instance._callback_ids = [10, 11]
        request_instance._network_events_enabled = False

        await request_instance._clear_callbacks()

        mock_tab.disable_network_events.assert_not_called()
        assert mock_tab.remove_callback.call_count == 2
        assert request_instance._callback_ids == []


class TestRequestCookieExtraction:
    """Parsing of Set-Cookie data and de-duplication of the resulting cookies."""

    def test_parse_cookie_line_valid(self, request_instance):
        """The leading name=value pair is extracted; trailing attributes do not block parsing."""
        parsed = request_instance._parse_cookie_line('session_id=abc123; Path=/; HttpOnly')

        assert parsed is not None
        assert parsed['name'] == 'session_id'
        assert parsed['value'] == 'abc123'

    def test_parse_cookie_line_invalid(self, request_instance):
        """A line with no '=' yields None."""
        parsed = request_instance._parse_cookie_line('invalid_cookie_without_equals')

        assert parsed is None

    def test_parse_cookie_line_with_complex_value(self, request_instance):
        """Only the first '=' splits name from value; later ones stay in the value."""
        parsed = request_instance._parse_cookie_line('complex=value=with=equals; Secure')

        assert parsed is not None
        assert parsed['name'] == 'complex'
        assert parsed['value'] == 'value=with=equals'

    def test_add_unique_cookies_no_duplicates(self, request_instance):
        """Merging skips a cookie that is already present in the target list."""
        collected = [CookieParam(name='existing', value='value1')]
        incoming = [
            CookieParam(name='new', value='value2'),
            CookieParam(name='existing', value='value1')  # Duplicate
        ]

        request_instance._add_unique_cookies(collected, incoming)

        assert len(collected) == 2
        names_after_merge = [cookie['name'] for cookie in collected]
        for wanted_name in ('existing', 'new'):
            assert wanted_name in names_after_merge

    def test_parse_set_cookie_header_multiline(self, request_instance):
        """A newline-separated header produces one cookie per line, in order."""
        raw_header = 'cookie1=value1; Path=/\ncookie2=value2; Secure'

        cookies = request_instance._parse_set_cookie_header(raw_header)

        assert len(cookies) == 2
        assert cookies[0]['name'] == 'cookie1'
        assert cookies[1]['name'] == 'cookie2'


class TestRequestEdgeCases:
    """Boundary inputs for Request and its helpers."""

    @pytest.mark.asyncio
    async def test_request_with_empty_url(self, request_instance):
        """An empty URL still reaches _execute_fetch_request exactly once."""
        empty_result = {'result': {'result': {'value': {}}}}

        with patch.object(
                 request_instance, '_execute_fetch_request', return_value=empty_result
             ) as fetch_spy, \
             patch.object(request_instance, '_extract_received_headers', return_value=[]), \
             patch.object(request_instance, '_extract_sent_headers', return_value=[]), \
             patch.object(request_instance, '_extract_set_cookies', return_value=[]), \
             patch.object(request_instance, '_build_response', return_value=Mock()), \
             patch.object(request_instance, '_clear_callbacks'):
            await request_instance.request('GET', '')

            fetch_spy.assert_called_once()

    def test_build_url_with_special_characters(self, request_instance):
        """Spaces, '&' and '=' inside parameter values are percent/plus encoded."""
        built = request_instance._build_url_with_params(
            'https://example.com',
            {'q': 'hello world', 'special': 'value&with=chars'},
        )

        # Either encoding of the space is accepted.
        assert 'hello+world' in built or 'hello%20world' in built
        assert 'value%26with%3Dchars' in built

    def test_handle_data_options_with_bytes(self, request_instance):
        """Bytes data is used as the body verbatim and no Content-Type is added."""
        payload = b'binary data'
        options = {'headers': {}}

        request_instance._handle_data_options(options, payload)

        assert options['body'] == payload
        assert 'Content-Type' not in options['headers']

    def test_convert_header_entries_empty_list(self, request_instance):
        """No header entries convert to an empty dict."""
        converted = request_instance._convert_header_entries_to_dict([])

        assert converted == {}

    def test_convert_dict_to_header_entries_empty_dict(self, request_instance):
        """An empty dict converts to an empty list of entries."""
        converted = request_instance._convert_dict_to_header_entries({})

        assert converted == []


class TestRequestHeaderExtraction:
    """Test header extraction methods from network events."""

    def test_extract_received_headers(self, request_instance):
        """_extract_received_headers returns the headers of stored response events."""
        from pydoll.protocol.network.events import NetworkEvent

        response_headers = {
            'Content-Type': 'application/json',
            'Content-Length': '100',
            'Server': 'nginx/1.18.0',
        }
        request_instance._requests_received = [
            {
                'method': NetworkEvent.RESPONSE_RECEIVED,
                'params': {'response': {'headers': dict(response_headers)}},
            },
            {
                'method': NetworkEvent.RESPONSE_RECEIVED_EXTRA_INFO,
                'params': {
                    'blockedCookies': [],
                    'headers': {
                        'Set-Cookie': 'session=abc123; Path=/',
                        'X-Custom-Header': 'custom-value',
                    },
                },
            },
        ]

        extracted = request_instance._extract_received_headers()

        # Lower bound only: at least Content-Type, Content-Length and Server.
        assert len(extracted) >= 3
        by_name = {entry['name']: entry['value'] for entry in extracted}
        for name, value in response_headers.items():
            assert by_name.get(name) == value

    def test_extract_sent_headers(self, request_instance):
        """_extract_sent_headers returns the headers of stored request events."""
        from pydoll.protocol.network.events import NetworkEvent

        request_headers = {
            'User-Agent': 'PyDoll/1.0',
            'Accept': 'application/json',
            'Authorization': 'Bearer token123',
        }
        request_instance._requests_sent = [
            {
                'method': NetworkEvent.REQUEST_WILL_BE_SENT,
                'params': {'request': {'headers': dict(request_headers)}},
            },
            {
                'method': NetworkEvent.REQUEST_WILL_BE_SENT_EXTRA_INFO,
                'params': {
                    'associatedCookies': [],
                    'headers': {
                        'X-Forwarded-For': '192.168.1.1',
                        'X-Custom-Request': 'test-value',
                    },
                },
            },
        ]

        extracted = request_instance._extract_sent_headers()

        # Lower bound only: at least User-Agent, Accept and Authorization.
        assert len(extracted) >= 3
        by_name = {entry['name']: entry['value'] for entry in extracted}
        for name, value in request_headers.items():
            assert by_name.get(name) == value

    def test_extract_headers_from_events_with_response_events(self, request_instance):
        """Headers of response and response-extra-info events are all collected."""
        from pydoll.protocol.network.events import NetworkEvent

        main_headers = {'Content-Type': 'text/html', 'Cache-Control': 'no-cache'}
        extra_headers = {
            'X-Frame-Options': 'DENY',
            'Strict-Transport-Security': 'max-age=31536000',
        }
        expected = {**main_headers, **extra_headers}

        response_events = [
            {
                'method': NetworkEvent.RESPONSE_RECEIVED,
                'params': {'response': {'headers': main_headers}},
            },
            {
                'method': NetworkEvent.RESPONSE_RECEIVED_EXTRA_INFO,
                'params': {'blockedCookies': [], 'headers': extra_headers},
            },
        ]
        # Each extractor is selected by a key found in the event params.
        extractors = {
            'response': request_instance._extract_response_received_headers,
            'blockedCookies': request_instance._extract_response_received_extra_info_headers,
        }

        collected = request_instance._extract_headers_from_events(response_events, extractors)

        # Four distinct headers in, four entries out.
        assert len(collected) == 4
        assert {entry['name']: entry['value'] for entry in collected} == expected

    def test_extract_headers_from_events_with_request_events(self, request_instance):
        """Headers of request and request-extra-info events are all collected."""
        from pydoll.protocol.network.events import NetworkEvent

        main_headers = {'Host': 'api.example.com', 'Connection': 'keep-alive'}
        extra_headers = {
            'Accept-Encoding': 'gzip, deflate',
            'Accept-Language': 'en-US,en;q=0.9',
        }
        expected = {**main_headers, **extra_headers}

        request_events = [
            {
                'method': NetworkEvent.REQUEST_WILL_BE_SENT,
                'params': {'request': {'headers': main_headers}},
            },
            {
                'method': NetworkEvent.REQUEST_WILL_BE_SENT_EXTRA_INFO,
                'params': {'associatedCookies': [], 'headers': extra_headers},
            },
        ]
        # Each extractor is selected by a key found in the event params.
        extractors = {
            'request': request_instance._extract_request_sent_headers,
            'associatedCookies': request_instance._extract_request_sent_extra_info_headers,
        }

        collected = request_instance._extract_headers_from_events(request_events, extractors)

        # Four distinct headers in, four entries out.
        assert len(collected) == 4
        assert {entry['name']: entry['value'] for entry in collected} == expected

    def test_extract_headers_from_events_deduplication(self, request_instance):
        """A header repeated identically across events is reported only once."""
        from pydoll.protocol.network.events import NetworkEvent

        response_event = {
            'method': NetworkEvent.RESPONSE_RECEIVED,
            'params': {
                'response': {
                    'headers': {'Content-Type': 'application/json', 'Server': 'nginx'},
                },
            },
        }
        extra_info_event = {
            'method': NetworkEvent.RESPONSE_RECEIVED_EXTRA_INFO,
            'params': {
                'blockedCookies': [],
                # Content-Type repeats the response event's name and value.
                'headers': {'Content-Type': 'application/json', 'X-Custom': 'value'},
            },
        }
        extractors = {
            'response': request_instance._extract_response_received_headers,
            'blockedCookies': request_instance._extract_response_received_extra_info_headers,
        }

        deduped = request_instance._extract_headers_from_events(
            [response_event, extra_info_event], extractors
        )

        content_type_entries = [entry for entry in deduped if entry['name'] == 'Content-Type']
        assert len(content_type_entries) == 1
        # Content-Type (once), Server and X-Custom.
        assert len(deduped) == 3

    def test_extract_headers_from_events_empty_events(self, request_instance):
        """With no events to scan, the result is an empty list."""
        extractors = {'response': request_instance._extract_response_received_headers}

        collected = request_instance._extract_headers_from_events([], extractors)

        assert collected == []

    def test_extract_headers_from_events_no_matching_keys(self, request_instance):
        """Events whose params hold none of the extractor keys yield no headers."""
        from pydoll.protocol.network.events import NetworkEvent

        # The headers sit under 'someOtherKey', which no extractor is registered for.
        unmatched_event = {
            'method': NetworkEvent.RESPONSE_RECEIVED,
            'params': {
                'someOtherKey': {'headers': {'Content-Type': 'application/json'}},
            },
        }
        extractors = {'response': request_instance._extract_response_received_headers}

        collected = request_instance._extract_headers_from_events([unmatched_event], extractors)

        assert collected == []

    def test_extract_request_sent_headers(self, request_instance):
        """_extract_request_sent_headers reads the headers nested under 'request'."""
        expected = {
            'User-Agent': 'Mozilla/5.0',
            'Accept': '*/*',
            'Content-Type': 'application/json',
            'Authorization': 'Bearer secret-token',
        }
        event_params = {
            'request': {'headers': dict(expected)},
            'otherData': 'should be ignored',
        }

        extracted = request_instance._extract_request_sent_headers(event_params)

        # One entry per header; the unrelated 'otherData' key adds nothing.
        assert len(extracted) == 4
        assert {entry['name']: entry['value'] for entry in extracted} == expected

    def test_extract_request_sent_headers_empty_headers(self, request_instance):
        """An empty 'headers' mapping under 'request' yields an empty list."""
        event_params = {'request': {'headers': {}}}

        assert request_instance._extract_request_sent_headers(event_params) == []

    def test_extract_request_sent_headers_missing_headers_key(self, request_instance):
        """A 'request' payload without a 'headers' key yields an empty list."""
        request_without_headers = {'url': 'https://example.com', 'method': 'GET'}
        event_params = {'request': request_without_headers}

        assert request_instance._extract_request_sent_headers(event_params) == []

    def test_extract_request_sent_extra_info_headers(self, request_instance):
        """_extract_request_sent_extra_info_headers reads the top-level 'headers'."""
        expected = {
            'X-Forwarded-For': '10.0.0.1',
            'X-Real-IP': '192.168.1.100',
            'X-Custom-Header': 'extra-info-value',
        }
        event_params = {
            'headers': dict(expected),
            'associatedCookies': [],
            'otherData': 'should be ignored',
        }

        extracted = request_instance._extract_request_sent_extra_info_headers(event_params)

        # One entry per header; the sibling keys add nothing.
        assert len(extracted) == 3
        assert {entry['name']: entry['value'] for entry in extracted} == expected

    def test_extract_request_sent_extra_info_headers_empty(self, request_instance):
        """An empty top-level 'headers' mapping yields an empty list."""
        event_params = {'headers': {}, 'associatedCookies': []}

        assert request_instance._extract_request_sent_extra_info_headers(event_params) == []

    def test_extract_request_sent_extra_info_headers_missing_headers(self, request_instance):
        """Extra-info params without a 'headers' key yield an empty list."""
        event_params = {'associatedCookies': [], 'otherData': 'value'}

        assert request_instance._extract_request_sent_extra_info_headers(event_params) == []

    def test_extract_response_received_headers(self, request_instance):
        """_extract_response_received_headers reads the headers nested under 'response'."""
        expected = {
            'Content-Type': 'text/html; charset=utf-8',
            'Content-Length': '1024',
            'Last-Modified': 'Wed, 21 Oct 2015 07:28:00 GMT',
            'ETag': '"33a64df551425fcc55e4d42a148795d9f25f89d4"',
        }
        event_params = {
            'response': {'headers': dict(expected)},
            'otherData': 'should be ignored',
        }

        extracted = request_instance._extract_response_received_headers(event_params)

        # One entry per header; the unrelated 'otherData' key adds nothing.
        assert len(extracted) == 4
        assert {entry['name']: entry['value'] for entry in extracted} == expected

    def test_extract_response_received_extra_info_headers(self, request_instance):
        """_extract_response_received_extra_info_headers reads the top-level 'headers'."""
        expected = {
            'Set-Cookie': 'sessionid=abc123; HttpOnly; Secure',
            'X-Content-Type-Options': 'nosniff',
            'X-XSS-Protection': '1; mode=block',
            'Referrer-Policy': 'strict-origin-when-cross-origin',
        }
        event_params = {
            'headers': dict(expected),
            'blockedCookies': [],
            'otherData': 'should be ignored',
        }

        extracted = request_instance._extract_response_received_extra_info_headers(event_params)

        # One entry per header; the sibling keys add nothing.
        assert len(extracted) == 4
        assert {entry['name']: entry['value'] for entry in extracted} == expected

    def test_header_extraction_with_complex_values(self, request_instance):
        """Header values containing quotes, commas and semicolons are extracted."""
        from pydoll.protocol.network.events import NetworkEvent

        complex_headers = {
            'Content-Security-Policy': "default-src 'self'; script-src 'self' 'unsafe-inline'; style-src 'self' 'unsafe-inline'",
            'Link': '</css/style.css>; rel=preload; as=style, </js/app.js>; rel=preload; as=script',
            'Cache-Control': 'public, max-age=3600, s-maxage=7200, must-revalidate',
        }
        response_event = {
            'method': NetworkEvent.RESPONSE_RECEIVED,
            'params': {'response': {'headers': complex_headers}},
        }
        extractors = {'response': request_instance._extract_response_received_headers}

        collected = request_instance._extract_headers_from_events([response_event], extractors)
        by_name = {entry['name']: entry['value'] for entry in collected}

        # Each header must be present and still contain a telltale fragment.
        expected_fragments = (
            ('Content-Security-Policy', "default-src 'self'"),
            ('Link', 'rel=preload'),
            ('Cache-Control', 'must-revalidate'),
        )
        for name, fragment in expected_fragments:
            assert name in by_name
            assert fragment in by_name[name]

    def test_header_extraction_integration_flow(self, request_instance):
        """Sent and received headers are extracted independently of each other."""
        from pydoll.protocol.network.events import NetworkEvent

        request_headers = {
            'Host': 'api.example.com',
            'User-Agent': 'PyDoll/1.0',
            'Accept': 'application/json',
        }
        response_headers = {
            'Content-Type': 'application/json',
            'Server': 'nginx/1.18.0',
            'Content-Length': '256',
        }

        # One request event and one response event, stored on separate lists.
        request_instance._requests_sent = [
            {
                'method': NetworkEvent.REQUEST_WILL_BE_SENT,
                'params': {'request': {'headers': dict(request_headers)}},
            },
        ]
        request_instance._requests_received = [
            {
                'method': NetworkEvent.RESPONSE_RECEIVED,
                'params': {'response': {'headers': dict(response_headers)}},
            },
        ]

        sent = request_instance._extract_sent_headers()
        received = request_instance._extract_received_headers()

        assert {entry['name']: entry['value'] for entry in sent} == request_headers
        assert {entry['name']: entry['value'] for entry in received} == response_headers

        # Three entries on each side, and the two sides do not coincide.
        assert len(sent) == 3
        assert len(received) == 3
        assert sent != received

    def test_filter_response_extra_info_events(self, request_instance):
        """Only RESPONSE_RECEIVED_EXTRA_INFO events pass the filter."""
        from pydoll.protocol.network.events import NetworkEvent

        def extra_info_event(set_cookie):
            # Build a response-extra-info event carrying one Set-Cookie header.
            return {
                'method': NetworkEvent.RESPONSE_RECEIVED_EXTRA_INFO,
                'params': {
                    'headers': {'Set-Cookie': set_cookie},
                    'blockedCookies': [],
                },
            }

        # Matching events are interleaved with two of other kinds.
        request_instance._requests_received = [
            {
                'method': NetworkEvent.RESPONSE_RECEIVED,
                'params': {'response': {'headers': {}}},
            },
            extra_info_event('session=abc123; Path=/'),
            {
                'method': NetworkEvent.REQUEST_WILL_BE_SENT,
                'params': {'request': {'headers': {}}},
            },
            extra_info_event('token=xyz789; Secure'),
        ]

        matches = request_instance._filter_response_extra_info_events()

        assert len(matches) == 2
        for match in matches:
            assert match['method'] == NetworkEvent.RESPONSE_RECEIVED_EXTRA_INFO
            event_params = match['params']
            assert 'headers' in event_params
            assert 'Set-Cookie' in event_params['headers']

    def test_filter_response_extra_info_events_empty(self, request_instance):
        """The filter returns an empty list when no extra-info event is stored."""
        from pydoll.protocol.network.events import NetworkEvent

        # Neither stored event is a RESPONSE_RECEIVED_EXTRA_INFO event.
        response_event = {
            'method': NetworkEvent.RESPONSE_RECEIVED,
            'params': {'response': {'headers': {}}},
        }
        request_event = {
            'method': NetworkEvent.REQUEST_WILL_BE_SENT,
            'params': {'request': {'headers': {}}},
        }
        request_instance._requests_received = [response_event, request_event]

        assert request_instance._filter_response_extra_info_events() == []

    def test_filter_response_extra_info_events_no_events(self, request_instance):
        """The filter returns an empty list when nothing has been received."""
        request_instance._requests_received = []

        assert request_instance._filter_response_extra_info_events() == []

    def test_extract_set_cookies_basic(self, request_instance):
        """One Set-Cookie header per extra-info event yields one cookie per event."""
        from pydoll.protocol.network.events import NetworkEvent

        first_event = {
            'method': NetworkEvent.RESPONSE_RECEIVED_EXTRA_INFO,
            'params': {
                'headers': {
                    'Set-Cookie': 'sessionid=abc123; Path=/; HttpOnly',
                    'Content-Type': 'application/json',
                },
                'blockedCookies': [],
            },
        }
        second_event = {
            'method': NetworkEvent.RESPONSE_RECEIVED_EXTRA_INFO,
            'params': {
                'headers': {
                    'Set-Cookie': 'userid=456; Domain=.example.com; Secure',
                    'X-Custom': 'value',
                },
                'blockedCookies': [],
            },
        }
        request_instance._requests_received = [first_event, second_event]

        cookies = request_instance._extract_set_cookies()

        # Only each cookie's name and value are checked; attributes are not.
        assert len(cookies) == 2
        assert {cookie['name']: cookie['value'] for cookie in cookies} == {
            'sessionid': 'abc123',
            'userid': '456',
        }

    def test_extract_set_cookies_multiple_cookies_same_header(self, request_instance):
        """A newline-joined Set-Cookie header value is split into separate cookies."""
        from pydoll.protocol.network.events import NetworkEvent

        # Several cookies share one header value, separated by newlines (not commas).
        joined_set_cookie = '\n'.join([
            'cookie1=value1; Path=/',
            'cookie2=value2; HttpOnly',
            'cookie3=value3; Secure',
        ])
        request_instance._requests_received = [
            {
                'method': NetworkEvent.RESPONSE_RECEIVED_EXTRA_INFO,
                'params': {
                    'headers': {'Set-Cookie': joined_set_cookie},
                    'blockedCookies': [],
                },
            },
        ]

        cookies = request_instance._extract_set_cookies()

        # One cookie per line; only name and value are checked.
        assert len(cookies) == 3
        assert {cookie['name']: cookie['value'] for cookie in cookies} == {
            'cookie1': 'value1',
            'cookie2': 'value2',
            'cookie3': 'value3',
        }

    def test_extract_set_cookies_duplicate_names(self, request_instance):
        """Cookies sharing a name but carrying different values are both kept.

        Two extra-info events each set ``sessionid`` with a different value
        (and a different ``Path``). The test expects one extracted entry per
        event rather than a single merged entry.
        """
        from pydoll.protocol.network.events import NetworkEvent

        def extra_info_event(set_cookie):
            # Build a response-extra-info event carrying one Set-Cookie header.
            return {
                'method': NetworkEvent.RESPONSE_RECEIVED_EXTRA_INFO,
                'params': {
                    'headers': {'Set-Cookie': set_cookie},
                    'blockedCookies': [],
                },
            }

        request_instance._requests_received = [
            extra_info_event('sessionid=first_value; Path=/admin'),
            extra_info_event('sessionid=second_value; Path=/user'),
        ]

        cookies = request_instance._extract_set_cookies()

        # Both entries survive. NOTE(review): presumably deduplication compares
        # whole name/value entries, not names alone; confirm in _extract_set_cookies.
        assert len(cookies) == 2
        assert [cookie['name'] for cookie in cookies] == ['sessionid', 'sessionid']

        # The order of the two values is deliberately not asserted.
        assert sorted(cookie['value'] for cookie in cookies) == ['first_value', 'second_value']

    def test_extract_set_cookies_complex_values(self, request_instance):
        """A cookie followed by many attributes is extracted by name and value."""
        from pydoll.protocol.network.events import NetworkEvent

        set_cookie = 'auth_token=eyJhbGciOiJIUzI1NiIsInR5cCI6IkpXVCJ9; Domain=api.example.com; Path=/api; Secure; HttpOnly; SameSite=Strict; Max-Age=3600'
        request_instance._requests_received = [
            {
                'method': NetworkEvent.RESPONSE_RECEIVED_EXTRA_INFO,
                'params': {
                    'headers': {'Set-Cookie': set_cookie},
                    'blockedCookies': [],
                },
            },
        ]

        cookies = request_instance._extract_set_cookies()

        # Domain, Path, Secure and the other attributes are not checked here.
        assert len(cookies) == 1
        extracted = cookies[0]
        assert extracted['name'] == 'auth_token'
        assert extracted['value'] == 'eyJhbGciOiJIUzI1NiIsInR5cCI6IkpXVCJ9'

    def test_extract_set_cookies_no_set_cookie_headers(self, request_instance):
        """Extra-info events with no Set-Cookie header yield no cookies."""
        from pydoll.protocol.network.events import NetworkEvent

        headers_without_cookie = {
            'Content-Type': 'application/json',
            'X-Custom-Header': 'value',
        }
        request_instance._requests_received = [
            {
                'method': NetworkEvent.RESPONSE_RECEIVED_EXTRA_INFO,
                'params': {
                    'headers': headers_without_cookie,
                    'blockedCookies': [],
                },
            },
        ]

        assert request_instance._extract_set_cookies() == []

    def test_extract_set_cookies_empty_events(self, request_instance):
        """With no received events stored, no cookies are extracted."""
        request_instance._requests_received = []

        assert request_instance._extract_set_cookies() == []

    def test_extract_set_cookies_malformed_cookies(self, request_instance):
        """Malformed lines in a Set-Cookie header are skipped; valid ones are kept."""
        from pydoll.protocol.network.events import NetworkEvent

        # Newline-separated cookie lines: two well-formed, one with no '=',
        # and one with an empty name.
        joined_set_cookie = '\n'.join([
            'valid_cookie=value123; Path=/',
            'malformed_cookie_no_value',
            '=empty_name_cookie; HttpOnly',
            'another_valid=test',
        ])
        request_instance._requests_received = [
            {
                'method': NetworkEvent.RESPONSE_RECEIVED_EXTRA_INFO,
                'params': {
                    'headers': {'Set-Cookie': joined_set_cookie},
                    'blockedCookies': [],
                },
            },
        ]

        cookies = request_instance._extract_set_cookies()

        # Only the two well-formed, non-empty-name cookies are expected back.
        assert len(cookies) == 2
        assert {cookie['name']: cookie['value'] for cookie in cookies} == {
            'valid_cookie': 'value123',
            'another_valid': 'test',
        }

    def test_extract_set_cookies_edge_case_attributes(self, request_instance):
        """Unusual attributes (Expires with a comma, Priority) do not disturb parsing."""
        from pydoll.protocol.network.events import NetworkEvent

        set_cookie = 'test_cookie=value; Expires=Wed, 09 Jun 2021 10:18:14 GMT; Max-Age=0; SameSite=None; Priority=High'
        request_instance._requests_received = [
            {
                'method': NetworkEvent.RESPONSE_RECEIVED_EXTRA_INFO,
                'params': {
                    'headers': {'Set-Cookie': set_cookie},
                    'blockedCookies': [],
                },
            },
        ]

        cookies = request_instance._extract_set_cookies()

        # Expires, Max-Age, SameSite and Priority are not checked here.
        assert len(cookies) == 1
        extracted = cookies[0]
        assert extracted['name'] == 'test_cookie'
        assert extracted['value'] == 'value'

    def test_extract_set_cookies_integration_with_filter(self, request_instance):
        """Check that cookies are taken only from RESPONSE_RECEIVED_EXTRA_INFO events.

        Events of other types are interleaved with two extra-info events; the
        assertions require that exactly the cookies of those two events come back.
        """
        from pydoll.protocol.network.events import NetworkEvent

        def extra_info(set_cookie_value):
            # Build a RESPONSE_RECEIVED_EXTRA_INFO event carrying one Set-Cookie header.
            return {
                'method': NetworkEvent.RESPONSE_RECEIVED_EXTRA_INFO,
                'params': {
                    'headers': {'Set-Cookie': set_cookie_value},
                    'blockedCookies': [],
                },
            }

        request_sent = {
            'method': NetworkEvent.REQUEST_WILL_BE_SENT,
            'params': {'request': {'headers': {}}},
        }
        response_received = {
            'method': NetworkEvent.RESPONSE_RECEIVED,
            'params': {'response': {'headers': {}}},
        }

        # Relevant and irrelevant events alternate, in the same order as a real capture might.
        request_instance._requests_received = [
            request_sent,
            extra_info('filtered_cookie=should_be_extracted; Path=/'),
            response_received,
            extra_info('another_cookie=also_extracted; HttpOnly'),
        ]

        extracted = request_instance._extract_set_cookies()

        # One cookie per extra-info event.
        assert len(extracted) == 2

        names = [entry['name'] for entry in extracted]
        assert 'filtered_cookie' in names
        assert 'another_cookie' in names

    def test_extract_set_cookies_empty_name_rejection(self, request_instance):
        """Check that entries whose name is empty or whitespace-only are not returned."""
        from pydoll.protocol.network.events import NetworkEvent

        # One valid cookie followed by three entries whose name part is empty,
        # a single space, or a single tab.
        response_headers = {
            'Set-Cookie': 'valid_cookie=value\n=empty_name_value\n =space_only_name_value\n\t=tab_only_name_value'
        }
        request_instance._requests_received = [
            {
                'method': NetworkEvent.RESPONSE_RECEIVED_EXTRA_INFO,
                'params': {
                    'headers': response_headers,
                    'blockedCookies': [],
                },
            }
        ]

        extracted = request_instance._extract_set_cookies()

        # Only the properly named cookie may survive.
        assert len(extracted) == 1
        survivor = extracted[0]
        assert survivor['name'] == 'valid_cookie'
        assert survivor['value'] == 'value'

    def test_parse_cookie_line_empty_name_validation(self, request_instance):
        """Exercise _parse_cookie_line with empty, whitespace-only and valid names."""
        # Lines whose name part is empty or consists only of whitespace must yield None.
        for raw_line in ('=value', ' =value', '\t=value', '  \t  =value'):
            assert request_instance._parse_cookie_line(raw_line) is None

        # A plain pair and a pair padded with spaces must both produce the
        # trimmed name and value.
        for raw_line in ('name=value', '  name  =  value  '):
            parsed = request_instance._parse_cookie_line(raw_line)
            assert parsed is not None
            assert parsed['name'] == 'name'
            assert parsed['value'] == 'value'

================================================
FILE: tests/test_browser/test_requests_response.py
================================================
"""
Tests for pydoll.browser.requests.response module.
"""

import json
import pytest

from pydoll.browser.requests.response import Response, STATUS_CODE_RANGE_OK
from pydoll.exceptions import HTTPError
from pydoll.protocol.fetch.types import HeaderEntry
from pydoll.protocol.network.types import CookieParam


class TestResponseInitialization:
    """Constructor behaviour of the Response class."""

    def test_response_initialization_minimal(self):
        """A Response built from only a status code exposes empty defaults."""
        minimal = Response(status_code=200)

        assert minimal.status_code == 200
        assert minimal.content == b''
        assert minimal.text == ''
        # The three collections must compare equal to empty lists.
        assert minimal.headers == []
        assert minimal.request_headers == []
        assert minimal.cookies == []
        assert minimal.ok is True

    def test_response_initialization_full(self):
        """Every constructor argument is reflected by the matching accessor."""
        expected_headers = [HeaderEntry(name='Content-Type', value='application/json')]
        expected_request_headers = [HeaderEntry(name='User-Agent', value='Test-Agent')]
        expected_cookies = [CookieParam(name='session', value='abc123')]
        payload = {'message': 'success'}

        populated = Response(
            status_code=201,
            content=b'{"message": "success"}',
            text='{"message": "success"}',
            json=payload,
            response_headers=expected_headers,
            request_headers=expected_request_headers,
            cookies=expected_cookies,
            url='https://example.com',
        )

        assert populated.status_code == 201
        assert populated.content == b'{"message": "success"}'
        assert populated.text == '{"message": "success"}'
        assert populated.headers == expected_headers
        assert populated.request_headers == expected_request_headers
        assert populated.cookies == expected_cookies
        assert populated.ok is True

    def test_response_initialization_with_none_values(self):
        """Explicit None for the collection arguments is exposed as empty lists."""
        from_none = Response(
            status_code=200,
            response_headers=None,
            request_headers=None,
            cookies=None,
        )

        assert from_none.headers == []
        assert from_none.request_headers == []
        assert from_none.cookies == []


class TestResponseProperties:
    """Read-only accessors exposed by Response."""

    def test_ok_property_success_codes(self):
        """ok is True for each sampled status code between 200 and 399."""
        for code in (200, 201, 204, 299, 300, 301, 302, 399):
            response = Response(status_code=code)
            assert response.ok is True, f"Status code {code} should be ok"

    def test_ok_property_error_codes(self):
        """ok is False for each sampled 4xx and 5xx status code."""
        for code in (400, 401, 403, 404, 500, 502, 503):
            response = Response(status_code=code)
            assert response.ok is False, f"Status code {code} should not be ok"

    def test_status_code_property(self):
        """status_code returns the value given to the constructor."""
        assert Response(status_code=404).status_code == 404

    def test_content_property(self):
        """content returns the constructor's bytes and is a bytes instance."""
        payload = b'Hello, World!'
        response = Response(status_code=200, content=payload)
        assert response.content == payload
        assert isinstance(response.content, bytes)

    def test_text_property_provided(self):
        """text returns the string passed explicitly to the constructor."""
        body = 'Hello, World!'
        response = Response(status_code=200, text=body)
        assert response.text == body

    def test_text_property_decoded_from_content(self):
        """text is derived from content when no text argument is given."""
        response = Response(status_code=200, content=b'Hello, World!')
        assert response.text == 'Hello, World!'

    def test_text_property_handles_encoding_errors(self):
        """Bytes that are not valid UTF-8 still produce a non-empty string."""
        undecodable = b'\xff\xfe\xfd'
        response = Response(status_code=200, content=undecodable)

        # Accessing text must not raise, and must give back some text.
        decoded = response.text
        assert isinstance(decoded, str)
        assert len(decoded) > 0

    def test_text_property_empty_content(self):
        """Empty content results in empty text."""
        assert Response(status_code=200, content=b'').text == ''

    def test_headers_property(self):
        """headers returns the response headers given to the constructor."""
        response_headers = [
            HeaderEntry(name='Content-Type', value='application/json'),
            HeaderEntry(name='Content-Length', value='100'),
        ]
        response = Response(status_code=200, response_headers=response_headers)
        assert response.headers == response_headers

    def test_request_headers_property(self):
        """request_headers returns the request headers given to the constructor."""
        sent_headers = [
            HeaderEntry(name='User-Agent', value='Test-Agent'),
            HeaderEntry(name='Accept', value='application/json'),
        ]
        response = Response(status_code=200, request_headers=sent_headers)
        assert response.request_headers == sent_headers

    def test_cookies_property(self):
        """cookies returns the cookie list given to the constructor."""
        jar = [
            CookieParam(name='session', value='abc123'),
            CookieParam(name='csrf', value='token456'),
        ]
        response = Response(status_code=200, cookies=jar)
        assert response.cookies == jar

    def test_url_property(self):
        """url returns the URL given to the constructor."""
        target = 'https://api.example.com/data'
        response = Response(status_code=200, url=target)
        assert response.url == target

    def test_url_property_empty(self):
        """An empty URL is returned unchanged."""
        assert Response(status_code=200, url='').url == ''


class TestResponseJSONMethod:
    """Behaviour of Response.json()."""

    def test_json_method_with_provided_json(self):
        """json() returns data equal to what was supplied through the json argument."""
        supplied = {'message': 'success', 'code': 200}
        response = Response(status_code=200, json=supplied)

        assert response.json() == supplied

    def test_json_method_parses_from_text(self):
        """json() parses the text body when no json argument was given."""
        response = Response(status_code=200, text='{"message": "success", "code": 200}')

        assert response.json() == {'message': 'success', 'code': 200}

    def test_json_method_caches_result(self):
        """Two consecutive json() calls return the very same object."""
        response = Response(status_code=200, text='{"message": "success"}')

        first_call = response.json()
        second_call = response.json()

        assert first_call == second_call
        # Identity, not just equality: the second call must reuse the first result.
        assert first_call is second_call

    def test_json_method_invalid_json_raises_error(self):
        """Text that is not JSON makes json() raise ValueError."""
        response = Response(status_code=200, text='invalid json')

        with pytest.raises(ValueError, match='Response is not valid JSON'):
            response.json()

    def test_json_method_empty_text(self):
        """An empty text body makes json() raise ValueError."""
        response = Response(status_code=200, text='')

        with pytest.raises(ValueError, match='Response is not valid JSON'):
            response.json()

    def test_json_method_with_array(self):
        """A top-level JSON array is returned as a list."""
        response = Response(status_code=200, text='[{"id": 1}, {"id": 2}]')

        assert response.json() == [{'id': 1}, {'id': 2}]

    def test_json_method_with_primitive_values(self):
        """Top-level JSON primitives are parsed to the matching Python values."""
        primitive_cases = (
            ('true', True),
            ('false', False),
            ('null', None),
            ('42', 42),
            ('"string"', 'string'),
        )

        for raw_text, expected_value in primitive_cases:
            response = Response(status_code=200, text=raw_text)
            assert response.json() == expected_value


class TestResponseRaiseForStatus:
    """Test Response raise_for_status() method."""

    def test_raise_for_status_success_codes(self):
        """Test raise_for_status() does not raise for success codes."""
        success_codes = [200, 201, 204, 299, 300, 301, 302, 399]

        for code in success_codes:
            response = Response(status_code=code, url='https://example.com')
            # Should not raise any exception
            response.raise_for_status()

    def test_raise_for_status_client_error(self):
        """Test raise_for_status() raises for client error codes."""
        error_codes = [400, 401, 403, 404, 422, 499]

        for code in error_codes:
            response = Response(status_code=code, url='https://example.com')
            with pytest.raises(HTTPError, match=f'{code} Client Error'):
                response.raise_for_status()

    def test_raise_for_status_server_error(self):
        """Test raise_for_status() raises for server error codes."""
        error_codes = [500, 502, 503, 504, 599]

        for code in error_codes:
            response = Response(status_code=code, url='https://example.com')
            # NOTE(review): the expected message says "Client Error" even for 5xx
            # codes; this mirrors what the test has always asserted - confirm
            # against Response.raise_for_status before changing the wording.
            with pytest.raises(HTTPError, match=f'{code} Client Error'):
                response.raise_for_status()

    def test_raise_for_status_includes_url(self):
        """Test raise_for_status() includes URL in error message."""
        import re

        url = 'https://api.example.com/endpoint'
        response = Response(status_code=404, url=url)

        # pytest.raises(match=...) performs a regex search, so the URL must be
        # escaped; otherwise each '.' would match any character and the check
        # would accept messages that do not contain the literal URL.
        with pytest.raises(HTTPError, match='for url ' + re.escape(url)):
            response.raise_for_status()

    def test_raise_for_status_empty_url(self):
        """Test raise_for_status() works with empty URL."""
        response = Response(status_code=500, url='')

        with pytest.raises(HTTPError, match='500 Client Error: for url'):
            response.raise_for_status()


class TestHTTPErrorException:
    """Basic properties of the HTTPError exception type."""

    def test_http_error_creation(self):
        """str() of an HTTPError gives back the message it was built with."""
        assert str(HTTPError('Test error message')) == 'Test error message'

    def test_http_error_inheritance(self):
        """An HTTPError instance is also an Exception instance."""
        raised = HTTPError('Test error')
        assert isinstance(raised, Exception)

    def test_http_error_with_format_string(self):
        """A message assembled with an f-string is preserved verbatim."""
        status_code = 404
        url = 'https://example.com'
        raised = HTTPError(f'{status_code} Client Error: for url {url}')

        assert str(raised) == '404 Client Error: for url https://example.com'


class TestResponseEdgeCases:
    """Unusual inputs and boundary conditions for Response."""

    def test_response_with_binary_content(self):
        """Content holding every byte value 0-255 is returned unchanged as bytes."""
        every_byte = bytes(range(256))
        response = Response(status_code=200, content=every_byte)

        assert response.content == every_byte
        assert isinstance(response.content, bytes)

    def test_response_with_unicode_text(self):
        """Text with emoji and CJK characters is returned unchanged."""
        unicode_text = '🌟 Hello, 世界! 🚀'
        response = Response(status_code=200, text=unicode_text)

        assert response.text == unicode_text

    def test_response_text_lazy_decoding(self):
        """Repeated access to text gives the same decoded string each time."""
        encoded = 'Hello, World!'.encode('utf-8')
        response = Response(status_code=200, content=encoded)

        # Read the property twice and compare both reads.
        first_read = response.text
        second_read = response.text

        assert first_read == second_read
        assert first_read == 'Hello, World!'

    def test_response_with_large_content(self):
        """A payload of one million bytes is stored and returned intact."""
        big_payload = b'x' * 1000000
        response = Response(status_code=200, content=big_payload)

        assert len(response.content) == 1000000
        assert response.content == big_payload

    def test_response_status_code_boundary_values(self):
        """ok agrees with membership in STATUS_CODE_RANGE_OK at range boundaries."""
        for code in (100, 199, 200, 299, 300, 399, 400, 499, 500, 599):
            response = Response(status_code=code)
            assert response.status_code == code

            # ok must be exactly True inside the OK range and exactly False outside it.
            expected_ok = code in STATUS_CODE_RANGE_OK
            assert response.ok is expected_ok

    def test_response_with_complex_headers(self):
        """Repeated header names and values containing spaces are preserved."""
        header_entries = [
            HeaderEntry(name='Set-Cookie', value='session=abc; Path=/'),
            HeaderEntry(name='Set-Cookie', value='csrf=xyz; HttpOnly'),
            HeaderEntry(name='Content-Type', value='application/json; charset=utf-8'),
            HeaderEntry(name='X-Custom-Header', value='custom value with spaces'),
        ]

        response = Response(status_code=200, response_headers=header_entries)
        assert len(response.headers) == 4
        assert response.headers == header_entries

    def test_response_with_empty_json_object(self):
        """The text '{}' parses to an empty dict."""
        assert Response(status_code=200, text='{}').json() == {}

    def test_response_with_nested_json(self):
        """Nested JSON passed via the json argument is returned with its structure intact."""
        innermost = {
            'data': ['item1', 'item2'],
            'metadata': {'count': 2, 'type': 'array'},
        }
        nested_json = {'level1': {'level2': {'level3': innermost}}}

        response = Response(status_code=200, json=nested_json)
        parsed = response.json()
        assert parsed == nested_json
        assert parsed['level1']['level2']['level3']['data'] == ['item1', 'item2']


class TestResponseIntegration:
    """End-to-end scenarios that combine several Response features."""

    def test_complete_response_workflow(self):
        """A fully populated successful response exposes all of its parts consistently."""
        payload = {
            'status': 'success',
            'data': {'id': 1, 'name': 'Test Item'},
            'timestamp': '2023-12-01T10:00:00Z',
        }

        response_headers = [
            HeaderEntry(name='Content-Type', value='application/json'),
            HeaderEntry(name='Content-Length', value='45'),
            HeaderEntry(name='Server', value='nginx/1.18.0'),
        ]

        sent_headers = [
            HeaderEntry(name='User-Agent', value='PyDoll/1.0'),
            HeaderEntry(name='Accept', value='application/json'),
            HeaderEntry(name='Authorization', value='Bearer token123'),
        ]

        jar = [
            CookieParam(name='session_id', value='sess_abc123'),
            CookieParam(name='preferences', value='theme=dark'),
        ]

        # The same payload is supplied as raw bytes, as text and as parsed JSON.
        response = Response(
            status_code=200,
            content=json.dumps(payload).encode('utf-8'),
            text=json.dumps(payload),
            json=payload,
            response_headers=response_headers,
            request_headers=sent_headers,
            cookies=jar,
            url='https://api.example.com/items/1',
        )

        assert response.ok is True
        assert response.status_code == 200
        assert response.json() == payload
        assert len(response.headers) == 3
        assert len(response.request_headers) == 3
        assert len(response.cookies) == 2

        # A 200 response must pass the status check without raising.
        response.raise_for_status()

    def test_error_response_workflow(self):
        """A 404 response still parses its JSON body but fails the status check."""
        error_payload = {
            'error': 'Not Found',
            'message': 'The requested resource was not found',
            'code': 404,
        }

        response = Response(
            status_code=404,
            text=json.dumps(error_payload),
            url='https://api.example.com/items/999',
        )

        assert response.ok is False
        assert response.status_code == 404
        assert response.json() == error_payload

        with pytest.raises(HTTPError):
            response.raise_for_status()

================================================
FILE: tests/test_browser/test_tab_request_integration.py
================================================
"""
Integration tests for Tab and Request classes.

This module tests the integration between the Tab class and the Request class,
focusing on the 'request' property and how they work together for HTTP requests.
"""

import pytest
import pytest_asyncio
import uuid
from unittest.mock import AsyncMock, MagicMock, patch

from pydoll.browser.tab import Tab
from pydoll.browser.requests.request import Request
from pydoll.browser.requests.response import Response
from pydoll.protocol.fetch.types import HeaderEntry
from pydoll.protocol.network.types import CookieParam


@pytest_asyncio.fixture
async def mock_connection_handler():
    """Yield a stand-in connection handler for Tab tests.

    The handler is the return value of an autospec'd patch of
    pydoll.connection.ConnectionHandler; the patch stays active until the
    fixture is torn down.
    """
    with patch('pydoll.connection.ConnectionHandler', autospec=True) as patched_class:
        fake_handler = patched_class.return_value

        # Replace the methods the tests await with AsyncMock instances.
        for coroutine_name in (
            'execute_command',
            'register_callback',
            'remove_callback',
            'clear_callbacks',
        ):
            setattr(fake_handler, coroutine_name, AsyncMock())

        # Plain data attributes start out empty.
        fake_handler.network_logs = []
        fake_handler.dialog = None
        yield fake_handler


@pytest_asyncio.fixture
async def mock_browser():
    """Provide a MagicMock browser whose close_tab attribute is an AsyncMock."""
    fake_browser = MagicMock()
    # close_tab is swapped for an AsyncMock so that it can be awaited.
    fake_browser.close_tab = AsyncMock()
    return fake_browser


@pytest_asyncio.fixture
async def tab(mock_browser, mock_connection_handler):
    """Yield a Tab wired to the mocked browser and connection handler.

    ConnectionHandler inside pydoll.browser.tab is patched to return the
    mocked handler for as long as the fixture is in use.
    """
    # A random suffix gives every test its own target id.
    target_id = f'test-target-{uuid.uuid4().hex[:8]}'

    with patch('pydoll.browser.tab.ConnectionHandler', return_value=mock_connection_handler):
        tab_instance = Tab(
            browser=mock_browser,
            connection_port=9222,
            target_id=target_id,
            browser_context_id='test-context-id',
        )

        # Start every event/interception flag in the disabled state.
        for flag_name in (
            '_network_events_enabled',
            '_page_events_enabled',
            '_dom_events_enabled',
            '_runtime_events_enabled',
            '_fetch_events_enabled',
            '_intercept_file_chooser_dialog_enabled',
        ):
            setattr(tab_instance, flag_name, False)

        yield tab_instance


@pytest.fixture
def cleanup_tab_registry():
    """No-op: singleton removed; keep fixture for compatibility.

    The fixture performs no setup or teardown; it only yields so that tests
    which still request it by name keep working. It is a synchronous
    generator, so it is registered with the plain pytest fixture decorator
    rather than the asyncio one.
    """
    yield


class TestTabRequestProperty:
    """Behaviour of the Tab.request property."""

    def test_request_property_lazy_initialization(self, tab):
        """The Request object is created on first access and reused afterwards."""
        # Before any access the backing attribute is unset.
        assert tab._request is None

        # The first read creates a Request and stores it on the tab.
        first_access = tab.request
        assert first_access is not None
        assert isinstance(first_access, Request)
        assert tab._request is first_access

        # A later read hands back the identical object.
        second_access = tab.request
        assert second_access is first_access

    def test_request_property_binds_to_tab(self, tab):
        """The Request object refers back to the Tab that created it."""
        bound_request = tab.request

        assert bound_request.tab is tab

    def test_request_property_type_annotation(self, tab):
        """The property value is an instance of Request."""
        assert isinstance(tab.request, Request)

    def test_multiple_tabs_have_separate_requests(self, mock_browser, mock_connection_handler):
        """Two distinct Tab objects each get their own Request object."""
        with patch('pydoll.browser.tab.ConnectionHandler', return_value=mock_connection_handler):
            first_tab = Tab(
                browser=mock_browser,
                connection_port=9222,
                target_id="test-target-1",
                browser_context_id='test-context-1',
            )

            second_tab = Tab(
                browser=mock_browser,
                connection_port=9222,
                target_id="test-target-2",
                browser_context_id='test-context-2',
            )

            first_request = first_tab.request
            second_request = second_tab.request

            # The objects differ and each one points at its own tab.
            assert first_request is not second_request
            assert first_request.tab is first_tab
            assert second_request.tab is second_tab


class TestTabRequestIntegration:
    """Test integration scenarios between Tab and Request.

    Each test swaps the Tab's event/callback/command methods for mocks and
    then drives the Request through its public HTTP helpers. The mock wiring
    and the fake command payload are shared through the private helpers below
    (their names lack the ``test`` prefix, so pytest does not collect them).
    """

    @staticmethod
    def _mock_tab_plumbing(tab):
        """Replace the Tab's network-event and callback methods with AsyncMocks.

        ``tab.on`` answers with the running number of recorded ``on`` calls, so
        successive registrations receive different integers (presumably used
        as callback ids by Request -- confirm against the implementation).
        """
        tab.enable_network_events = AsyncMock()
        tab.disable_network_events = AsyncMock()
        tab.on = AsyncMock(side_effect=lambda *a, **kw: len(tab.on.call_args_list))
        tab.remove_callback = AsyncMock()

    @staticmethod
    def _command_result(text='OK', content=None, json_body=None):
        """Build the nested payload returned by the mocked ``tab._execute_command``.

        Args:
            text: Value stored under ``'text'``.
            content: Value stored under ``'content'``; an empty list when omitted.
            json_body: Value stored under ``'json'``.

        Returns:
            A ``result -> result -> value`` dict with status 200 and the
            example.com URL.
        """
        return {
            'result': {
                'result': {
                    'value': {
                        'status': 200,
                        'content': [] if content is None else content,
                        'text': text,
                        'json': json_body,
                        'url': 'https://example.com'
                    }
                }
            }
        }

    @pytest.mark.asyncio
    async def test_request_uses_tab_network_events(self, tab):
        """Test that Request properly uses Tab's network event system."""
        request_instance = tab.request

        self._mock_tab_plumbing(tab)
        tab._execute_command = AsyncMock(
            return_value=self._command_result(
                text='Hello',
                content=[72, 101, 108, 108, 111],  # "Hello" as bytes
                json_body={'message': 'success'},
            )
        )

        # Stub the header/cookie extractors so no real event data is needed.
        with patch.object(
                 request_instance, '_extract_received_headers',
                 return_value=[HeaderEntry(name='Content-Type', value='application/json')]), \
             patch.object(
                 request_instance, '_extract_sent_headers',
                 return_value=[HeaderEntry(name='User-Agent', value='Test-Agent')]), \
             patch.object(
                 request_instance, '_extract_set_cookies',
                 return_value=[CookieParam(name='session', value='abc123')]):

            response = await request_instance.get('https://example.com')

            assert isinstance(response, Response)
            assert response.status_code == 200
            assert response.text == 'Hello'

            # The request must have gone through the Tab exactly once.
            tab._execute_command.assert_called_once()

    @pytest.mark.asyncio
    async def test_request_enables_network_events_when_needed(self, tab):
        """Test that Request enables network events on tab when not already enabled."""
        request_instance = tab.request

        tab._network_events_enabled = False
        self._mock_tab_plumbing(tab)
        tab._execute_command = AsyncMock(return_value=self._command_result())

        with patch.object(request_instance, '_extract_received_headers', return_value=[]), \
             patch.object(request_instance, '_extract_sent_headers', return_value=[]), \
             patch.object(request_instance, '_extract_set_cookies', return_value=[]):

            await request_instance.get('https://example.com')

            tab.enable_network_events.assert_called_once()
            assert tab.on.call_count == 4  # Four network events should be registered

    @pytest.mark.asyncio
    async def test_request_clears_callbacks_after_completion(self, tab):
        """Test that Request clears callbacks after request completion."""
        request_instance = tab.request

        tab._network_events_enabled = False
        self._mock_tab_plumbing(tab)
        tab._execute_command = AsyncMock(return_value=self._command_result())

        with patch.object(request_instance, '_extract_received_headers', return_value=[]), \
             patch.object(request_instance, '_extract_sent_headers', return_value=[]), \
             patch.object(request_instance, '_extract_set_cookies', return_value=[]):

            await request_instance.get('https://example.com')

            # One remove_callback call per registered callback (4 in total).
            assert tab.remove_callback.call_count == 4

    @pytest.mark.asyncio
    async def test_request_clears_callbacks_on_error(self, tab):
        """Test that Request clears callbacks even when request fails."""
        request_instance = tab.request

        tab._network_events_enabled = False
        self._mock_tab_plumbing(tab)

        # Make the underlying command fail.
        tab._execute_command = AsyncMock(side_effect=Exception("Network error"))

        with pytest.raises(Exception):  # Should raise HTTPError wrapping the original exception
            await request_instance.get('https://example.com')

        # Cleanup must still have happened despite the failure.
        assert tab.remove_callback.call_count == 4

    @pytest.mark.asyncio
    async def test_request_http_methods_integration(self, tab):
        """Test that all HTTP methods work through the Tab's request property."""
        request_instance = tab.request

        tab._network_events_enabled = False
        self._mock_tab_plumbing(tab)
        tab._execute_command = AsyncMock(return_value=self._command_result())

        with patch.object(request_instance, '_extract_received_headers', return_value=[]), \
             patch.object(request_instance, '_extract_sent_headers', return_value=[]), \
             patch.object(request_instance, '_extract_set_cookies', return_value=[]):

            methods_to_test = [
                ('get', lambda: request_instance.get('https://example.com')),
                ('post', lambda: request_instance.post('https://example.com', data={'key': 'value'})),
                ('put', lambda: request_instance.put('https://example.com', json={'update': True})),
                ('patch', lambda: request_instance.patch('https://example.com', json={'patch': True})),
                ('delete', lambda: request_instance.delete('https://example.com')),
                ('head', lambda: request_instance.head('https://example.com')),
                ('options', lambda: request_instance.options('https://example.com')),
            ]

            for method_name, method_call in methods_to_test:
                # Start every iteration with clean call counters.
                tab._execute_command.reset_mock()
                tab.remove_callback.reset_mock()

                response = await method_call()

                # The method name is attached so a failure names the verb.
                assert isinstance(response, Response), method_name
                assert response.status_code == 200, method_name

                tab._execute_command.assert_called_once()
                # Callbacks are removed individually (4 per request).
                assert tab.remove_callback.call_count == 4, method_name

    def test_request_property_singleton_behavior(self, tab):
        """Test that request property maintains singleton behavior per tab."""
        request1 = tab.request
        request2 = tab.request
        request3 = tab.request

        assert request1 is request2
        assert request2 is request3
        assert isinstance(request1, Request)

    @pytest.mark.asyncio
    async def test_tab_request_maintains_state(self, tab):
        """Test that Tab's request instance maintains its state across calls."""
        request_instance = tab.request

        # Put recognisable state on the instance.
        request_instance._network_events_enabled = True
        request_instance._requests_sent = ['mock_request']
        request_instance._requests_received = ['mock_response']

        same_request = tab.request

        # Same object, so the state set above must still be visible.
        assert same_request is request_instance
        assert same_request._network_events_enabled is True
        assert same_request._requests_sent == ['mock_request']
        assert same_request._requests_received == ['mock_response']


class TestTabRequestEdgeCases:
    """Corner cases for the ``Tab.request`` property."""

    def test_request_property_after_tab_reuse(self, mock_browser, mock_connection_handler):
        """Two Tabs built for one target id are distinct, and so are their Requests."""
        shared_target = "reusable-target-123"

        with patch('pydoll.browser.tab.ConnectionHandler', return_value=mock_connection_handler):
            original_tab = Tab(
                browser=mock_browser,
                connection_port=9222,
                target_id=shared_target,
                browser_context_id='test-context-reuse'
            )
            original_request = original_tab.request

            # Same target id again: Tab is not a singleton, so this is a new object.
            duplicate_tab = Tab(
                browser=mock_browser,
                connection_port=9222,
                target_id=shared_target,
                browser_context_id='test-context-reuse'
            )
            assert duplicate_tab is not original_tab

            # Requests are per-Tab, hence also distinct.
            duplicate_request = duplicate_tab.request
            assert duplicate_request is not original_request

    @pytest.mark.asyncio
    async def test_request_property_memory_efficiency(self, tab):
        """The Tab keeps its Request alive and hands the same one out again."""
        import weakref

        # Only a weak reference is kept locally; no strong local name survives.
        tracker = weakref.ref(tab.request)

        # Still reachable, because the Tab itself holds the instance.
        assert tracker() is not None

        # A later access resolves to that very same object.
        fetched_again = tab.request
        assert tracker() is fetched_again

    def test_request_property_with_different_tab_states(self, mock_browser, mock_connection_handler):
        """Every Tab in a group gets its own Request bound to itself."""
        configurations = [
            {'target_id': 'tab-1', 'browser_context_id': 'context-1'},
            {'target_id': 'tab-2', 'browser_context_id': 'context-2'},
            {'target_id': 'tab-3', 'browser_context_id': 'context-3'},
        ]

        pairs = []
        with patch('pydoll.browser.tab.ConnectionHandler', return_value=mock_connection_handler):
            for config in configurations:
                tab = Tab(
                    browser=mock_browser,
                    connection_port=9222,
                    **config
                )
                pairs.append((tab, tab.request))

        for position, (tab, request) in enumerate(pairs):
            assert isinstance(request, Request)
            assert request.tab is tab

            # Check against every other (tab, request) pair in the group.
            others = pairs[:position] + pairs[position + 1:]
            for other_tab, other_request in others:
                assert request is not other_request
                assert tab is not other_tab

================================================
FILE: tests/test_click_nested_integration.py
================================================
"""Integration tests for click() on nested elements (shadow DOM, iframes)."""

import asyncio
from pathlib import Path

import pytest

from pydoll.browser.chromium import Chrome
from pydoll.elements.web_element import WebElement

# file:// URL of the HTML fixture "pages/test_click_nested.html" that sits next to this test module.
TEST_PAGE = f'file://{(Path(__file__).parent / "pages" / "test_click_nested.html").absolute()}'


class TestClickRegularElement:
    """Baseline scenario: click() on an ordinary element of the page."""

    @pytest.mark.asyncio
    async def test_click_regular_button(self, ci_chrome_options):
        """One click takes the counter element's text from '0' to '1'."""
        async with Chrome(options=ci_chrome_options) as browser:
            tab = await browser.start()
            await tab.go_to(TEST_PAGE)
            await asyncio.sleep(0.5)

            button = await tab.find(id='regular-btn')
            count_label = await tab.find(id='regular-btn-count')

            assert await count_label.text == '0'

            await button.click()
            await asyncio.sleep(0.2)

            assert await count_label.text == '1'

    @pytest.mark.asyncio
    async def test_click_regular_button_multiple_times(self, ci_chrome_options):
        """Three consecutive clicks leave the counter element's text at '3'."""
        async with Chrome(options=ci_chrome_options) as browser:
            tab = await browser.start()
            await tab.go_to(TEST_PAGE)
            await asyncio.sleep(0.5)

            button = await tab.find(id='regular-btn')
            count_label = await tab.find(id='regular-btn-count')

            clicks_left = 3
            while clicks_left:
                await button.click()
                await asyncio.sleep(0.15)
                clicks_left -= 1

            assert await count_label.text == '3'


class TestClickInShadowRoot:
    """click() and text lookup for elements reached through a shadow root."""

    @pytest.mark.asyncio
    async def test_click_button_in_shadow_root(self, ci_chrome_options):
        """Clicking the shadow-root button takes its counter from '0' to '1'."""
        async with Chrome(options=ci_chrome_options) as browser:
            tab = await browser.start()
            await tab.go_to(TEST_PAGE)
            await asyncio.sleep(0.5)

            shadow_host = await tab.find(id='shadow-host')
            shadow_root = await shadow_host.get_shadow_root()

            button = await shadow_root.query('#shadow-btn')
            count_label = await shadow_root.query('#shadow-btn-count')

            assert await count_label.text == '0'

            await button.click()
            await asyncio.sleep(0.2)

            assert await count_label.text == '1'

    @pytest.mark.asyncio
    async def test_find_text_in_shadow_root(self, ci_chrome_options):
        """A query inside the shadow root yields a WebElement with the expected text."""
        async with Chrome(options=ci_chrome_options) as browser:
            tab = await browser.start()
            await tab.go_to(TEST_PAGE)
            await asyncio.sleep(0.5)

            shadow_host = await tab.find(id='shadow-host')
            shadow_root = await shadow_host.get_shadow_root()

            paragraph = await shadow_root.query('.shadow-text')
            assert isinstance(paragraph, WebElement)
            assert await paragraph.text == 'Content inside shadow root'


class TestClickInNestedShadowRoots:
    """click() and text lookup across two levels of shadow roots (outer open -> inner closed)."""

    @pytest.mark.asyncio
    async def test_click_button_in_nested_shadow(self, ci_chrome_options):
        """Clicking the button in the inner shadow root takes its counter from '0' to '1'."""
        async with Chrome(options=ci_chrome_options) as browser:
            tab = await browser.start()
            await tab.go_to(TEST_PAGE)
            await asyncio.sleep(0.5)

            # Walk down: page -> outer shadow root -> inner shadow root.
            outer_root = await (await tab.find(id='nested-shadow-host')).get_shadow_root()
            inner_root = await (await outer_root.query('#inner-shadow-host')).get_shadow_root()

            button = await inner_root.query('#deep-btn')
            count_label = await inner_root.query('#deep-btn-count')

            assert await count_label.text == '0'

            await button.click()
            await asyncio.sleep(0.2)

            assert await count_label.text == '1'

    @pytest.mark.asyncio
    async def test_find_text_in_nested_shadow(self, ci_chrome_options):
        """Text is readable from both the outer and the inner shadow root."""
        async with Chrome(options=ci_chrome_options) as browser:
            tab = await browser.start()
            await tab.go_to(TEST_PAGE)
            await asyncio.sleep(0.5)

            outer_root = await (await tab.find(id='nested-shadow-host')).get_shadow_root()

            outer_paragraph = await outer_root.query('.outer-text')
            assert 'Outer shadow content' == await outer_paragraph.text

            inner_root = await (await outer_root.query('#inner-shadow-host')).get_shadow_root()

            inner_paragraph = await inner_root.query('.inner-text')
            assert 'Inner shadow content' == await inner_paragraph.text


class TestClickInIframe:
    """click() on an element located through an iframe element."""

    @pytest.mark.asyncio
    async def test_click_button_in_iframe(self, ci_chrome_options):
        """Clicking the iframe's button takes its counter from '0' to '1'."""
        async with Chrome(options=ci_chrome_options) as browser:
            tab = await browser.start()
            await tab.go_to(TEST_PAGE)
            await asyncio.sleep(1)

            frame = await tab.find(id='test-iframe')
            assert frame.is_iframe

            # Lookups are issued on the iframe element, not on the tab.
            button = await frame.find(id='iframe-btn')
            count_label = await frame.find(id='iframe-btn-count')

            assert await count_label.text == '0'

            await button.click()
            await asyncio.sleep(0.3)

            assert await count_label.text == '1'


class TestClickInShadowRootInsideIframe:
    """click() and text lookup for a shadow root whose host lives in an iframe."""

    @pytest.mark.asyncio
    async def test_click_shadow_button_inside_iframe(self, ci_chrome_options):
        """Clicking the shadow button inside the iframe takes its counter from '0' to '1'."""
        async with Chrome(options=ci_chrome_options) as browser:
            tab = await browser.start()
            await tab.go_to(TEST_PAGE)
            await asyncio.sleep(1)

            # Walk down: page -> iframe -> shadow host -> shadow root.
            frame = await tab.find(id='test-iframe')
            host_in_frame = await frame.find(id='shadow-host-in-iframe')
            shadow_root = await host_in_frame.get_shadow_root()

            button = await shadow_root.query('#shadow-btn-in-iframe')
            count_label = await shadow_root.query('#shadow-btn-count')

            assert await count_label.text == '0'

            await button.click()
            await asyncio.sleep(0.3)

            assert await count_label.text == '1'

    @pytest.mark.asyncio
    async def test_find_text_in_shadow_inside_iframe(self, ci_chrome_options):
        """Text inside the iframe's shadow root can be read back."""
        async with Chrome(options=ci_chrome_options) as browser:
            tab = await browser.start()
            await tab.go_to(TEST_PAGE)
            await asyncio.sleep(1)

            frame = await tab.find(id='test-iframe')
            host_in_frame = await frame.find(id='shadow-host-in-iframe')
            shadow_root = await host_in_frame.get_shadow_root()

            paragraph = await shadow_root.query('.shadow-text')
            assert await paragraph.text == 'Shadow content inside iframe'


================================================
FILE: tests/test_commands/test_browser_commands.py
================================================
from pydoll.commands.browser_commands import BrowserCommands
from pydoll.protocol.browser.methods import BrowserMethod
from pydoll.protocol.browser.types import (
    WindowState, 
    PermissionType, 
    DownloadBehavior,
    BrowserCommandId,
    PermissionDescriptor,
    PermissionSetting,
    PrivacySandboxAPI
)


def test_get_version():
    """get_version builds a GET_VERSION command that carries no params."""
    cmd = BrowserCommands.get_version()

    assert cmd['method'] == BrowserMethod.GET_VERSION
    assert 'params' not in cmd


def test_reset_permissions_without_context():
    """reset_permissions with no arguments yields an empty params dict."""
    cmd = BrowserCommands.reset_permissions()

    assert cmd['method'] == BrowserMethod.RESET_PERMISSIONS
    assert cmd['params'] == {}


def test_reset_permissions_with_context():
    """reset_permissions forwards the browser context id as ``browserContextId``."""
    context_id = "test-context-123"
    cmd = BrowserCommands.reset_permissions(browser_context_id=context_id)

    assert cmd['method'] == BrowserMethod.RESET_PERMISSIONS
    assert cmd['params']['browserContextId'] == context_id


def test_cancel_download_minimal():
    """cancel_download with only a guid emits the guid and no context id."""
    download_guid = "download-guid-123"
    cmd = BrowserCommands.cancel_download(guid=download_guid)
    params = cmd['params']

    assert cmd['method'] == BrowserMethod.CANCEL_DOWNLOAD
    assert params['guid'] == download_guid
    assert 'browserContextId' not in params


def test_cancel_download_with_context():
    """cancel_download forwards both the guid and the browser context id."""
    download_guid = "download-guid-456"
    context_id = "test-context-456"
    cmd = BrowserCommands.cancel_download(guid=download_guid, browser_context_id=context_id)
    params = cmd['params']

    assert cmd['method'] == BrowserMethod.CANCEL_DOWNLOAD
    assert params['guid'] == download_guid
    assert params['browserContextId'] == context_id


def test_crash():
    """crash builds a CRASH command that carries no params."""
    cmd = BrowserCommands.crash()

    assert cmd['method'] == BrowserMethod.CRASH
    assert 'params' not in cmd


def test_crash_gpu_process():
    """crash_gpu_process builds a CRASH_GPU_PROCESS command that carries no params."""
    cmd = BrowserCommands.crash_gpu_process()

    assert cmd['method'] == BrowserMethod.CRASH_GPU_PROCESS
    assert 'params' not in cmd


def test_set_download_behavior_minimal():
    """Without path or context, only behavior and eventsEnabled are emitted."""
    chosen = DownloadBehavior.ALLOW
    cmd = BrowserCommands.set_download_behavior(
        behavior=chosen,
        events_enabled=True,
    )
    params = cmd['params']

    assert cmd['method'] == BrowserMethod.SET_DOWNLOAD_BEHAVIOR
    assert params['behavior'] == chosen
    assert params['eventsEnabled'] is True
    # The optional keys must be absent, not merely empty.
    assert 'downloadPath' not in params
    assert 'browserContextId' not in params


def test_set_download_behavior_with_path():
    """A supplied download path is forwarded as ``downloadPath``."""
    chosen = DownloadBehavior.ALLOW
    target_dir = "/path/to/downloads"
    cmd = BrowserCommands.set_download_behavior(
        behavior=chosen,
        download_path=target_dir,
        events_enabled=True,
    )
    params = cmd['params']

    assert cmd['method'] == BrowserMethod.SET_DOWNLOAD_BEHAVIOR
    assert params['behavior'] == chosen
    assert params['downloadPath'] == target_dir
    assert params['eventsEnabled'] is True


def test_set_download_behavior_full_params():
    """Test set_download_behavior with all parameters.

    Supplies behavior, download path, browser context id and an explicit
    ``events_enabled=False``, then checks that every one of them is reflected
    in the generated command's params.
    """
    behavior = DownloadBehavior.ALLOW_AND_NAME
    download_path = "/custom/download/path"
    browser_context_id = "context-789"
    events_enabled = False

    command = BrowserCommands.set_download_behavior(
        behavior=behavior,
        download_path=download_path,
        browser_context_id=browser_context_id,
        events_enabled=events_enabled
    )
    params = command['params']

    assert command['method'] == BrowserMethod.SET_DOWNLOAD_BEHAVIOR
    assert params['behavior'] == behavior
    assert params['downloadPath'] == download_path
    assert params['browserContextId'] == browser_context_id
    # The explicit False must be forwarded as-is rather than dropped.
    assert params['eventsEnabled'] is events_enabled


def test_set_download_behavior_default_behavior():
    """DownloadBehavior.DEFAULT is passed through unchanged."""
    chosen = DownloadBehavior.DEFAULT
    cmd = BrowserCommands.set_download_behavior(behavior=chosen)

    assert cmd['method'] == BrowserMethod.SET_DOWNLOAD_BEHAVIOR
    assert cmd['params']['behavior'] == chosen


def test_close():
    """close builds a CLOSE command that carries no params."""
    cmd = BrowserCommands.close()

    assert cmd['method'] == BrowserMethod.CLOSE
    assert 'params' not in cmd


def test_get_window_for_target():
    """get_window_for_target forwards the target id as ``targetId``."""
    wanted_target = "target-123"
    cmd = BrowserCommands.get_window_for_target(target_id=wanted_target)

    assert cmd['method'] == BrowserMethod.GET_WINDOW_FOR_TARGET
    assert cmd['params']['targetId'] == wanted_target


def test_set_window_bounds():
    """set_window_bounds forwards the window id and the full bounds dict."""
    win = 42
    geometry = {
        'width': 1920,
        'height': 1080,
        'x': 100,
        'y': 50,
        'windowState': WindowState.NORMAL
    }
    cmd = BrowserCommands.set_window_bounds(window_id=win, bounds=geometry)
    params = cmd['params']

    assert cmd['method'] == BrowserMethod.SET_WINDOW_BOUNDS
    assert params['windowId'] == win
    assert params['bounds'] == geometry


def test_set_window_bounds_minimal():
    """A bounds dict holding only ``windowState`` is forwarded as given."""
    win = 1
    geometry = {'windowState': WindowState.MAXIMIZED}
    cmd = BrowserCommands.set_window_bounds(window_id=win, bounds=geometry)
    params = cmd['params']

    assert cmd['method'] == BrowserMethod.SET_WINDOW_BOUNDS
    assert params['windowId'] == win
    assert params['bounds'] == geometry


def test_set_window_maximized():
    """set_window_maximized emits SET_WINDOW_BOUNDS with the MAXIMIZED state."""
    win = 5
    cmd = BrowserCommands.set_window_maximized(window_id=win)
    params = cmd['params']

    assert cmd['method'] == BrowserMethod.SET_WINDOW_BOUNDS
    assert params['windowId'] == win
    assert params['bounds']['windowState'] == WindowState.MAXIMIZED


def test_set_window_minimized():
    """set_window_minimized emits SET_WINDOW_BOUNDS with the MINIMIZED state."""
    win = 10
    cmd = BrowserCommands.set_window_minimized(window_id=win)
    params = cmd['params']

    assert cmd['method'] == BrowserMethod.SET_WINDOW_BOUNDS
    assert params['windowId'] == win
    assert params['bounds']['windowState'] == WindowState.MINIMIZED


def test_grant_permissions_minimal():
    """With only a permission list, origin and context id are left out."""
    requested = [PermissionType.GEOLOCATION, PermissionType.NOTIFICATIONS]
    cmd = BrowserCommands.grant_permissions(permissions=requested)
    params = cmd['params']

    assert cmd['method'] == BrowserMethod.GRANT_PERMISSIONS
    assert params['permissions'] == requested
    assert 'origin' not in params
    assert 'browserContextId' not in params


def test_grant_permissions_with_origin():
    """A supplied origin is forwarded; the context id stays absent."""
    requested = [PermissionType.DISPLAY_CAPTURE]
    site = "https://example.com"
    cmd = BrowserCommands.grant_permissions(permissions=requested, origin=site)
    params = cmd['params']

    assert cmd['method'] == BrowserMethod.GRANT_PERMISSIONS
    assert params['permissions'] == requested
    assert params['origin'] == site
    assert 'browserContextId' not in params


def test_grant_permissions_full_params():
    """Permissions, origin and browser context id are all forwarded."""
    requested = [PermissionType.MIDI, PermissionType.CLIPBOARD_READ_WRITE]
    site = "https://test.example.com"
    context_id = "context-permissions"

    cmd = BrowserCommands.grant_permissions(
        permissions=requested,
        origin=site,
        browser_context_id=context_id
    )
    params = cmd['params']

    assert cmd['method'] == BrowserMethod.GRANT_PERMISSIONS
    assert params['permissions'] == requested
    assert params['origin'] == site
    assert params['browserContextId'] == context_id


def test_grant_permissions_single_permission():
    """A one-element permission list is forwarded unchanged."""
    requested = [PermissionType.PAYMENT_HANDLER]
    cmd = BrowserCommands.grant_permissions(permissions=requested)

    assert cmd['method'] == BrowserMethod.GRANT_PERMISSIONS
    assert cmd['params']['permissions'] == requested


def test_grant_permissions_multiple_permissions():
    """A three-element permission list is forwarded unchanged."""
    requested = [
        PermissionType.GEOLOCATION,
        PermissionType.NOTIFICATIONS,
        PermissionType.MIDI
    ]
    cmd = BrowserCommands.grant_permissions(permissions=requested)

    assert cmd['method'] == BrowserMethod.GRANT_PERMISSIONS
    assert cmd['params']['permissions'] == requested


def test_grant_permissions_empty_list():
    """An empty permission list is forwarded unchanged."""
    requested = []
    cmd = BrowserCommands.grant_permissions(permissions=requested)

    assert cmd['method'] == BrowserMethod.GRANT_PERMISSIONS
    assert cmd['params']['permissions'] == requested


# Edge cases and additional coverage tests

def test_window_bounds_with_all_states():
    """NORMAL, MAXIMIZED and MINIMIZED each survive the trip through set_window_bounds."""
    win = 1

    # Same order as the three states are exercised individually elsewhere.
    for state in (WindowState.NORMAL, WindowState.MAXIMIZED, WindowState.MINIMIZED):
        cmd = BrowserCommands.set_window_bounds(win, {'windowState': state})
        assert cmd['params']['bounds']['windowState'] == state


def test_download_behaviors():
    """set_download_behavior echoes the ALLOW, ALLOW_AND_NAME and DEFAULT behaviors."""
    checked_behaviors = (
        DownloadBehavior.ALLOW,
        DownloadBehavior.ALLOW_AND_NAME,
        DownloadBehavior.DEFAULT,
    )

    # Each behavior is sent on its own and must come back verbatim in params.
    for expected in checked_behaviors:
        cmd = BrowserCommands.set_download_behavior(expected)
        assert cmd['params']['behavior'] == expected


def test_events_enabled_variations():
    """Both values of events_enabled are reflected in the set_download_behavior params."""
    behavior = DownloadBehavior.ALLOW

    # Explicitly enabled: the flag must be the boolean True.
    enabled_cmd = BrowserCommands.set_download_behavior(behavior, events_enabled=True)
    assert enabled_cmd['params']['eventsEnabled'] is True

    # Explicitly disabled: params hold exactly the behavior and a False flag.
    disabled_cmd = BrowserCommands.set_download_behavior(behavior, events_enabled=False)
    expected_params = {'behavior': behavior, 'eventsEnabled': False}
    assert disabled_cmd['params'] == expected_params


def test_various_permission_types():
    """grant_permissions accepts different groups of permission types positionally."""
    permission_groups = (
        # Web-related permissions
        [PermissionType.GEOLOCATION, PermissionType.NOTIFICATIONS],
        # Storage permissions
        [PermissionType.DURABLE_STORAGE, PermissionType.STORAGE_ACCESS],
    )

    for group in permission_groups:
        cmd = BrowserCommands.grant_permissions(group)
        assert cmd['params']['permissions'] == group


# Tests for new/missing methods

def test_get_browser_command_line():
    """get_browser_command_line builds a command with the right method and no params key."""
    cmd = BrowserCommands.get_browser_command_line()

    expected_method = BrowserMethod.GET_BROWSER_COMMAND_LINE
    assert cmd['method'] == expected_method
    assert 'params' not in cmd


def test_get_histograms_minimal():
    """Calling get_histograms without arguments produces an empty params dict."""
    cmd = BrowserCommands.get_histograms()

    expected_method = BrowserMethod.GET_HISTOGRAMS
    assert cmd['method'] == expected_method
    assert cmd['params'] == {}


def test_get_histograms_with_query():
    """Only the query is sent when get_histograms receives just a query."""
    search_text = "Memory"
    cmd = BrowserCommands.get_histograms(query=search_text)

    assert cmd['method'] == BrowserMethod.GET_HISTOGRAMS
    sent_params = cmd['params']
    assert sent_params['query'] == search_text
    assert 'delta' not in cmd['params']


def test_get_histograms_with_delta():
    """Only the delta flag is sent when get_histograms receives just delta=True."""
    cmd = BrowserCommands.get_histograms(delta=True)

    assert cmd['method'] == BrowserMethod.GET_HISTOGRAMS
    sent_params = cmd['params']
    assert sent_params['delta'] is True
    assert 'query' not in cmd['params']


def test_get_histograms_with_all_params():
    """Query and delta are both present when get_histograms receives both."""
    search_text, use_delta = "Network", True
    cmd = BrowserCommands.get_histograms(query=search_text, delta=use_delta)

    assert cmd['method'] == BrowserMethod.GET_HISTOGRAMS
    sent_params = cmd['params']
    assert sent_params['query'] == search_text
    assert sent_params['delta'] == use_delta


def test_get_histogram_minimal():
    """get_histogram with only a name sends the name and omits delta."""
    histogram_name = "Memory.Browser.TotalPMF"
    cmd = BrowserCommands.get_histogram(name=histogram_name)

    assert cmd['method'] == BrowserMethod.GET_HISTOGRAM
    sent_params = cmd['params']
    assert sent_params['name'] == histogram_name
    assert 'delta' not in cmd['params']


def test_get_histogram_with_delta():
    """get_histogram forwards both the histogram name and the delta flag."""
    histogram_name, use_delta = "PageLoad.Timing.NavigationStart", True
    cmd = BrowserCommands.get_histogram(name=histogram_name, delta=use_delta)

    assert cmd['method'] == BrowserMethod.GET_HISTOGRAM
    sent_params = cmd['params']
    assert sent_params['name'] == histogram_name
    assert sent_params['delta'] == use_delta


def test_get_window_bounds():
    """get_window_bounds places the window id under the 'windowId' key."""
    target_window = 42
    cmd = BrowserCommands.get_window_bounds(window_id=target_window)

    assert cmd['method'] == BrowserMethod.GET_WINDOW_BOUNDS
    sent_params = cmd['params']
    assert sent_params['windowId'] == target_window


def test_set_contents_size_with_width_only():
    """set_contents_size given only a width sends width and leaves height out."""
    target_window, new_width = 1, 1920
    cmd = BrowserCommands.set_contents_size(window_id=target_window, width=new_width)

    assert cmd['method'] == BrowserMethod.SET_CONTENTS_SIZE
    sent_params = cmd['params']
    assert sent_params['windowId'] == target_window
    assert sent_params['width'] == new_width
    assert 'height' not in cmd['params']


def test_set_contents_size_with_height_only():
    """set_contents_size given only a height sends height and leaves width out."""
    target_window, new_height = 2, 1080
    cmd = BrowserCommands.set_contents_size(window_id=target_window, height=new_height)

    assert cmd['method'] == BrowserMethod.SET_CONTENTS_SIZE
    sent_params = cmd['params']
    assert sent_params['windowId'] == target_window
    assert sent_params['height'] == new_height
    assert 'width' not in cmd['params']


def test_set_contents_size_with_both_dimensions():
    """set_contents_size forwards the window id, width and height together."""
    target_window, new_width, new_height = 3, 1600, 900
    cmd = BrowserCommands.set_contents_size(
        window_id=target_window, width=new_width, height=new_height
    )

    assert cmd['method'] == BrowserMethod.SET_CONTENTS_SIZE
    sent_params = cmd['params']
    assert sent_params['windowId'] == target_window
    assert sent_params['width'] == new_width
    assert sent_params['height'] == new_height


def test_set_dock_tile_minimal():
    """set_dock_tile called without arguments produces an empty params dict."""
    cmd = BrowserCommands.set_dock_tile()

    expected_method = BrowserMethod.SET_DOCK_TILE
    assert cmd['method'] == expected_method
    assert cmd['params'] == {}


def test_set_dock_tile_with_badge_label():
    """A badge label alone is sent as 'badgeLabel' with no 'image' entry."""
    label = "5"
    cmd = BrowserCommands.set_dock_tile(badge_label=label)

    assert cmd['method'] == BrowserMethod.SET_DOCK_TILE
    sent_params = cmd['params']
    assert sent_params['badgeLabel'] == label
    assert 'image' not in cmd['params']


def test_set_dock_tile_with_image():
    """An image alone is sent as 'image' with no 'badgeLabel' entry."""
    encoded_image = "iVBORw0KGgoAAAANSUhEUgAAAAEAAAABCAYAAAAfFcSJAAAADUlEQVR42mNkYPhfDwAChAGAz"
    cmd = BrowserCommands.set_dock_tile(image=encoded_image)

    assert cmd['method'] == BrowserMethod.SET_DOCK_TILE
    sent_params = cmd['params']
    assert sent_params['image'] == encoded_image
    assert 'badgeLabel' not in cmd['params']


def test_set_dock_tile_with_all_params():
    """Badge label and image are both forwarded when set_dock_tile receives both."""
    label, encoded_image = "3", "base64encodedimage"
    cmd = BrowserCommands.set_dock_tile(badge_label=label, image=encoded_image)

    assert cmd['method'] == BrowserMethod.SET_DOCK_TILE
    sent_params = cmd['params']
    assert sent_params['badgeLabel'] == label
    assert sent_params['image'] == encoded_image


def test_execute_browser_command():
    """execute_browser_command places the command id under the 'commandId' key."""
    requested_id = BrowserCommandId.OPEN_TAB_SEARCH
    cmd = BrowserCommands.execute_browser_command(command_id=requested_id)

    assert cmd['method'] == BrowserMethod.EXECUTE_BROWSER_COMMAND
    sent_params = cmd['params']
    assert sent_params['commandId'] == requested_id


def test_add_privacy_sandbox_enrollment_override():
    """add_privacy_sandbox_enrollment_override forwards the URL under the 'url' key."""
    site_url = "https://example.test"
    cmd = BrowserCommands.add_privacy_sandbox_enrollment_override(url=site_url)

    assert cmd['method'] == BrowserMethod.ADD_PRIVACY_SANDBOX_ENROLLMENT_OVERRIDE
    sent_params = cmd['params']
    assert sent_params['url'] == site_url


def test_add_privacy_sandbox_coordinator_key_config_minimal():
    """Without a browser context, only api, coordinatorOrigin and keyConfig are sent."""
    call_kwargs = {
        'api': PrivacySandboxAPI.BIDDING_AND_AUCTION_SERVICES,
        'coordinator_origin': "https://coordinator.test",
        'key_config': "test-key-config",
    }

    cmd = BrowserCommands.add_privacy_sandbox_coordinator_key_config(**call_kwargs)

    assert cmd['method'] == BrowserMethod.ADD_PRIVACY_SANDBOX_COORDINATOR_KEY_CONFIG
    sent_params = cmd['params']
    assert sent_params['api'] == call_kwargs['api']
    assert sent_params['coordinatorOrigin'] == call_kwargs['coordinator_origin']
    assert sent_params['keyConfig'] == call_kwargs['key_config']
    assert 'browserContextId' not in cmd['params']


def test_add_privacy_sandbox_coordinator_key_config_with_context():
    """A supplied browser context id is forwarded as 'browserContextId'."""
    call_kwargs = {
        'api': PrivacySandboxAPI.TRUSTED_KEY_VALUE,
        'coordinator_origin': "https://sandbox.test",
        'key_config': "config-data",
        'browser_context_id': "test-context",
    }

    cmd = BrowserCommands.add_privacy_sandbox_coordinator_key_config(**call_kwargs)

    assert cmd['method'] == BrowserMethod.ADD_PRIVACY_SANDBOX_COORDINATOR_KEY_CONFIG
    sent_params = cmd['params']
    assert sent_params['api'] == call_kwargs['api']
    assert sent_params['coordinatorOrigin'] == call_kwargs['coordinator_origin']
    assert sent_params['keyConfig'] == call_kwargs['key_config']
    assert sent_params['browserContextId'] == call_kwargs['browser_context_id']


def test_set_permission_minimal():
    """set_permission with only permission and setting omits origin and context id."""
    descriptor = PermissionDescriptor(name=PermissionType.GEOLOCATION)
    chosen_setting = PermissionSetting.GRANTED

    cmd = BrowserCommands.set_permission(permission=descriptor, setting=chosen_setting)

    assert cmd['method'] == BrowserMethod.SET_PERMISSION
    sent_params = cmd['params']
    assert sent_params['permission'] == descriptor
    assert sent_params['setting'] == chosen_setting
    # Neither optional key may appear when its argument was not supplied.
    for optional_key in ('origin', 'browserContextId'):
        assert optional_key not in cmd['params']


def test_set_permission_with_origin():
    """set_permission forwards an origin while still omitting the context id."""
    descriptor = PermissionDescriptor(name=PermissionType.NOTIFICATIONS)
    chosen_setting = PermissionSetting.DENIED
    site_origin = "https://example.com"

    cmd = BrowserCommands.set_permission(
        permission=descriptor, setting=chosen_setting, origin=site_origin
    )

    assert cmd['method'] == BrowserMethod.SET_PERMISSION
    sent_params = cmd['params']
    assert sent_params['permission'] == descriptor
    assert sent_params['setting'] == chosen_setting
    assert sent_params['origin'] == site_origin
    assert 'browserContextId' not in cmd['params']


def test_set_permission_with_all_params():
    """set_permission forwards permission, setting, origin and browser context id."""
    descriptor = PermissionDescriptor(name=PermissionType.MIDI)
    chosen_setting = PermissionSetting.PROMPT
    site_origin = "https://test.example.com"
    context_id = "permission-context"

    cmd = BrowserCommands.set_permission(
        permission=descriptor,
        setting=chosen_setting,
        origin=site_origin,
        browser_context_id=context_id,
    )

    assert cmd['method'] == BrowserMethod.SET_PERMISSION
    sent_params = cmd['params']
    assert sent_params['permission'] == descriptor
    assert sent_params['setting'] == chosen_setting
    assert sent_params['origin'] == site_origin
    assert sent_params['browserContextId'] == context_id


def test_set_window_fullscreen():
    """set_window_fullscreen emits SET_WINDOW_BOUNDS with a FULLSCREEN window state."""
    target_window = 7
    cmd = BrowserCommands.set_window_fullscreen(window_id=target_window)

    assert cmd['method'] == BrowserMethod.SET_WINDOW_BOUNDS
    sent_params = cmd['params']
    assert sent_params['windowId'] == target_window
    assert sent_params['bounds']['windowState'] == WindowState.FULLSCREEN


def test_set_window_normal():
    """set_window_normal emits SET_WINDOW_BOUNDS with a NORMAL window state."""
    target_window = 8
    cmd = BrowserCommands.set_window_normal(window_id=target_window)

    assert cmd['method'] == BrowserMethod.SET_WINDOW_BOUNDS
    sent_params = cmd['params']
    assert sent_params['windowId'] == target_window
    assert sent_params['bounds']['windowState'] == WindowState.NORMAL


# Additional edge case and integration tests

def test_all_window_state_helpers():
    """Every window-state helper emits SET_WINDOW_BOUNDS with its own window state."""
    window_id = 99

    # Build all four commands up front, each paired with the state it should carry.
    built = [
        (BrowserCommands.set_window_maximized(window_id), WindowState.MAXIMIZED),
        (BrowserCommands.set_window_minimized(window_id), WindowState.MINIMIZED),
        (BrowserCommands.set_window_fullscreen(window_id), WindowState.FULLSCREEN),
        (BrowserCommands.set_window_normal(window_id), WindowState.NORMAL),
    ]

    # Shared expectations: same CDP method and same window id for every helper.
    for cmd, _ in built:
        assert cmd['method'] == BrowserMethod.SET_WINDOW_BOUNDS
        assert cmd['params']['windowId'] == window_id

    # Helper-specific expectation: the window state.
    for cmd, expected_state in built:
        assert cmd['params']['bounds']['windowState'] == expected_state


def test_privacy_sandbox_apis():
    """The coordinator key config command echoes whichever API value it is given."""
    origin = "https://api.test"
    config = "test-config"
    apis_under_test = (
        PrivacySandboxAPI.BIDDING_AND_AUCTION_SERVICES,
        PrivacySandboxAPI.TRUSTED_KEY_VALUE,
    )

    for api_value in apis_under_test:
        cmd = BrowserCommands.add_privacy_sandbox_coordinator_key_config(
            api=api_value,
            coordinator_origin=origin,
            key_config=config,
        )
        assert cmd['params']['api'] == api_value


def test_permission_settings_variations():
    """set_permission echoes the GRANTED, DENIED and PROMPT settings."""
    descriptor = PermissionDescriptor(name=PermissionType.GEOLOCATION)
    settings_under_test = (
        PermissionSetting.GRANTED,
        PermissionSetting.DENIED,
        PermissionSetting.PROMPT,
    )

    for expected_setting in settings_under_test:
        cmd = BrowserCommands.set_permission(descriptor, expected_setting)
        assert cmd['params']['setting'] == expected_setting


def test_browser_command_ids():
    """execute_browser_command accepts a positional command id (OPEN_TAB_SEARCH)."""
    requested_id = BrowserCommandId.OPEN_TAB_SEARCH
    cmd = BrowserCommands.execute_browser_command(requested_id)
    sent_params = cmd['params']
    assert sent_params['commandId'] == BrowserCommandId.OPEN_TAB_SEARCH


================================================
FILE: tests/test_commands/test_dom_commands.py
================================================
from pydoll.commands.dom_commands import DomCommands
from pydoll.protocol.dom.methods import DomMethod
from pydoll.protocol.dom.types import IncludeWhitespace, LogicalAxes, PhysicalAxes, RelationType

class TestDomCommands:
    """Tests for the DomCommands class."""

    def test_describe_node_with_node_id(self):
        """describe_node maps node_id to the 'nodeId' parameter."""
        command = DomCommands.describe_node(node_id=123)

        assert command['method'] == DomMethod.DESCRIBE_NODE
        sent_params = command['params']
        assert sent_params['nodeId'] == 123

    def test_describe_node_with_backend_node_id(self):
        """describe_node maps backend_node_id to the 'backendNodeId' parameter."""
        command = DomCommands.describe_node(backend_node_id=456)

        assert command['method'] == DomMethod.DESCRIBE_NODE
        sent_params = command['params']
        assert sent_params['backendNodeId'] == 456

    def test_describe_node_with_object_id(self):
        """describe_node maps object_id to the 'objectId' parameter."""
        command = DomCommands.describe_node(object_id='obj123')

        assert command['method'] == DomMethod.DESCRIBE_NODE
        sent_params = command['params']
        assert sent_params['objectId'] == 'obj123'

    def test_describe_node_with_all_params(self):
        """describe_node forwards every identifier plus depth and pierce."""
        call_kwargs = dict(
            node_id=123,
            backend_node_id=456,
            object_id='obj123',
            depth=2,
            pierce=True,
        )
        command = DomCommands.describe_node(**call_kwargs)

        assert command['method'] == DomMethod.DESCRIBE_NODE
        sent_params = command['params']
        assert sent_params['nodeId'] == 123
        assert sent_params['backendNodeId'] == 456
        assert sent_params['objectId'] == 'obj123'
        assert sent_params['depth'] == 2
        assert sent_params['pierce'] is True

    def test_disable(self):
        """disable builds a DISABLE command that has no 'params' key."""
        command = DomCommands.disable()

        expected_method = DomMethod.DISABLE
        assert command['method'] == expected_method
        assert 'params' not in command

    def test_enable_without_params(self):
        """enable called without arguments still includes a 'params' key."""
        command = DomCommands.enable()

        expected_method = DomMethod.ENABLE
        assert command['method'] == expected_method
        assert 'params' in command

    def test_enable_with_include_whitespace(self):
        """enable maps include_whitespace to the 'includeWhitespace' parameter."""
        whitespace_mode = IncludeWhitespace.ALL
        command = DomCommands.enable(include_whitespace=IncludeWhitespace.ALL)

        assert command['method'] == DomMethod.ENABLE
        assert command['params']['includeWhitespace'] == whitespace_mode

    def test_focus_with_node_id(self):
        """focus maps node_id to the 'nodeId' parameter."""
        command = DomCommands.focus(node_id=123)

        assert command['method'] == DomMethod.FOCUS
        sent_params = command['params']
        assert sent_params['nodeId'] == 123

    def test_focus_with_backend_node_id(self):
        """focus maps backend_node_id to the 'backendNodeId' parameter."""
        command = DomCommands.focus(backend_node_id=456)

        assert command['method'] == DomMethod.FOCUS
        sent_params = command['params']
        assert sent_params['backendNodeId'] == 456

    def test_focus_with_object_id(self):
        """focus maps object_id to the 'objectId' parameter."""
        command = DomCommands.focus(object_id='obj123')

        assert command['method'] == DomMethod.FOCUS
        sent_params = command['params']
        assert sent_params['objectId'] == 'obj123'

    def test_get_attributes(self):
        """get_attributes maps node_id to the 'nodeId' parameter."""
        command = DomCommands.get_attributes(node_id=123)

        assert command['method'] == DomMethod.GET_ATTRIBUTES
        sent_params = command['params']
        assert sent_params['nodeId'] == 123

    def test_get_box_model_with_node_id(self):
        """get_box_model maps node_id to the 'nodeId' parameter."""
        command = DomCommands.get_box_model(node_id=123)

        assert command['method'] == DomMethod.GET_BOX_MODEL
        sent_params = command['params']
        assert sent_params['nodeId'] == 123

    def test_get_box_model_with_backend_node_id(self):
        """get_box_model maps backend_node_id to the 'backendNodeId' parameter."""
        command = DomCommands.get_box_model(backend_node_id=456)

        assert command['method'] == DomMethod.GET_BOX_MODEL
        sent_params = command['params']
        assert sent_params['backendNodeId'] == 456

    def test_get_box_model_with_object_id(self):
        """get_box_model maps object_id to the 'objectId' parameter."""
        command = DomCommands.get_box_model(object_id='obj123')

        assert command['method'] == DomMethod.GET_BOX_MODEL
        sent_params = command['params']
        assert sent_params['objectId'] == 'obj123'

    def test_get_document_without_params(self):
        """get_document called without arguments still includes a 'params' key."""
        command = DomCommands.get_document()

        expected_method = DomMethod.GET_DOCUMENT
        assert command['method'] == expected_method
        assert 'params' in command

    def test_get_document_with_depth(self):
        """get_document forwards depth under the 'depth' parameter."""
        command = DomCommands.get_document(depth=2)

        assert command['method'] == DomMethod.GET_DOCUMENT
        sent_params = command['params']
        assert sent_params['depth'] == 2

    def test_get_document_with_pierce(self):
        """get_document forwards pierce=True as the boolean True."""
        command = DomCommands.get_document(pierce=True)

        assert command['method'] == DomMethod.GET_DOCUMENT
        sent_params = command['params']
        assert sent_params['pierce'] is True

    def test_get_node_for_location(self):
        """get_node_for_location forwards the x and y coordinates."""
        command = DomCommands.get_node_for_location(x=100, y=200)

        assert command['method'] == DomMethod.GET_NODE_FOR_LOCATION
        sent_params = command['params']
        assert sent_params['x'] == 100
        assert sent_params['y'] == 200

    def test_get_node_for_location_with_optional_params(self):
        """get_node_for_location forwards both optional boolean flags alongside x and y."""
        call_kwargs = dict(
            x=100,
            y=200,
            include_user_agent_shadow_dom=True,
            ignore_pointer_events_none=False,
        )
        command = DomCommands.get_node_for_location(**call_kwargs)

        assert command['method'] == DomMethod.GET_NODE_FOR_LOCATION
        sent_params = command['params']
        assert sent_params['x'] == 100
        assert sent_params['y'] == 200
        assert sent_params['includeUserAgentShadowDOM'] is True
        assert sent_params['ignorePointerEventsNone'] is False

    def test_get_outer_html_with_node_id(self):
        """get_outer_html maps node_id to the 'nodeId' parameter."""
        command = DomCommands.get_outer_html(node_id=123)

        assert command['method'] == DomMethod.GET_OUTER_HTML
        sent_params = command['params']
        assert sent_params['nodeId'] == 123

    def test_get_outer_html_with_backend_node_id(self):
        """get_outer_html maps backend_node_id to the 'backendNodeId' parameter."""
        command = DomCommands.get_outer_html(backend_node_id=456)

        assert command['method'] == DomMethod.GET_OUTER_HTML
        sent_params = command['params']
        assert sent_params['backendNodeId'] == 456

    def test_get_outer_html_with_object_id(self):
        """get_outer_html maps object_id to the 'objectId' parameter."""
        command = DomCommands.get_outer_html(object_id='obj123')

        assert command['method'] == DomMethod.GET_OUTER_HTML
        sent_params = command['params']
        assert sent_params['objectId'] == 'obj123'

    def test_hide_highlight(self):
        """hide_highlight builds a HIDE_HIGHLIGHT command that has no 'params' key."""
        command = DomCommands.hide_highlight()

        expected_method = DomMethod.HIDE_HIGHLIGHT
        assert command['method'] == expected_method
        assert 'params' not in command

    def test_highlight_node(self):
        """highlight_node builds a HIGHLIGHT_NODE command that has no 'params' key."""
        command = DomCommands.highlight_node()

        expected_method = DomMethod.HIGHLIGHT_NODE
        assert command['method'] == expected_method
        assert 'params' not in command

    def test_highlight_rect(self):
        """highlight_rect builds a HIGHLIGHT_RECT command that has no 'params' key."""
        command = DomCommands.highlight_rect()

        expected_method = DomMethod.HIGHLIGHT_RECT
        assert command['method'] == expected_method
        assert 'params' not in command

    def test_move_to(self):
        """move_to forwards the source node id and the target node id."""
        command = DomCommands.move_to(node_id=123, target_node_id=456)

        assert command['method'] == DomMethod.MOVE_TO
        sent_params = command['params']
        assert sent_params['nodeId'] == 123
        assert sent_params['targetNodeId'] == 456

    def test_move_to_with_insert_before(self):
        """move_to maps insert_before_node_id to the 'insertBeforeNodeId' parameter."""
        call_kwargs = dict(node_id=123, target_node_id=456, insert_before_node_id=789)
        command = DomCommands.move_to(**call_kwargs)

        assert command['method'] == DomMethod.MOVE_TO
        sent_params = command['params']
        assert sent_params['nodeId'] == 123
        assert sent_params['targetNodeId'] == 456
        assert sent_params['insertBeforeNodeId'] == 789

    def test_query_selector(self):
        """query_selector forwards the node id and the selector string."""
        css = '.test-class'
        command = DomCommands.query_selector(node_id=123, selector=css)

        assert command['method'] == DomMethod.QUERY_SELECTOR
        sent_params = command['params']
        assert sent_params['nodeId'] == 123
        assert sent_params['selector'] == '.test-class'

    def test_query_selector_all(self):
        """query_selector_all forwards the node id and the selector string."""
        css = 'div'
        command = DomCommands.query_selector_all(node_id=123, selector=css)

        assert command['method'] == DomMethod.QUERY_SELECTOR_ALL
        sent_params = command['params']
        assert sent_params['nodeId'] == 123
        assert sent_params['selector'] == 'div'

    def test_remove_attribute(self):
        """remove_attribute forwards the node id and the attribute name."""
        command = DomCommands.remove_attribute(node_id=123, name='class')

        assert command['method'] == DomMethod.REMOVE_ATTRIBUTE
        sent_params = command['params']
        assert sent_params['nodeId'] == 123
        assert sent_params['name'] == 'class'

    def test_remove_node(self):
        """remove_node maps node_id to the 'nodeId' parameter."""
        command = DomCommands.remove_node(node_id=123)

        assert command['method'] == DomMethod.REMOVE_NODE
        sent_params = command['params']
        assert sent_params['nodeId'] == 123

    def test_request_child_nodes(self):
        """request_child_nodes maps node_id to the 'nodeId' parameter."""
        command = DomCommands.request_child_nodes(node_id=123)

        assert command['method'] == DomMethod.REQUEST_CHILD_NODES
        sent_params = command['params']
        assert sent_params['nodeId'] == 123

    def test_request_child_nodes_with_depth(self):
        """request_child_nodes forwards depth alongside the node id."""
        command = DomCommands.request_child_nodes(node_id=123, depth=2)

        assert command['method'] == DomMethod.REQUEST_CHILD_NODES
        sent_params = command['params']
        assert sent_params['nodeId'] == 123
        assert sent_params['depth'] == 2

    def test_request_child_nodes_with_pierce(self):
        """request_child_nodes forwards pierce=True as the boolean True."""
        command = DomCommands.request_child_nodes(node_id=123, pierce=True)

        assert command['method'] == DomMethod.REQUEST_CHILD_NODES
        sent_params = command['params']
        assert sent_params['nodeId'] == 123
        assert sent_params['pierce'] is True

    def test_request_node(self):
        """request_node maps object_id to the 'objectId' parameter."""
        command = DomCommands.request_node(object_id='obj123')

        assert command['method'] == DomMethod.REQUEST_NODE
        sent_params = command['params']
        assert sent_params['objectId'] == 'obj123'

    def test_resolve_node_with_node_id(self):
        """resolve_node maps node_id to the 'nodeId' parameter."""
        command = DomCommands.resolve_node(node_id=123)

        assert command['method'] == DomMethod.RESOLVE_NODE
        sent_params = command['params']
        assert sent_params['nodeId'] == 123

    def test_resolve_node_with_backend_node_id(self):
        """resolve_node maps backend_node_id to the 'backendNodeId' parameter."""
        command = DomCommands.resolve_node(backend_node_id=456)

        assert command['method'] == DomMethod.RESOLVE_NODE
        sent_params = command['params']
        assert sent_params['backendNodeId'] == 456

    def test_resolve_node_with_all_params(self):
        """resolve_node forwards node ids, object group and execution context id."""
        call_kwargs = dict(
            node_id=123,
            backend_node_id=456,
            object_group='test-group',
            execution_context_id=789,
        )
        command = DomCommands.resolve_node(**call_kwargs)

        assert command['method'] == DomMethod.RESOLVE_NODE
        sent_params = command['params']
        assert sent_params['nodeId'] == 123
        assert sent_params['backendNodeId'] == 456
        assert sent_params['objectGroup'] == 'test-group'
        assert sent_params['executionContextId'] == 789

    def test_scroll_into_view_if_needed_with_node_id(self):
        """scroll_into_view_if_needed maps node_id to the 'nodeId' parameter."""
        command = DomCommands.scroll_into_view_if_needed(node_id=123)

        assert command['method'] == DomMethod.SCROLL_INTO_VIEW_IF_NEEDED
        sent_params = command['params']
        assert sent_params['nodeId'] == 123

    def test_scroll_into_view_if_needed_with_backend_node_id(self):
        """scroll_into_view_if_needed maps backend_node_id to 'backendNodeId'."""
        command = DomCommands.scroll_into_view_if_needed(backend_node_id=456)

        assert command['method'] == DomMethod.SCROLL_INTO_VIEW_IF_NEEDED
        sent_params = command['params']
        assert sent_params['backendNodeId'] == 456

    def test_scroll_into_view_if_needed_with_object_id(self):
        """scroll_into_view_if_needed maps object_id to the 'objectId' parameter."""
        command = DomCommands.scroll_into_view_if_needed(object_id='obj123')

        assert command['method'] == DomMethod.SCROLL_INTO_VIEW_IF_NEEDED
        sent_params = command['params']
        assert sent_params['objectId'] == 'obj123'

    def test_set_attributes_as_text(self):
        """set_attributes_as_text forwards the node id and the attribute text."""
        attribute_text = 'class="test"'
        command = DomCommands.set_attributes_as_text(node_id=123, text=attribute_text)

        assert command['method'] == DomMethod.SET_ATTRIBUTES_AS_TEXT
        sent_params = command['params']
        assert sent_params['nodeId'] == 123
        assert sent_params['text'] == 'class="test"'

    def test_set_attributes_as_text_with_name(self):
        """set_attributes_as_text forwards an optional name next to node id and text."""
        call_kwargs = dict(node_id=123, text='test-value', name='class')
        command = DomCommands.set_attributes_as_text(**call_kwargs)

        assert command['method'] == DomMethod.SET_ATTRIBUTES_AS_TEXT
        sent_params = command['params']
        assert sent_params['nodeId'] == 123
        assert sent_params['text'] == 'test-value'
        assert sent_params['name'] == 'class'

    def test_set_attribute_value(self):
        """set_attribute_value forwards the node id, attribute name and value."""
        call_kwargs = dict(node_id=123, name='class', value='test-class')
        command = DomCommands.set_attribute_value(**call_kwargs)

        assert command['method'] == DomMethod.SET_ATTRIBUTE_VALUE
        sent_params = command['params']
        assert sent_params['nodeId'] == 123
        assert sent_params['name'] == 'class'
        assert sent_params['value'] == 'test-class'

    def test_set_file_input_files_with_node_id(self):
        """set_file_input_files forwards the file list and maps node_id to 'nodeId'."""
        file_paths = ['/path/to/file1.txt', '/path/to/file2.txt']
        command = DomCommands.set_file_input_files(files=file_paths, node_id=123)

        assert command['method'] == DomMethod.SET_FILE_INPUT_FILES
        sent_params = command['params']
        assert sent_params['files'] == file_paths
        assert sent_params['nodeId'] == 123

    def test_set_file_input_files_with_backend_node_id(self):
        """set_file_input_files maps backend_node_id to 'backendNodeId'."""
        file_paths = ['/path/to/file.txt']
        command = DomCommands.set_file_input_files(files=file_paths, backend_node_id=456)

        assert command['method'] == DomMethod.SET_FILE_INPUT_FILES
        sent_params = command['params']
        assert sent_params['files'] == file_paths
        assert sent_params['backendNodeId'] == 456

    def test_set_file_input_files_with_object_id(self):
        """set_file_input_files maps object_id to the 'objectId' parameter."""
        file_paths = ['/path/to/file.txt']
        command = DomCommands.set_file_input_files(files=file_paths, object_id='obj123')

        assert command['method'] == DomMethod.SET_FILE_INPUT_FILES
        sent_params = command['params']
        assert sent_params['files'] == file_paths
        assert sent_params['objectId'] == 'obj123'

    def test_set_node_name(self):
        """set_node_name forwards the node id and the new name."""
        command = DomCommands.set_node_name(node_id=123, name='div')

        assert command['method'] == DomMethod.SET_NODE_NAME
        sent_params = command['params']
        assert sent_params['nodeId'] == 123
        assert sent_params['name'] == 'div'

    def test_set_node_value(self):
        """set_node_value forwards the node id and the new value."""
        command = DomCommands.set_node_value(node_id=123, value='test text')

        assert command['method'] == DomMethod.SET_NODE_VALUE
        sent_params = command['params']
        assert sent_params['nodeId'] == 123
        assert sent_params['value'] == 'test text'

    def test_set_outer_html(self):
        """set_outer_html maps outer_html to the 'outerHTML' parameter."""
        markup = '<div class="test">content</div>'
        command = DomCommands.set_outer_html(node_id=123, outer_html=markup)

        assert command['method'] == DomMethod.SET_OUTER_HTML
        sent_params = command['params']
        assert sent_params['nodeId'] == 123
        assert sent_params['outerHTML'] == markup

    def test_collect_class_names_from_subtree(self):
        """Check the method and nodeId produced by collect_class_names_from_subtree."""
        command = DomCommands.collect_class_names_from_subtree(node_id=123)

        assert command['method'] == DomMethod.COLLECT_CLASS_NAMES_FROM_SUBTREE
        assert command['params']['nodeId'] == 123

    def test_copy_to(self):
        """Check copy_to with only the source and target node ids."""
        command = DomCommands.copy_to(node_id=123, target_node_id=456)

        assert command['method'] == DomMethod.COPY_TO
        params = command['params']
        assert params['nodeId'] == 123
        assert params['targetNodeId'] == 456

    def test_copy_to_with_insert_before(self):
        """Check that copy_to also emits insertBeforeNodeId when it is supplied."""
        command = DomCommands.copy_to(node_id=123, target_node_id=456, insert_before_node_id=789)

        assert command['method'] == DomMethod.COPY_TO
        params = command['params']
        assert params['nodeId'] == 123
        assert params['targetNodeId'] == 456
        assert params['insertBeforeNodeId'] == 789

    def test_discard_search_results(self):
        """Check the method and searchId produced by discard_search_results."""
        command = DomCommands.discard_search_results(search_id='search123')

        assert command['method'] == DomMethod.DISCARD_SEARCH_RESULTS
        assert command['params']['searchId'] == 'search123'

    def test_get_anchor_element(self):
        """Check get_anchor_element when only node_id is given."""
        command = DomCommands.get_anchor_element(node_id=123)

        assert command['method'] == DomMethod.GET_ANCHOR_ELEMENT
        assert command['params']['nodeId'] == 123

    def test_get_anchor_element_with_specifier(self):
        """Check that get_anchor_element emits anchorSpecifier when it is supplied."""
        command = DomCommands.get_anchor_element(node_id=123, anchor_specifier='href')

        assert command['method'] == DomMethod.GET_ANCHOR_ELEMENT
        params = command['params']
        assert params['nodeId'] == 123
        assert params['anchorSpecifier'] == 'href'

    def test_get_container_for_node(self):
        """Check get_container_for_node when only node_id is given."""
        command = DomCommands.get_container_for_node(node_id=123)

        assert command['method'] == DomMethod.GET_CONTAINER_FOR_NODE
        assert command['params']['nodeId'] == 123

    def test_get_container_for_node_with_all_params(self):
        """Check get_container_for_node when every optional argument is supplied."""
        call_kwargs = {
            'node_id': 123,
            'container_name': 'scrollable',
            'physical_axes': PhysicalAxes.HORIZONTAL,
            'logical_axes': LogicalAxes.INLINE,
            'queries_scroll_state': True,
        }
        command = DomCommands.get_container_for_node(**call_kwargs)

        assert command['method'] == DomMethod.GET_CONTAINER_FOR_NODE
        params = command['params']
        assert params['nodeId'] == 123
        assert params['containerName'] == 'scrollable'
        assert params['physicalAxes'] == PhysicalAxes.HORIZONTAL
        assert params['logicalAxes'] == LogicalAxes.INLINE
        assert params['queriesScrollState'] is True

    def test_get_content_quads_with_node_id(self):
        """Check get_content_quads when the node is given by node_id."""
        command = DomCommands.get_content_quads(node_id=123)

        assert command['method'] == DomMethod.GET_CONTENT_QUADS
        assert command['params']['nodeId'] == 123

    def test_get_content_quads_with_backend_node_id(self):
        """Check get_content_quads when the node is given by backend_node_id."""
        command = DomCommands.get_content_quads(backend_node_id=456)

        assert command['method'] == DomMethod.GET_CONTENT_QUADS
        assert command['params']['backendNodeId'] == 456

    def test_get_content_quads_with_object_id(self):
        """Check get_content_quads when the node is given by object_id."""
        command = DomCommands.get_content_quads(object_id='obj123')

        assert command['method'] == DomMethod.GET_CONTENT_QUADS
        assert command['params']['objectId'] == 'obj123'

    def test_get_detached_dom_nodes(self):
        """Check that get_detached_dom_nodes emits its method and no params entry."""
        command = DomCommands.get_detached_dom_nodes()

        assert command['method'] == DomMethod.GET_DETACHED_DOM_NODES
        assert 'params' not in command

    def test_get_element_by_relation(self):
        """Check the nodeId and relation produced by get_element_by_relation."""
        wanted_relation = RelationType.INTEREST_TARGET
        command = DomCommands.get_element_by_relation(node_id=123, relation=wanted_relation)

        assert command['method'] == DomMethod.GET_ELEMENT_BY_RELATION
        params = command['params']
        assert params['nodeId'] == 123
        assert params['relation'] == RelationType.INTEREST_TARGET

    def test_get_file_info(self):
        """Check the method and objectId produced by get_file_info."""
        command = DomCommands.get_file_info(object_id='file123')

        assert command['method'] == DomMethod.GET_FILE_INFO
        assert command['params']['objectId'] == 'file123'

    def test_get_frame_owner(self):
        """Check the method and frameId produced by get_frame_owner."""
        command = DomCommands.get_frame_owner(frame_id='frame123')

        assert command['method'] == DomMethod.GET_FRAME_OWNER
        assert command['params']['frameId'] == 'frame123'

    def test_get_nodes_for_subtree_by_style(self):
        """Check that get_nodes_for_subtree_by_style emits nodeId and computedStyles."""
        style_filters = [{'name': 'color', 'value': 'red'}]
        command = DomCommands.get_nodes_for_subtree_by_style(
            node_id=123,
            computed_styles=style_filters,
        )

        assert command['method'] == DomMethod.GET_NODES_FOR_SUBTREE_BY_STYLE
        params = command['params']
        assert params['nodeId'] == 123
        assert params['computedStyles'] == style_filters

    def test_get_nodes_for_subtree_by_style_with_pierce(self):
        """Check that get_nodes_for_subtree_by_style emits pierce when it is supplied."""
        style_filters = [{'name': 'display', 'value': 'block'}]
        command = DomCommands.get_nodes_for_subtree_by_style(
            node_id=123,
            computed_styles=style_filters,
            pierce=True,
        )

        assert command['method'] == DomMethod.GET_NODES_FOR_SUBTREE_BY_STYLE
        params = command['params']
        assert params['nodeId'] == 123
        assert params['computedStyles'] == style_filters
        assert params['pierce'] is True

    def test_get_node_stack_traces(self):
        """Check the method and nodeId produced by get_node_stack_traces."""
        command = DomCommands.get_node_stack_traces(node_id=123)

        assert command['method'] == DomMethod.GET_NODE_STACK_TRACES
        assert command['params']['nodeId'] == 123

    def test_get_querying_descendants_for_container(self):
        """Check the method and nodeId produced by get_querying_descendants_for_container."""
        command = DomCommands.get_querying_descendants_for_container(node_id=123)

        assert command['method'] == DomMethod.GET_QUERYING_DESCENDANTS_FOR_CONTAINER
        assert command['params']['nodeId'] == 123

    def test_get_relayout_boundary(self):
        """Check the method and nodeId produced by get_relayout_boundary."""
        command = DomCommands.get_relayout_boundary(node_id=123)

        assert command['method'] == DomMethod.GET_RELAYOUT_BOUNDARY
        assert command['params']['nodeId'] == 123

    def test_get_search_results(self):
        """Check that get_search_results emits the search id and the index range."""
        command = DomCommands.get_search_results(search_id='search123', from_index=0, to_index=10)

        assert command['method'] == DomMethod.GET_SEARCH_RESULTS
        params = command['params']
        assert params['searchId'] == 'search123'
        assert params['fromIndex'] == 0
        assert params['toIndex'] == 10

    def test_get_top_layer_elements(self):
        """Check that get_top_layer_elements emits its method and no params entry."""
        command = DomCommands.get_top_layer_elements()

        assert command['method'] == DomMethod.GET_TOP_LAYER_ELEMENTS
        assert 'params' not in command

    def test_mark_undoable_state(self):
        """Check that mark_undoable_state emits its method and no params entry."""
        command = DomCommands.mark_undoable_state()

        assert command['method'] == DomMethod.MARK_UNDOABLE_STATE
        assert 'params' not in command

    def test_perform_search(self):
        """Check perform_search when only the query is given."""
        command = DomCommands.perform_search(query='test')

        assert command['method'] == DomMethod.PERFORM_SEARCH
        assert command['params']['query'] == 'test'

    def test_perform_search_with_shadow_dom(self):
        """Check that perform_search emits includeUserAgentShadowDOM when it is supplied."""
        command = DomCommands.perform_search(query='test', include_user_agent_shadow_dom=True)

        assert command['method'] == DomMethod.PERFORM_SEARCH
        params = command['params']
        assert params['query'] == 'test'
        assert params['includeUserAgentShadowDOM'] is True

    def test_push_node_by_path_to_frontend(self):
        """Check the method and path produced by push_node_by_path_to_frontend."""
        command = DomCommands.push_node_by_path_to_frontend(path='1,2,3')

        assert command['method'] == DomMethod.PUSH_NODE_BY_PATH_TO_FRONTEND
        assert command['params']['path'] == '1,2,3'

    def test_push_nodes_by_backend_ids_to_frontend(self):
        """Check that push_nodes_by_backend_ids_to_frontend emits the id list as backendNodeIds."""
        node_ids = [123, 456, 789]
        command = DomCommands.push_nodes_by_backend_ids_to_frontend(backend_node_ids=node_ids)

        assert command['method'] == DomMethod.PUSH_NODES_BY_BACKEND_IDS_TO_FRONTEND
        assert command['params']['backendNodeIds'] == node_ids

    def test_redo(self):
        """Check that redo emits its method and no params entry."""
        command = DomCommands.redo()

        assert command['method'] == DomMethod.REDO
        assert 'params' not in command

    def test_set_inspected_node(self):
        """Check the method and nodeId produced by set_inspected_node."""
        command = DomCommands.set_inspected_node(node_id=123)

        assert command['method'] == DomMethod.SET_INSPECTED_NODE
        assert command['params']['nodeId'] == 123

    def test_set_node_stack_traces_enabled(self):
        """Check the method and enable flag produced by set_node_stack_traces_enabled."""
        command = DomCommands.set_node_stack_traces_enabled(enable=True)

        assert command['method'] == DomMethod.SET_NODE_STACK_TRACES_ENABLED
        assert command['params']['enable'] is True

    def test_undo(self):
        """Check that undo emits its method and no params entry."""
        command = DomCommands.undo()

        assert command['method'] == DomMethod.UNDO
        assert 'params' not in command


================================================
FILE: tests/test_commands/test_emulation_commands.py
================================================
"""
Tests for EmulationCommands class.

This module contains tests for all EmulationCommands methods,
verifying that they generate the correct CDP commands with proper parameters.
"""

from pydoll.commands.emulation_commands import EmulationCommands
from pydoll.protocol.emulation.methods import EmulationMethod
from pydoll.protocol.emulation.types import UserAgentBrandVersion, UserAgentMetadata


def test_set_user_agent_override_minimal():
    """Check that only userAgent is emitted when no optional argument is passed."""
    command = EmulationCommands.set_user_agent_override(user_agent='Test/1.0')

    assert command['method'] == EmulationMethod.SET_USER_AGENT_OVERRIDE
    params = command['params']
    assert params['userAgent'] == 'Test/1.0'
    # None of the optional keys may leak into the payload.
    for optional_key in ('acceptLanguage', 'platform', 'userAgentMetadata'):
        assert optional_key not in params


def test_set_user_agent_override_with_accept_language():
    """Check that accept_language is emitted under the acceptLanguage key."""
    languages = 'en-US,en;q=0.9'
    command = EmulationCommands.set_user_agent_override(
        user_agent='Test/1.0', accept_language=languages
    )

    params = command['params']
    assert params['userAgent'] == 'Test/1.0'
    assert params['acceptLanguage'] == languages


def test_set_user_agent_override_with_platform():
    """Check that platform is emitted alongside userAgent."""
    command = EmulationCommands.set_user_agent_override(user_agent='Test/1.0', platform='Win32')

    params = command['params']
    assert params['userAgent'] == 'Test/1.0'
    assert params['platform'] == 'Win32'


def test_set_user_agent_override_with_metadata():
    """Check that a full userAgentMetadata value is carried into the command params."""
    major_brands = [
        UserAgentBrandVersion(brand='Not/A)Brand', version='20'),
        UserAgentBrandVersion(brand='Chromium', version='120'),
        UserAgentBrandVersion(brand='Google Chrome', version='120'),
    ]
    full_brands = [
        UserAgentBrandVersion(brand='Not/A)Brand', version='20.0.0.0'),
        UserAgentBrandVersion(brand='Chromium', version='120.0.6099.109'),
        UserAgentBrandVersion(brand='Google Chrome', version='120.0.6099.109'),
    ]
    ua_metadata = UserAgentMetadata(
        platform='Windows',
        platformVersion='15.0.0',
        architecture='x86',
        model='',
        mobile=False,
        brands=major_brands,
        fullVersionList=full_brands,
        bitness='64',
        wow64=False,
    )
    ua_string = 'Mozilla/5.0 Chrome/120.0.6099.109'

    command = EmulationCommands.set_user_agent_override(
        user_agent=ua_string,
        platform='Win32',
        user_agent_metadata=ua_metadata,
    )

    assert command['method'] == EmulationMethod.SET_USER_AGENT_OVERRIDE
    params = command['params']
    assert params['userAgent'] == ua_string
    assert params['platform'] == 'Win32'
    assert params['userAgentMetadata']['platform'] == 'Windows'
    assert params['userAgentMetadata']['mobile'] is False
    assert len(params['userAgentMetadata']['brands']) == 3
    assert params['userAgentMetadata']['brands'][1]['brand'] == 'Chromium'


def test_set_user_agent_override_with_all_params():
    """Check set_user_agent_override when every argument is supplied at once."""
    ua_metadata = UserAgentMetadata(
        platform='Android',
        platformVersion='14.0.0',
        architecture='arm',
        model='Pixel 7',
        mobile=True,
        bitness='64',
        wow64=False,
    )
    ua_string = 'Mozilla/5.0 (Linux; Android 14)'
    languages = 'pt-BR,pt;q=0.9'
    platform_name = 'Linux armv81'

    command = EmulationCommands.set_user_agent_override(
        user_agent=ua_string,
        accept_language=languages,
        platform=platform_name,
        user_agent_metadata=ua_metadata,
    )

    params = command['params']
    assert params['userAgent'] == ua_string
    assert params['acceptLanguage'] == languages
    assert params['platform'] == platform_name
    assert params['userAgentMetadata']['mobile'] is True
    assert params['userAgentMetadata']['model'] == 'Pixel 7'


def test_set_user_agent_override_none_params_excluded():
    """Check that optional arguments passed explicitly as None are left out of params."""
    command = EmulationCommands.set_user_agent_override(
        user_agent='Test/1.0',
        accept_language=None,
        platform=None,
        user_agent_metadata=None,
    )

    params = command['params']
    for omitted_key in ('acceptLanguage', 'platform', 'userAgentMetadata'):
        assert omitted_key not in params


================================================
FILE: tests/test_commands/test_fetch_commands.py
================================================
import pytest
from pydoll.commands.fetch_commands import FetchCommands
from pydoll.protocol.fetch.types import AuthChallengeResponseType, RequestStage
from pydoll.protocol.network.types import RequestMethod, ErrorReason, ResourceType
from pydoll.protocol.fetch.methods import FetchMethod


class TestFetchCommands:
    """Checks on the command dictionaries built by FetchCommands.

    Each test calls one FetchCommands builder and inspects the returned
    'method' and 'params' entries.
    """

    # ------------------------------------------------------------------
    # continue_request
    # ------------------------------------------------------------------

    def test_continue_request_minimal(self):
        """continue_request with nothing but the request id."""
        req_id = 'req123'
        command = FetchCommands.continue_request(request_id=req_id)

        assert command['method'] == FetchMethod.CONTINUE_REQUEST
        assert command['params']['requestId'] == req_id

    def test_continue_request_with_url(self):
        """continue_request emits the url override."""
        req_id = 'req123'
        target_url = 'https://example.com'
        command = FetchCommands.continue_request(request_id=req_id, url=target_url)

        assert command['method'] == FetchMethod.CONTINUE_REQUEST
        params = command['params']
        assert params['requestId'] == req_id
        assert params['url'] == target_url

    def test_continue_request_with_method(self):
        """continue_request emits the HTTP method override."""
        req_id = 'req123'
        http_method = RequestMethod.POST
        command = FetchCommands.continue_request(request_id=req_id, method=http_method)

        assert command['method'] == FetchMethod.CONTINUE_REQUEST
        params = command['params']
        assert params['requestId'] == req_id
        assert params['method'] == http_method

    def test_continue_request_with_post_data(self):
        """continue_request emits post_data under the postData key."""
        req_id = 'req123'
        payload = '{"key": "value"}'
        command = FetchCommands.continue_request(request_id=req_id, post_data=payload)

        assert command['method'] == FetchMethod.CONTINUE_REQUEST
        params = command['params']
        assert params['requestId'] == req_id
        assert params['postData'] == payload

    def test_continue_request_with_headers(self):
        """continue_request emits the header entries unchanged."""
        req_id = 'req123'
        header_entries = [{'name': 'Content-Type', 'value': 'application/json'}]
        command = FetchCommands.continue_request(request_id=req_id, headers=header_entries)

        assert command['method'] == FetchMethod.CONTINUE_REQUEST
        params = command['params']
        assert params['requestId'] == req_id
        assert params['headers'] == header_entries

    def test_continue_request_with_intercept_response(self):
        """continue_request emits intercept_response under the interceptResponse key."""
        req_id = 'req123'
        intercept = True
        command = FetchCommands.continue_request(request_id=req_id, intercept_response=intercept)

        assert command['method'] == FetchMethod.CONTINUE_REQUEST
        params = command['params']
        assert params['requestId'] == req_id
        assert params['interceptResponse'] == intercept

    def test_continue_request_with_all_params(self):
        """continue_request with every optional argument supplied."""
        req_id = 'req123'
        target_url = 'https://example.com'
        http_method = RequestMethod.PUT
        payload = '{"data": "test"}'
        header_entries = [{'name': 'Authorization', 'value': 'Bearer token'}]
        intercept = False

        command = FetchCommands.continue_request(
            request_id=req_id,
            url=target_url,
            method=http_method,
            post_data=payload,
            headers=header_entries,
            intercept_response=intercept,
        )

        assert command['method'] == FetchMethod.CONTINUE_REQUEST
        params = command['params']
        assert params['requestId'] == req_id
        assert params['url'] == target_url
        assert params['method'] == http_method
        assert params['postData'] == payload
        assert params['headers'] == header_entries
        assert params['interceptResponse'] == intercept

    # ------------------------------------------------------------------
    # continue_request_with_auth
    # ------------------------------------------------------------------

    def test_continue_request_with_auth_minimal(self):
        """continue_request_with_auth nests the response type in authChallengeResponse."""
        req_id = 'req123'
        challenge_reply = AuthChallengeResponseType.PROVIDE_CREDENTIALS
        command = FetchCommands.continue_request_with_auth(
            request_id=req_id, auth_challenge_response=challenge_reply
        )

        assert command['method'] == FetchMethod.CONTINUE_WITH_AUTH
        params = command['params']
        assert params['requestId'] == req_id
        assert params['authChallengeResponse']['response'] == challenge_reply

    def test_continue_request_with_auth_credentials(self):
        """continue_request_with_auth emits the proxy username and password."""
        req_id = 'req123'
        challenge_reply = AuthChallengeResponseType.PROVIDE_CREDENTIALS
        user = 'testuser'
        secret = 'testpass'

        command = FetchCommands.continue_request_with_auth(
            request_id=req_id,
            auth_challenge_response=challenge_reply,
            proxy_username=user,
            proxy_password=secret,
        )

        assert command['method'] == FetchMethod.CONTINUE_WITH_AUTH
        params = command['params']
        assert params['requestId'] == req_id
        assert params['authChallengeResponse']['response'] == challenge_reply
        assert params['authChallengeResponse']['username'] == user
        assert params['authChallengeResponse']['password'] == secret

    def test_continue_request_with_auth_cancel(self):
        """continue_request_with_auth emits the CANCEL_AUTH response type."""
        req_id = 'req123'
        challenge_reply = AuthChallengeResponseType.CANCEL_AUTH

        command = FetchCommands.continue_request_with_auth(
            request_id=req_id, auth_challenge_response=challenge_reply
        )

        assert command['method'] == FetchMethod.CONTINUE_WITH_AUTH
        params = command['params']
        assert params['requestId'] == req_id
        assert params['authChallengeResponse']['response'] == challenge_reply

    # ------------------------------------------------------------------
    # enable / disable
    # ------------------------------------------------------------------

    def test_disable(self):
        """disable emits its method and no params entry."""
        command = FetchCommands.disable()

        assert command['method'] == FetchMethod.DISABLE
        assert 'params' not in command

    def test_enable_minimal(self):
        """enable with only handle_auth_requests yields a '*' urlPattern."""
        auth_flag = True
        command = FetchCommands.enable(handle_auth_requests=auth_flag)

        assert command['method'] == FetchMethod.ENABLE
        params = command['params']
        assert params['handleAuthRequests'] == auth_flag
        assert params['patterns'][0]['urlPattern'] == '*'

    def test_enable_with_url_pattern(self):
        """enable emits a custom url_pattern in the first pattern entry."""
        auth_flag = False
        pattern = 'https://api.example.com/*'
        command = FetchCommands.enable(handle_auth_requests=auth_flag, url_pattern=pattern)

        assert command['method'] == FetchMethod.ENABLE
        params = command['params']
        assert params['handleAuthRequests'] == auth_flag
        assert params['patterns'][0]['urlPattern'] == pattern

    def test_enable_with_resource_type(self):
        """enable emits resource_type in the first pattern entry."""
        auth_flag = True
        wanted_type = ResourceType.DOCUMENT
        command = FetchCommands.enable(handle_auth_requests=auth_flag, resource_type=wanted_type)

        assert command['method'] == FetchMethod.ENABLE
        params = command['params']
        assert params['handleAuthRequests'] == auth_flag
        assert params['patterns'][0]['resourceType'] == wanted_type

    def test_enable_with_request_stage(self):
        """enable emits request_stage in the first pattern entry."""
        auth_flag = True
        stage = RequestStage.REQUEST
        command = FetchCommands.enable(handle_auth_requests=auth_flag, request_stage=stage)

        assert command['method'] == FetchMethod.ENABLE
        params = command['params']
        assert params['handleAuthRequests'] == auth_flag
        assert params['patterns'][0]['requestStage'] == stage

    def test_enable_with_all_params(self):
        """enable with every optional argument supplied."""
        auth_flag = True
        pattern = 'https://test.com/*'
        wanted_type = ResourceType.XHR
        stage = RequestStage.RESPONSE

        command = FetchCommands.enable(
            handle_auth_requests=auth_flag,
            url_pattern=pattern,
            resource_type=wanted_type,
            request_stage=stage,
        )

        assert command['method'] == FetchMethod.ENABLE
        params = command['params']
        assert params['handleAuthRequests'] == auth_flag
        first_pattern = params['patterns'][0]
        assert first_pattern['urlPattern'] == pattern
        assert first_pattern['resourceType'] == wanted_type
        assert first_pattern['requestStage'] == stage

    # ------------------------------------------------------------------
    # fail_request
    # ------------------------------------------------------------------

    def test_fail_request(self):
        """fail_request emits the request id and the FAILED error reason."""
        req_id = 'req123'
        reason = ErrorReason.FAILED
        command = FetchCommands.fail_request(request_id=req_id, error_reason=reason)

        assert command['method'] == FetchMethod.FAIL_REQUEST
        params = command['params']
        assert params['requestId'] == req_id
        assert params['errorReason'] == reason

    def test_fail_request_with_different_error(self):
        """fail_request emits the TIMED_OUT error reason."""
        req_id = 'req123'
        reason = ErrorReason.TIMED_OUT
        command = FetchCommands.fail_request(request_id=req_id, error_reason=reason)

        assert command['method'] == FetchMethod.FAIL_REQUEST
        params = command['params']
        assert params['requestId'] == req_id
        assert params['errorReason'] == reason

    # ------------------------------------------------------------------
    # fulfill_request
    # ------------------------------------------------------------------

    def test_fulfill_request_minimal(self):
        """fulfill_request with only the request id and response code."""
        req_id = 'req123'
        status = 200
        command = FetchCommands.fulfill_request(request_id=req_id, response_code=status)

        assert command['method'] == FetchMethod.FULFILL_REQUEST
        params = command['params']
        assert params['requestId'] == req_id
        assert params['responseCode'] == status

    def test_fulfill_request_with_headers(self):
        """fulfill_request emits response_headers under the responseHeaders key."""
        req_id = 'req123'
        status = 201
        header_entries = [{'name': 'Content-Type', 'value': 'application/json'}]
        command = FetchCommands.fulfill_request(
            request_id=req_id,
            response_code=status,
            response_headers=header_entries,
        )

        assert command['method'] == FetchMethod.FULFILL_REQUEST
        params = command['params']
        assert params['requestId'] == req_id
        assert params['responseCode'] == status
        assert params['responseHeaders'] == header_entries

    def test_fulfill_request_with_body(self):
        """fulfill_request emits the body value unchanged."""
        req_id = 'req123'
        status = 200
        response_body = {'message': 'success'}
        command = FetchCommands.fulfill_request(
            request_id=req_id,
            response_code=status,
            body=response_body,
        )

        assert command['method'] == FetchMethod.FULFILL_REQUEST
        params = command['params']
        assert params['requestId'] == req_id
        assert params['responseCode'] == status
        assert params['body'] == response_body

    def test_fulfill_request_with_response_phrase(self):
        """fulfill_request emits response_phrase under the responsePhrase key."""
        req_id = 'req123'
        status = 404
        phrase = 'Not Found'
        command = FetchCommands.fulfill_request(
            request_id=req_id,
            response_code=status,
            response_phrase=phrase,
        )

        assert command['method'] == FetchMethod.FULFILL_REQUEST
        params = command['params']
        assert params['requestId'] == req_id
        assert params['responseCode'] == status
        assert params['responsePhrase'] == phrase

    def test_fulfill_request_with_all_params(self):
        """fulfill_request with every optional argument supplied."""
        req_id = 'req123'
        status = 500
        header_entries = [{'name': 'Server', 'value': 'nginx'}]
        response_body = {'error': 'Internal Server Error'}
        phrase = 'Internal Server Error'

        command = FetchCommands.fulfill_request(
            request_id=req_id,
            response_code=status,
            response_headers=header_entries,
            body=response_body,
            response_phrase=phrase,
        )

        assert command['method'] == FetchMethod.FULFILL_REQUEST
        params = command['params']
        assert params['requestId'] == req_id
        assert params['responseCode'] == status
        assert params['responseHeaders'] == header_entries
        assert params['body'] == response_body
        assert params['responsePhrase'] == phrase

    # ------------------------------------------------------------------
    # get_response_body
    # ------------------------------------------------------------------

    def test_get_response_body(self):
        """get_response_body emits the request id."""
        req_id = 'req123'
        command = FetchCommands.get_response_body(request_id=req_id)

        assert command['method'] == FetchMethod.GET_RESPONSE_BODY
        assert command['params']['requestId'] == req_id

    # ------------------------------------------------------------------
    # continue_response
    # ------------------------------------------------------------------

    def test_continue_response_minimal(self):
        """continue_response with nothing but the request id."""
        req_id = 'req123'
        command = FetchCommands.continue_response(request_id=req_id)

        assert command['method'] == FetchMethod.CONTINUE_RESPONSE
        assert command['params']['requestId'] == req_id

    def test_continue_response_with_code(self):
        """continue_response emits response_code under the responseCode key."""
        req_id = 'req123'
        status = 302
        command = FetchCommands.continue_response(request_id=req_id, response_code=status)

        assert command['method'] == FetchMethod.CONTINUE_RESPONSE
        params = command['params']
        assert params['requestId'] == req_id
        assert params['responseCode'] == status

    def test_continue_response_with_headers(self):
        """continue_response emits response_headers under the responseHeaders key."""
        req_id = 'req123'
        header_entries = [{'name': 'Location', 'value': 'https://redirect.com'}]
        command = FetchCommands.continue_response(
            request_id=req_id, response_headers=header_entries
        )

        assert command['method'] == FetchMethod.CONTINUE_RESPONSE
        params = command['params']
        assert params['requestId'] == req_id
        assert params['responseHeaders'] == header_entries

    def test_continue_response_with_phrase(self):
        """continue_response emits response_phrase under the responsePhrase key."""
        req_id = 'req123'
        phrase = 'Found'
        command = FetchCommands.continue_response(request_id=req_id, response_phrase=phrase)

        assert command['method'] == FetchMethod.CONTINUE_RESPONSE
        params = command['params']
        assert params['requestId'] == req_id
        assert params['responsePhrase'] == phrase

    def test_continue_response_with_all_params(self):
        """continue_response with every optional argument supplied."""
        req_id = 'req123'
        status = 301
        header_entries = [{'name': 'Location', 'value': 'https://new-location.com'}]
        phrase = 'Moved Permanently'

        command = FetchCommands.continue_response(
            request_id=req_id,
            response_code=status,
            response_headers=header_entries,
            response_phrase=phrase,
        )

        assert command['method'] == FetchMethod.CONTINUE_RESPONSE
        params = command['params']
        assert params['requestId'] == req_id
        assert params['responseCode'] == status
        assert params['responseHeaders'] == header_entries
        assert params['responsePhrase'] == phrase

    # ------------------------------------------------------------------
    # take_response_body_as_stream
    # ------------------------------------------------------------------

    def test_take_response_body_as_stream(self):
        """take_response_body_as_stream emits the request id."""
        req_id = 'req123'
        command = FetchCommands.take_response_body_as_stream(request_id=req_id)

        assert command['method'] == FetchMethod.TAKE_RESPONSE_BODY_AS_STREAM
        assert command['params']['requestId'] == req_id

================================================
FILE: tests/test_commands/test_input_commands.py
================================================
"""
Tests for InputCommands class.

This module contains comprehensive tests for all InputCommands methods,
verifying that they generate the correct CDP commands with proper parameters.
"""

from pydoll.commands.input_commands import InputCommands
from pydoll.protocol.input.types import (
    DragEventType,
    GestureSourceType,
    KeyEventType,
    KeyLocation,
    KeyModifier,
    MouseButton,
    MouseEventType,
    PointerType,
    TouchEventType,
)
from pydoll.protocol.input.methods import InputMethod


def test_cancel_dragging():
    """Check cancel_dragging yields the CANCEL_DRAGGING method and no params entry."""
    command = InputCommands.cancel_dragging()
    assert command['method'] == InputMethod.CANCEL_DRAGGING
    assert 'params' not in command


def test_dispatch_key_event_minimal():
    """Check dispatch_key_event when only the event type is supplied."""
    command = InputCommands.dispatch_key_event(type=KeyEventType.KEY_DOWN)
    assert command['method'] == InputMethod.DISPATCH_KEY_EVENT
    assert command['params']['type'] == KeyEventType.KEY_DOWN


def test_dispatch_key_event_with_modifiers():
    """Check dispatch_key_event carries a combined modifier mask and the text."""
    ctrl_shift = KeyModifier.CTRL | KeyModifier.SHIFT
    command = InputCommands.dispatch_key_event(
        type=KeyEventType.KEY_DOWN,
        modifiers=ctrl_shift,
        text='A',
    )
    assert command['method'] == InputMethod.DISPATCH_KEY_EVENT
    params = command['params']
    assert params['type'] == KeyEventType.KEY_DOWN
    assert params['modifiers'] == ctrl_shift
    assert params['text'] == 'A'


def test_dispatch_key_event_with_all_params():
    """Check dispatch_key_event maps every argument to its camelCase CDP parameter."""
    command = InputCommands.dispatch_key_event(
        type=KeyEventType.CHAR,
        modifiers=KeyModifier.ALT,
        timestamp=123.456,
        text='a',
        unmodified_text='A',
        key_identifier='U+0041',
        code='KeyA',
        key='a',
        windows_virtual_key_code=65,
        native_virtual_key_code=65,
        auto_repeat=True,
        is_keypad=False,
        is_system_key=False,
        location=KeyLocation.LEFT,
        commands=['selectAll'],
    )
    assert command['method'] == InputMethod.DISPATCH_KEY_EVENT

    params = command['params']
    expected_values = {
        'type': KeyEventType.CHAR,
        'modifiers': KeyModifier.ALT,
        'timestamp': 123.456,
        'text': 'a',
        'unmodifiedText': 'A',
        'keyIdentifier': 'U+0041',
        'code': 'KeyA',
        'key': 'a',
        'windowsVirtualKeyCode': 65,
        'nativeVirtualKeyCode': 65,
        'location': KeyLocation.LEFT,
        'commands': ['selectAll'],
    }
    for name, value in expected_values.items():
        assert params[name] == value

    # Boolean flags are compared by identity so truthy/falsy stand-ins are rejected.
    assert params['autoRepeat'] is True
    assert params['isKeypad'] is False
    assert params['isSystemKey'] is False


def test_dispatch_mouse_event_minimal():
    """Check dispatch_mouse_event with only the event type and coordinates."""
    command = InputCommands.dispatch_mouse_event(
        type=MouseEventType.MOUSE_PRESSED, x=100, y=200
    )
    assert command['method'] == InputMethod.DISPATCH_MOUSE_EVENT
    params = command['params']
    assert params['type'] == MouseEventType.MOUSE_PRESSED
    assert (params['x'], params['y']) == (100, 200)


def test_dispatch_mouse_event_with_button():
    """Check dispatch_mouse_event forwards the button and click count."""
    command = InputCommands.dispatch_mouse_event(
        type=MouseEventType.MOUSE_PRESSED,
        x=100,
        y=200,
        button=MouseButton.LEFT,
        click_count=1,
    )
    assert command['method'] == InputMethod.DISPATCH_MOUSE_EVENT
    params = command['params']
    assert params['type'] == MouseEventType.MOUSE_PRESSED
    assert params['x'] == 100
    assert params['y'] == 200
    assert params['button'] == MouseButton.LEFT
    assert params['clickCount'] == 1


def test_dispatch_mouse_event_with_all_params():
    """Check dispatch_mouse_event maps every argument to its camelCase CDP parameter."""
    command = InputCommands.dispatch_mouse_event(
        type=MouseEventType.MOUSE_MOVED,
        x=150,
        y=250,
        modifiers=KeyModifier.CTRL,
        timestamp=789.123,
        button=MouseButton.RIGHT,
        click_count=2,
        force=0.5,
        tangential_pressure=0.3,
        tilt_x=15.0,
        tilt_y=20.0,
        twist=45,
        delta_x=10.0,
        delta_y=15.0,
        pointer_type=PointerType.PEN,
    )
    assert command['method'] == InputMethod.DISPATCH_MOUSE_EVENT

    params = command['params']
    expected_values = {
        'type': MouseEventType.MOUSE_MOVED,
        'x': 150,
        'y': 250,
        'modifiers': KeyModifier.CTRL,
        'timestamp': 789.123,
        'button': MouseButton.RIGHT,
        'clickCount': 2,
        'force': 0.5,
        'tangentialPressure': 0.3,
        'tiltX': 15.0,
        'tiltY': 20.0,
        'twist': 45,
        'deltaX': 10.0,
        'deltaY': 15.0,
        'pointerType': PointerType.PEN,
    }
    for name, value in expected_values.items():
        assert params[name] == value


def test_dispatch_touch_event_minimal():
    """Check dispatch_touch_event when called with an empty touch point list."""
    command = InputCommands.dispatch_touch_event(
        type=TouchEventType.TOUCH_START, touch_points=[]
    )
    assert command['method'] == InputMethod.DISPATCH_TOUCH_EVENT
    assert command['params']['type'] == TouchEventType.TOUCH_START


def test_dispatch_touch_event_with_touch_points():
    """Check dispatch_touch_event forwards touch points, modifiers and timestamp."""
    single_point = {
        'x': 100,
        'y': 200,
        'radiusX': 10,
        'radiusY': 10,
        'rotationAngle': 0,
        'force': 1.0,
    }
    points = [single_point]
    command = InputCommands.dispatch_touch_event(
        type=TouchEventType.TOUCH_START,
        touch_points=points,
        modifiers=KeyModifier.SHIFT,
        timestamp=456.789,
    )
    assert command['method'] == InputMethod.DISPATCH_TOUCH_EVENT
    params = command['params']
    assert params['type'] == TouchEventType.TOUCH_START
    assert params['touchPoints'] == points
    assert params['modifiers'] == KeyModifier.SHIFT
    assert params['timestamp'] == 456.789


def test_set_ignore_input_events():
    """Check set_ignore_input_events passes the ignore flag through as True."""
    command = InputCommands.set_ignore_input_events(ignore=True)
    assert command['method'] == InputMethod.SET_IGNORE_INPUT_EVENTS
    params = command['params']
    assert params['ignore'] is True


def test_dispatch_drag_event_minimal():
    """Check dispatch_drag_event with an empty data payload."""
    command = InputCommands.dispatch_drag_event(
        type=DragEventType.DRAG_ENTER, x=100, y=200, data={}
    )
    assert command['method'] == InputMethod.DISPATCH_DRAG_EVENT
    params = command['params']
    assert params['type'] == DragEventType.DRAG_ENTER
    assert params['x'] == 100
    assert params['y'] == 200


def test_dispatch_drag_event_with_data():
    """Check dispatch_drag_event forwards the drag payload and modifiers."""
    text_item = {'mimeType': 'text/plain', 'data': 'Hello World'}
    payload = {'items': [text_item], 'dragOperationsMask': 1}
    command = InputCommands.dispatch_drag_event(
        type=DragEventType.DROP,
        x=150,
        y=250,
        data=payload,
        modifiers=KeyModifier.ALT,
    )
    assert command['method'] == InputMethod.DISPATCH_DRAG_EVENT
    params = command['params']
    assert params['type'] == DragEventType.DROP
    assert params['x'] == 150
    assert params['y'] == 250
    assert params['data'] == payload
    assert params['modifiers'] == KeyModifier.ALT


def test_emulate_touch_from_mouse_event_minimal():
    """Check emulate_touch_from_mouse_event with type, coordinates and button only."""
    command = InputCommands.emulate_touch_from_mouse_event(
        type=MouseEventType.MOUSE_PRESSED,
        x=100,
        y=200,
        button=MouseButton.LEFT,
    )
    assert command['method'] == InputMethod.EMULATE_TOUCH_FROM_MOUSE_EVENT
    params = command['params']
    assert params['type'] == MouseEventType.MOUSE_PRESSED
    assert params['x'] == 100
    assert params['y'] == 200
    assert params['button'] == MouseButton.LEFT


def test_emulate_touch_from_mouse_event_with_all_params():
    """Check emulate_touch_from_mouse_event maps every argument to its CDP parameter."""
    ctrl_shift = KeyModifier.CTRL | KeyModifier.SHIFT
    command = InputCommands.emulate_touch_from_mouse_event(
        type=MouseEventType.MOUSE_MOVED,
        x=150,
        y=250,
        button=MouseButton.RIGHT,
        timestamp=123.456,
        delta_x=10.0,
        delta_y=15.0,
        modifiers=ctrl_shift,
        click_count=2,
    )
    assert command['method'] == InputMethod.EMULATE_TOUCH_FROM_MOUSE_EVENT

    params = command['params']
    expected_values = {
        'type': MouseEventType.MOUSE_MOVED,
        'x': 150,
        'y': 250,
        'button': MouseButton.RIGHT,
        'timestamp': 123.456,
        'deltaX': 10.0,
        'deltaY': 15.0,
        'modifiers': ctrl_shift,
        'clickCount': 2,
    }
    for name, value in expected_values.items():
        assert params[name] == value


def test_ime_set_composition():
    """Check ime_set_composition forwards the text and the selection range."""
    command = InputCommands.ime_set_composition(
        text='Hello', selection_start=0, selection_end=5
    )
    assert command['method'] == InputMethod.IME_SET_COMPOSITION
    params = command['params']
    assert params['text'] == 'Hello'
    assert params['selectionStart'] == 0
    assert params['selectionEnd'] == 5


def test_ime_set_composition_with_replacement():
    """Check ime_set_composition forwards both selection and replacement ranges."""
    command = InputCommands.ime_set_composition(
        text='World',
        selection_start=0,
        selection_end=5,
        replacement_start=0,
        replacement_end=5,
    )
    assert command['method'] == InputMethod.IME_SET_COMPOSITION
    params = command['params']
    assert params['text'] == 'World'
    assert (params['selectionStart'], params['selectionEnd']) == (0, 5)
    assert (params['replacementStart'], params['replacementEnd']) == (0, 5)


def test_insert_text():
    """Check insert_text forwards the text unchanged."""
    sample = 'Hello World'
    command = InputCommands.insert_text(text=sample)
    assert command['method'] == InputMethod.INSERT_TEXT
    assert command['params']['text'] == sample


def test_set_intercept_drags_enabled():
    """Check set_intercept_drags emits enabled=True when interception is turned on."""
    command = InputCommands.set_intercept_drags(enabled=True)
    assert command['method'] == InputMethod.SET_INTERCEPT_DRAGS
    params = command['params']
    assert params['enabled'] is True


def test_set_intercept_drags_disabled():
    """Check set_intercept_drags emits enabled=False when interception is turned off."""
    command = InputCommands.set_intercept_drags(enabled=False)
    assert command['method'] == InputMethod.SET_INTERCEPT_DRAGS
    params = command['params']
    assert params['enabled'] is False


def test_synthesize_pinch_gesture_minimal():
    """Check synthesize_pinch_gesture with coordinates and scale factor only."""
    command = InputCommands.synthesize_pinch_gesture(x=100, y=200, scale_factor=2.0)
    assert command['method'] == InputMethod.SYNTHESIZE_PINCH_GESTURE
    params = command['params']
    assert params['x'] == 100
    assert params['y'] == 200
    assert params['scaleFactor'] == 2.0


def test_synthesize_pinch_gesture_with_all_params():
    """Check synthesize_pinch_gesture forwards speed and gesture source as well."""
    command = InputCommands.synthesize_pinch_gesture(
        x=150,
        y=250,
        scale_factor=1.5,
        relative_speed=100,
        gesture_source_type=GestureSourceType.TOUCH,
    )
    assert command['method'] == InputMethod.SYNTHESIZE_PINCH_GESTURE
    params = command['params']
    assert params['x'] == 150
    assert params['y'] == 250
    assert params['scaleFactor'] == 1.5
    assert params['relativeSpeed'] == 100
    assert params['gestureSourceType'] == GestureSourceType.TOUCH


def test_synthesize_scroll_gesture_minimal():
    """Check synthesize_scroll_gesture when only the coordinates are supplied."""
    command = InputCommands.synthesize_scroll_gesture(x=100, y=200)
    assert command['method'] == InputMethod.SYNTHESIZE_SCROLL_GESTURE
    params = command['params']
    assert params['x'] == 100
    assert params['y'] == 200


def test_synthesize_scroll_gesture_with_distance():
    """Check synthesize_scroll_gesture forwards the x and y scroll distances."""
    command = InputCommands.synthesize_scroll_gesture(
        x=100, y=200, x_distance=50.0, y_distance=100.0
    )
    assert command['method'] == InputMethod.SYNTHESIZE_SCROLL_GESTURE
    params = command['params']
    assert params['x'] == 100
    assert params['y'] == 200
    assert params['xDistance'] == 50.0
    assert params['yDistance'] == 100.0


def test_synthesize_scroll_gesture_with_all_params():
    """Check synthesize_scroll_gesture maps every argument to its CDP parameter."""
    command = InputCommands.synthesize_scroll_gesture(
        x=150,
        y=250,
        x_distance=75.0,
        y_distance=125.0,
        x_overscroll=10.0,
        y_overscroll=15.0,
        prevent_fling=True,
        speed=500,
        gesture_source_type=GestureSourceType.MOUSE,
        repeat_count=3,
        repeat_delay_ms=100,
        interaction_marker_name='scroll_test',
    )
    assert command['method'] == InputMethod.SYNTHESIZE_SCROLL_GESTURE

    params = command['params']
    expected_values = {
        'x': 150,
        'y': 250,
        'xDistance': 75.0,
        'yDistance': 125.0,
        'xOverscroll': 10.0,
        'yOverscroll': 15.0,
        'speed': 500,
        'gestureSourceType': GestureSourceType.MOUSE,
        'repeatCount': 3,
        'repeatDelayMs': 100,
        'interactionMarkerName': 'scroll_test',
    }
    for name, value in expected_values.items():
        assert params[name] == value

    # The flag is compared by identity so a merely truthy value is rejected.
    assert params['preventFling'] is True


def test_synthesize_tap_gesture_minimal():
    """Check synthesize_tap_gesture when only the coordinates are supplied."""
    command = InputCommands.synthesize_tap_gesture(x=100, y=200)
    assert command['method'] == InputMethod.SYNTHESIZE_TAP_GESTURE
    params = command['params']
    assert params['x'] == 100
    assert params['y'] == 200


def test_synthesize_tap_gesture_with_all_params():
    """Check synthesize_tap_gesture forwards duration, tap count and gesture source."""
    command = InputCommands.synthesize_tap_gesture(
        x=150,
        y=250,
        duration=500,
        tap_count=2,
        gesture_source_type=GestureSourceType.TOUCH,
    )
    assert command['method'] == InputMethod.SYNTHESIZE_TAP_GESTURE
    params = command['params']
    assert params['x'] == 150
    assert params['y'] == 250
    assert params['duration'] == 500
    assert params['tapCount'] == 2
    assert params['gestureSourceType'] == GestureSourceType.TOUCH


def test_mouse_wheel_event():
    """Check dispatch_mouse_event for a wheel event, including a negative delta."""
    command = InputCommands.dispatch_mouse_event(
        type=MouseEventType.MOUSE_WHEEL,
        x=100,
        y=200,
        delta_x=10.0,
        delta_y=-20.0,
    )
    assert command['method'] == InputMethod.DISPATCH_MOUSE_EVENT
    params = command['params']
    assert params['type'] == MouseEventType.MOUSE_WHEEL
    assert params['x'] == 100
    assert params['y'] == 200
    assert params['deltaX'] == 10.0
    assert params['deltaY'] == -20.0


def test_key_event_with_location():
    """Check dispatch_key_event forwards the key name together with its location."""
    command = InputCommands.dispatch_key_event(
        type=KeyEventType.KEY_DOWN, key='Shift', location=KeyLocation.LEFT
    )
    assert command['method'] == InputMethod.DISPATCH_KEY_EVENT
    params = command['params']
    assert params['type'] == KeyEventType.KEY_DOWN
    assert params['key'] == 'Shift'
    assert params['location'] == KeyLocation.LEFT


def test_touch_event_multiple_points():
    """Check dispatch_touch_event keeps both entries of a two-point touch list."""
    first_point = {
        'x': 100,
        'y': 200,
        'radiusX': 10,
        'radiusY': 10,
        'rotationAngle': 0,
        'force': 1.0,
    }
    second_point = {
        'x': 300,
        'y': 400,
        'radiusX': 15,
        'radiusY': 15,
        'rotationAngle': 45,
        'force': 0.8,
    }
    points = [first_point, second_point]
    command = InputCommands.dispatch_touch_event(
        type=TouchEventType.TOUCH_MOVE, touch_points=points
    )
    assert command['method'] == InputMethod.DISPATCH_TOUCH_EVENT
    params = command['params']
    assert params['type'] == TouchEventType.TOUCH_MOVE
    assert params['touchPoints'] == points
    assert len(params['touchPoints']) == 2


def test_drag_event_cancel():
    """Check dispatch_drag_event for the DRAG_CANCEL event type."""
    command = InputCommands.dispatch_drag_event(
        type=DragEventType.DRAG_CANCEL, x=100, y=200, data={}
    )
    assert command['method'] == InputMethod.DISPATCH_DRAG_EVENT
    params = command['params']
    assert params['type'] == DragEventType.DRAG_CANCEL
    assert params['x'] == 100
    assert params['y'] == 200


================================================
FILE: tests/test_commands/test_network_commands.py
================================================
"""
Tests for NetworkCommands class.

This module contains comprehensive tests for all NetworkCommands methods,
verifying that they generate the correct CDP commands with proper parameters.
"""

from pydoll.commands.network_commands import NetworkCommands
from pydoll.protocol.network.types import ConnectionType, ContentEncoding, CookiePriority, CookieSameSite, CookieSourceScheme
from pydoll.protocol.network.methods import NetworkMethod


def test_clear_browser_cache():
    """Check clear_browser_cache yields its method name and no params entry."""
    command = NetworkCommands.clear_browser_cache()
    assert 'params' not in command
    assert command['method'] == NetworkMethod.CLEAR_BROWSER_CACHE


def test_clear_browser_cookies():
    """Check clear_browser_cookies yields its method name and no params entry."""
    command = NetworkCommands.clear_browser_cookies()
    assert 'params' not in command
    assert command['method'] == NetworkMethod.CLEAR_BROWSER_COOKIES


def test_delete_cookies_minimal():
    """Check delete_cookies when only the cookie name is supplied."""
    cookie_name = 'test_cookie'
    command = NetworkCommands.delete_cookies(name=cookie_name)
    assert command['method'] == NetworkMethod.DELETE_COOKIES
    assert command['params']['name'] == cookie_name


def test_delete_cookies_with_url():
    """Check delete_cookies forwards the URL alongside the cookie name."""
    command = NetworkCommands.delete_cookies(
        name='test_cookie', url='https://example.com'
    )
    assert command['method'] == NetworkMethod.DELETE_COOKIES
    params = command['params']
    assert params['name'] == 'test_cookie'
    assert params['url'] == 'https://example.com'


def test_delete_cookies_with_all_params():
    """Check delete_cookies forwards url, domain, path and partition key."""
    cookie_partition = {
        'topLevelSite': 'https://example.com',
        'hasCrossSiteAncestor': False,
    }
    command = NetworkCommands.delete_cookies(
        name='test_cookie',
        url='https://example.com',
        domain='example.com',
        path='/test',
        partition_key=cookie_partition,
    )
    assert command['method'] == NetworkMethod.DELETE_COOKIES
    params = command['params']
    assert params['name'] == 'test_cookie'
    assert params['url'] == 'https://example.com'
    assert params['domain'] == 'example.com'
    assert params['path'] == '/test'
    assert params['partitionKey'] == cookie_partition


def test_disable():
    """Check disable yields the DISABLE method and no params entry."""
    command = NetworkCommands.disable()
    assert 'params' not in command
    assert command['method'] == NetworkMethod.DISABLE


def test_enable_minimal():
    """Check enable without arguments produces an empty params mapping."""
    command = NetworkCommands.enable()
    assert command['method'] == NetworkMethod.ENABLE
    params = command['params']
    assert params == {}


def test_enable_with_buffer_sizes():
    """Check enable forwards the three buffer/post-data size limits."""
    command = NetworkCommands.enable(
        max_total_buffer_size=1024000,
        max_resource_buffer_size=512000,
        max_post_data_size=65536,
    )
    assert command['method'] == NetworkMethod.ENABLE
    params = command['params']
    assert params['maxTotalBufferSize'] == 1024000
    assert params['maxResourceBufferSize'] == 512000
    assert params['maxPostDataSize'] == 65536


def test_get_cookies_minimal():
    """Check get_cookies without arguments produces an empty params mapping."""
    command = NetworkCommands.get_cookies()
    assert command['method'] == NetworkMethod.GET_COOKIES
    params = command['params']
    assert params == {}


def test_get_cookies_with_urls():
    """Check get_cookies forwards the list of URLs."""
    target_urls = ['https://example.com', 'https://test.com']
    command = NetworkCommands.get_cookies(urls=target_urls)
    assert command['method'] == NetworkMethod.GET_COOKIES
    params = command['params']
    assert params['urls'] == target_urls


def test_get_request_post_data():
    """Check get_request_post_data forwards the request id as requestId."""
    request_id = '12345'
    command = NetworkCommands.get_request_post_data(request_id=request_id)
    assert command['method'] == NetworkMethod.GET_REQUEST_POST_DATA
    assert command['params']['requestId'] == request_id


def test_get_response_body():
    """Check get_response_body forwards the request id as requestId."""
    request_id = '12345'
    command = NetworkCommands.get_response_body(request_id=request_id)
    assert command['method'] == NetworkMethod.GET_RESPONSE_BODY
    assert command['params']['requestId'] == request_id


def test_set_cache_disabled_true():
    """Check set_cache_disabled emits cacheDisabled=True."""
    command = NetworkCommands.set_cache_disabled(cache_disabled=True)
    assert command['method'] == NetworkMethod.SET_CACHE_DISABLED
    params = command['params']
    assert params['cacheDisabled'] is True


def test_set_cache_disabled_false():
    """Check set_cache_disabled emits cacheDisabled=False."""
    command = NetworkCommands.set_cache_disabled(cache_disabled=False)
    assert command['method'] == NetworkMethod.SET_CACHE_DISABLED
    params = command['params']
    assert params['cacheDisabled'] is False


def test_set_cookie_minimal():
    """Check set_cookie when only name and value are supplied."""
    command = NetworkCommands.set_cookie(name='test', value='value')
    assert command['method'] == NetworkMethod.SET_COOKIE
    params = command['params']
    assert params['name'] == 'test'
    assert params['value'] == 'value'


def test_set_cookie_with_url():
    """Check set_cookie forwards the URL alongside name and value."""
    command = NetworkCommands.set_cookie(
        name='test', value='value', url='https://example.com'
    )
    assert command['method'] == NetworkMethod.SET_COOKIE
    params = command['params']
    assert params['name'] == 'test'
    assert params['value'] == 'value'
    assert params['url'] == 'https://example.com'


def test_set_cookie_with_all_params():
    """Check set_cookie maps every argument to its camelCase CDP parameter."""
    cookie_partition = {
        'topLevelSite': 'https://example.com',
        'hasCrossSiteAncestor': False,
    }
    command = NetworkCommands.set_cookie(
        name='test',
        value='value',
        url='https://example.com',
        domain='example.com',
        path='/test',
        secure=True,
        http_only=True,
        same_site=CookieSameSite.STRICT,
        expires=1234567890.0,
        priority=CookiePriority.HIGH,
        same_party=True,
        source_scheme=CookieSourceScheme.SECURE,
        source_port=443,
        partition_key=cookie_partition,
    )
    assert command['method'] == NetworkMethod.SET_COOKIE

    params = command['params']
    expected_values = {
        'name': 'test',
        'value': 'value',
        'url': 'https://example.com',
        'domain': 'example.com',
        'path': '/test',
        'sameSite': CookieSameSite.STRICT,
        'expires': 1234567890.0,
        'priority': CookiePriority.HIGH,
        'sourceScheme': CookieSourceScheme.SECURE,
        'sourcePort': 443,
        'partitionKey': cookie_partition,
    }
    for name, value in expected_values.items():
        assert params[name] == value

    # Boolean flags are compared by identity so merely truthy values are rejected.
    for flag in ('secure', 'httpOnly', 'sameParty'):
        assert params[flag] is True


def test_set_cookies():
    """Check set_cookies forwards the list of cookie dicts unchanged."""
    url_cookie = {'name': 'cookie1', 'value': 'value1', 'url': 'https://example.com'}
    domain_cookie = {'name': 'cookie2', 'value': 'value2', 'domain': 'example.com'}
    cookie_list = [url_cookie, domain_cookie]

    command = NetworkCommands.set_cookies(cookies=cookie_list)
    assert command['method'] == NetworkMethod.SET_COOKIES
    params = command['params']
    assert params['cookies'] == cookie_list


def test_set_extra_http_headers():
    """Check set_extra_http_headers forwards the header entries unchanged."""
    extra_headers = [
        {'name': 'Authorization', 'value': 'Bearer token123'},
        {'name': 'X-Custom-Header', 'value': 'custom-value'},
    ]
    command = NetworkCommands.set_extra_http_headers(headers=extra_headers)
    assert command['method'] == NetworkMethod.SET_EXTRA_HTTP_HEADERS
    params = command['params']
    assert params['headers'] == extra_headers


def test_set_useragent_override_minimal():
    """Check set_useragent_override when only the user agent string is supplied."""
    agent = 'Mozilla/5.0 (Custom Browser)'
    command = NetworkCommands.set_useragent_override(user_agent=agent)
    assert command['method'] == NetworkMethod.SET_USER_AGENT_OVERRIDE
    params = command['params']
    assert params['userAgent'] == agent


def test_set_useragent_override_with_all_params():
    """Check set_useragent_override forwards language, platform and metadata."""
    agent = 'Mozilla/5.0 (Custom Browser)'
    language = 'en-US,en;q=0.9'
    platform_name = 'Linux x86_64'
    metadata = {
        'brands': [{'brand': 'Custom', 'version': '1.0'}],
        'fullVersionList': [{'brand': 'Custom', 'version': '1.0.0'}],
        'platform': 'Linux',
        'platformVersion': '5.4.0',
        'architecture': 'x86',
        'model': '',
        'mobile': False,
        'bitness': '64',
        'wow64': False,
    }
    command = NetworkCommands.set_useragent_override(
        user_agent=agent,
        accept_language=language,
        platform=platform_name,
        user_agent_metadata=metadata,
    )
    assert command['method'] == NetworkMethod.SET_USER_AGENT_OVERRIDE
    params = command['params']
    assert params['userAgent'] == agent
    assert params['acceptLanguage'] == language
    assert params['platform'] == platform_name
    assert params['userAgentMetadata'] == metadata


def test_clear_accepted_encodings_override():
    """Check clear_accepted_encodings_override yields its method and no params entry."""
    command = NetworkCommands.clear_accepted_encodings_override()
    assert 'params' not in command
    assert command['method'] == NetworkMethod.CLEAR_ACCEPTED_ENCODINGS_OVERRIDE


def test_enable_reporting_api():
    """Check enable_reporting_api emits enabled=True."""
    command = NetworkCommands.enable_reporting_api(enabled=True)
    assert command['method'] == NetworkMethod.ENABLE_REPORTING_API
    params = command['params']
    assert params['enabled'] is True


def test_search_in_response_body_minimal():
    """Check search_in_response_body with required args; both flags must be False."""
    command = NetworkCommands.search_in_response_body(request_id='12345', query='test')
    assert command['method'] == NetworkMethod.SEARCH_IN_RESPONSE_BODY
    params = command['params']
    assert params['requestId'] == '12345'
    assert params['query'] == 'test'
    # Neither flag was passed, yet both are expected in the params as False.
    assert params['caseSensitive'] is False
    assert params['isRegex'] is False


def test_search_in_response_body_with_options():
    """Check search_in_response_body forwards the case-sensitive and regex flags."""
    pattern = 'test.*pattern'
    command = NetworkCommands.search_in_response_body(
        request_id='12345',
        query=pattern,
        case_sensitive=True,
        is_regex=True,
    )
    assert command['method'] == NetworkMethod.SEARCH_IN_RESPONSE_BODY
    params = command['params']
    assert params['requestId'] == '12345'
    assert params['query'] == pattern
    assert params['caseSensitive'] is True
    assert params['isRegex'] is True


def test_set_blocked_urls():
    """Check set_blocked_urls forwards the URL list unchanged."""
    blocked = ['https://ads.example.com', 'https://tracker.com']
    command = NetworkCommands.set_blocked_urls(urls=blocked)
    assert command['method'] == NetworkMethod.SET_BLOCKED_URLS
    params = command['params']
    assert params['urls'] == blocked


def test_set_bypass_service_worker():
    """Check set_bypass_service_worker emits bypass=True."""
    command = NetworkCommands.set_bypass_service_worker(bypass=True)
    assert command['method'] == NetworkMethod.SET_BYPASS_SERVICE_WORKER
    params = command['params']
    assert params['bypass'] is True


def test_get_certificate():
    """Check get_certificate forwards the origin."""
    origin = 'https://example.com'
    command = NetworkCommands.get_certificate(origin=origin)
    assert command['method'] == NetworkMethod.GET_CERTIFICATE
    assert command['params']['origin'] == origin


def test_get_response_body_for_interception():
    """Check get_response_body_for_interception forwards the interception id."""
    interception_id = 'interception123'
    command = NetworkCommands.get_response_body_for_interception(
        interception_id=interception_id
    )
    assert command['method'] == NetworkMethod.GET_RESPONSE_BODY_FOR_INTERCEPTION
    assert command['params']['interceptionId'] == interception_id


def test_set_accepted_encodings():
    """Check set_accepted_encodings forwards the encoding list unchanged."""
    accepted = [ContentEncoding.GZIP, ContentEncoding.BR]
    command = NetworkCommands.set_accepted_encodings(encodings=accepted)
    assert command['method'] == NetworkMethod.SET_ACCEPTED_ENCODINGS
    params = command['params']
    assert params['encodings'] == accepted


def test_set_attach_debug_stack():
    """Check set_attach_debug_stack emits enabled=True."""
    command = NetworkCommands.set_attach_debug_stack(enabled=True)
    assert command['method'] == NetworkMethod.SET_ATTACH_DEBUG_STACK
    params = command['params']
    assert params['enabled'] is True


def test_set_cookie_controls_minimal():
    """Check set_cookie_controls with only the third-party restriction flag."""
    command = NetworkCommands.set_cookie_controls(enable_third_party_cookie_restriction=True)
    assert command['method'] == NetworkMethod.SET_COOKIE_CONTROLS
    params = command['params']
    assert params['enableThirdPartyCookieRestriction'] is True


def test_set_cookie_controls_with_all_params():
    """Check set_cookie_controls forwards all three third-party cookie flags."""
    command = NetworkCommands.set_cookie_controls(
        enable_third_party_cookie_restriction=True,
        disable_third_party_cookie_metadata=False,
        disable_third_party_cookie_heuristics=True,
    )
    assert command['method'] == NetworkMethod.SET_COOKIE_CONTROLS
    params = command['params']
    assert params['enableThirdPartyCookieRestriction'] is True
    assert params['disableThirdPartyCookieMetadata'] is False
    assert params['disableThirdPartyCookieHeuristics'] is True


def test_stream_resource_content():
    """Check stream_resource_content forwards the request id as requestId."""
    request_id = '12345'
    command = NetworkCommands.stream_resource_content(request_id=request_id)
    assert command['method'] == NetworkMethod.STREAM_RESOURCE_CONTENT
    assert command['params']['requestId'] == request_id


def test_take_response_body_for_interception_as_stream():
    """The interception id is emitted as ``interceptionId``."""
    command = NetworkCommands.take_response_body_for_interception_as_stream(
        interception_id='interception123',
    )
    expected_method = NetworkMethod.TAKE_RESPONSE_BODY_FOR_INTERCEPTION_AS_STREAM
    assert command['method'] == expected_method
    params = command['params']
    assert params['interceptionId'] == 'interception123'


def test_emulate_network_conditions_minimal():
    """The four required throttling arguments appear in the params."""
    command = NetworkCommands.emulate_network_conditions(
        offline=False,
        latency=100.0,
        download_throughput=1000000.0,
        upload_throughput=500000.0,
    )
    assert command['method'] == NetworkMethod.EMULATE_NETWORK_CONDITIONS
    params = command['params']
    assert params['offline'] is False
    assert params['latency'] == 100.0
    assert params['downloadThroughput'] == 1000000.0
    assert params['uploadThroughput'] == 500000.0


def test_emulate_network_conditions_with_all_params():
    """Required and optional throttling arguments all reach the params."""
    command = NetworkCommands.emulate_network_conditions(
        offline=False,
        latency=200.0,
        download_throughput=2000000.0,
        upload_throughput=1000000.0,
        connection_type=ConnectionType.CELLULAR4G,
        packet_loss=0.1,
        packet_queue_length=100,
        packet_reordering=True,
    )
    assert command['method'] == NetworkMethod.EMULATE_NETWORK_CONDITIONS
    params = command['params']
    assert params['offline'] is False
    assert params['latency'] == 200.0
    assert params['downloadThroughput'] == 2000000.0
    assert params['uploadThroughput'] == 1000000.0
    assert params['connectionType'] == ConnectionType.CELLULAR4G
    assert params['packetLoss'] == 0.1
    assert params['packetQueueLength'] == 100
    assert params['packetReordering'] is True


def test_get_security_isolation_status_minimal():
    """Called without arguments, the command carries an empty params dict."""
    command = NetworkCommands.get_security_isolation_status()
    assert command['method'] == NetworkMethod.GET_SECURITY_ISOLATION_STATUS
    assert command['params'] == {}


def test_get_security_isolation_status_with_frame_id():
    """A supplied frame id is emitted as ``frameId``."""
    command = NetworkCommands.get_security_isolation_status(frame_id='frame123')
    assert command['method'] == NetworkMethod.GET_SECURITY_ISOLATION_STATUS
    params = command['params']
    assert params['frameId'] == 'frame123'


def test_load_network_resource():
    """URL and load options are forwarded to the command params."""
    load_options = {'disableCache': True, 'includeCredentials': False}
    command = NetworkCommands.load_network_resource(
        url='https://example.com/resource',
        options=load_options,
    )
    assert command['method'] == NetworkMethod.LOAD_NETWORK_RESOURCE
    params = command['params']
    assert params['url'] == 'https://example.com/resource'
    assert params['options'] == load_options


def test_load_network_resource_with_frame_id():
    """URL, options and the optional frame id all reach the params."""
    load_options = {'disableCache': False, 'includeCredentials': True}
    command = NetworkCommands.load_network_resource(
        url='https://example.com/resource',
        options=load_options,
        frame_id='frame123',
    )
    assert command['method'] == NetworkMethod.LOAD_NETWORK_RESOURCE
    params = command['params']
    assert params['url'] == 'https://example.com/resource'
    assert params['options'] == load_options
    assert params['frameId'] == 'frame123'


def test_replay_xhr():
    """The request id is emitted as ``requestId``."""
    command = NetworkCommands.replay_xhr(request_id='12345')
    assert command['method'] == NetworkMethod.REPLAY_XHR
    params = command['params']
    assert params['requestId'] == '12345'


================================================
FILE: tests/test_commands/test_page_commands.py
================================================
"""
Tests for PageCommands class.

This module contains comprehensive tests for all PageCommands methods,
verifying that they generate the correct CDP commands with proper parameters.
"""

from pydoll.commands.page_commands import PageCommands
from pydoll.protocol.page.types import (
    ReferrerPolicy,
    ScreencastFormat,
    ScreenshotFormat,
    TransferMode,
    TransitionType,
    WebLifecycleState,
)
from pydoll.protocol.page.methods import PageMethod


def test_add_script_to_evaluate_on_new_document_minimal():
    """With only ``source`` given, the script text lands in the params."""
    script = 'console.log("Hello World");'
    command = PageCommands.add_script_to_evaluate_on_new_document(source=script)
    assert command['method'] == PageMethod.ADD_SCRIPT_TO_EVALUATE_ON_NEW_DOCUMENT
    params = command['params']
    assert params['source'] == script


def test_add_script_to_evaluate_on_new_document_with_all_params():
    """Source, world name and both boolean flags are all forwarded."""
    script = 'console.log("Test");'
    command = PageCommands.add_script_to_evaluate_on_new_document(
        source=script,
        world_name='test_world',
        include_command_line_api=True,
        run_immediately=False,
    )
    assert command['method'] == PageMethod.ADD_SCRIPT_TO_EVALUATE_ON_NEW_DOCUMENT
    params = command['params']
    assert params['source'] == script
    assert params['worldName'] == 'test_world'
    assert params['includeCommandLineAPI'] is True
    assert params['runImmediately'] is False


def test_bring_to_front():
    """bring_to_front yields a command with a method and no params key."""
    command = PageCommands.bring_to_front()
    assert command['method'] == PageMethod.BRING_TO_FRONT
    assert 'params' not in command


def test_capture_screenshot_minimal():
    """Called without arguments, capture_screenshot has empty params."""
    command = PageCommands.capture_screenshot()
    assert command['method'] == PageMethod.CAPTURE_SCREENSHOT
    assert command['params'] == {}


def test_capture_screenshot_with_format_and_quality():
    """Image format and quality are forwarded to the params."""
    command = PageCommands.capture_screenshot(
        format=ScreenshotFormat.JPEG,
        quality=80,
    )
    assert command['method'] == PageMethod.CAPTURE_SCREENSHOT
    params = command['params']
    assert params['format'] == ScreenshotFormat.JPEG
    assert params['quality'] == 80


def test_capture_screenshot_with_clip():
    """A clip rectangle is passed through alongside the image format."""
    region = {'x': 10, 'y': 20, 'width': 100, 'height': 200, 'scale': 1.0}
    command = PageCommands.capture_screenshot(
        format=ScreenshotFormat.PNG,
        clip=region,
    )
    assert command['method'] == PageMethod.CAPTURE_SCREENSHOT
    params = command['params']
    assert params['format'] == ScreenshotFormat.PNG
    assert params['clip'] == region


def test_capture_screenshot_with_all_params():
    """Every capture_screenshot argument maps to its camelCase key."""
    region = {'x': 0, 'y': 0, 'width': 1920, 'height': 1080, 'scale': 1.0}
    command = PageCommands.capture_screenshot(
        format=ScreenshotFormat.WEBP,
        quality=90,
        clip=region,
        from_surface=True,
        capture_beyond_viewport=False,
        optimize_for_speed=True,
    )
    assert command['method'] == PageMethod.CAPTURE_SCREENSHOT
    params = command['params']
    assert params['format'] == ScreenshotFormat.WEBP
    assert params['quality'] == 90
    assert params['clip'] == region
    assert params['fromSurface'] is True
    assert params['captureBeyondViewport'] is False
    assert params['optimizeForSpeed'] is True


def test_close():
    """close yields a command with a method and no params key."""
    command = PageCommands.close()
    assert command['method'] == PageMethod.CLOSE
    assert 'params' not in command


def test_create_isolated_world_minimal():
    """With only a frame id given, it is emitted as ``frameId``."""
    command = PageCommands.create_isolated_world(frame_id='frame123')
    assert command['method'] == PageMethod.CREATE_ISOLATED_WORLD
    params = command['params']
    assert params['frameId'] == 'frame123'


def test_create_isolated_world_with_all_params():
    """Frame id, world name and the access flag are all forwarded."""
    command = PageCommands.create_isolated_world(
        frame_id='frame123',
        world_name='test_world',
        grant_universal_access=True,
    )
    assert command['method'] == PageMethod.CREATE_ISOLATED_WORLD
    params = command['params']
    assert params['frameId'] == 'frame123'
    assert params['worldName'] == 'test_world'
    # NOTE(review): the key really is spelled "Univeral" here; this appears to
    # mirror the parameter name in the CDP spec -- confirm before "fixing" it.
    assert params['grantUniveralAccess'] is True


def test_disable():
    """disable yields a command with a method and no params key."""
    command = PageCommands.disable()
    assert command['method'] == PageMethod.DISABLE
    assert 'params' not in command


def test_enable_minimal():
    """Called without arguments, enable carries an empty params dict."""
    command = PageCommands.enable()
    assert command['method'] == PageMethod.ENABLE
    assert command['params'] == {}


def test_enable_with_file_chooser():
    """The file-chooser flag is emitted as ``enableFileChooserOpenedEvent``."""
    command = PageCommands.enable(enable_file_chooser_opened_event=True)
    assert command['method'] == PageMethod.ENABLE
    params = command['params']
    assert params['enableFileChooserOpenedEvent'] is True


def test_get_app_manifest_minimal():
    """Called without arguments, get_app_manifest has empty params."""
    command = PageCommands.get_app_manifest()
    assert command['method'] == PageMethod.GET_APP_MANIFEST
    assert command['params'] == {}


def test_get_app_manifest_with_id():
    """A supplied manifest id is emitted as ``manifestId``."""
    command = PageCommands.get_app_manifest(manifest_id='manifest123')
    assert command['method'] == PageMethod.GET_APP_MANIFEST
    params = command['params']
    assert params['manifestId'] == 'manifest123'


def test_get_frame_tree():
    """get_frame_tree yields a command with a method and no params key."""
    command = PageCommands.get_frame_tree()
    assert command['method'] == PageMethod.GET_FRAME_TREE
    assert 'params' not in command


def test_get_layout_metrics():
    """get_layout_metrics yields a command with a method and no params key."""
    command = PageCommands.get_layout_metrics()
    assert command['method'] == PageMethod.GET_LAYOUT_METRICS
    assert 'params' not in command


def test_get_navigation_history():
    """get_navigation_history yields a method and no params key."""
    command = PageCommands.get_navigation_history()
    assert command['method'] == PageMethod.GET_NAVIGATION_HISTORY
    assert 'params' not in command


def test_handle_javascript_dialog_accept():
    """Accepting a dialog sets ``accept`` to True in the params."""
    command = PageCommands.handle_javascript_dialog(accept=True)
    assert command['method'] == PageMethod.HANDLE_JAVASCRIPT_DIALOG
    params = command['params']
    assert params['accept'] is True


def test_handle_javascript_dialog_with_prompt():
    """Prompt text is emitted as ``promptText`` next to ``accept``."""
    command = PageCommands.handle_javascript_dialog(
        accept=True,
        prompt_text='test input',
    )
    assert command['method'] == PageMethod.HANDLE_JAVASCRIPT_DIALOG
    params = command['params']
    assert params['accept'] is True
    assert params['promptText'] == 'test input'


def test_navigate_minimal():
    """With only a URL given, it appears under ``url``."""
    command = PageCommands.navigate(url='https://example.com')
    assert command['method'] == PageMethod.NAVIGATE
    params = command['params']
    assert params['url'] == 'https://example.com'


def test_navigate_with_all_params():
    """URL, referrer, transition, frame and policy are all forwarded."""
    command = PageCommands.navigate(
        url='https://example.com',
        referrer='https://google.com',
        transition_type=TransitionType.LINK,
        frame_id='frame123',
        referrer_policy=ReferrerPolicy.STRICT_ORIGIN,
    )
    assert command['method'] == PageMethod.NAVIGATE
    params = command['params']
    assert params['url'] == 'https://example.com'
    assert params['referrer'] == 'https://google.com'
    assert params['transitionType'] == TransitionType.LINK
    assert params['frameId'] == 'frame123'
    assert params['referrerPolicy'] == ReferrerPolicy.STRICT_ORIGIN


def test_navigate_to_history_entry():
    """The history entry id is emitted as ``entryId``."""
    command = PageCommands.navigate_to_history_entry(entry_id=5)
    assert command['method'] == PageMethod.NAVIGATE_TO_HISTORY_ENTRY
    params = command['params']
    assert params['entryId'] == 5


def test_print_to_pdf_minimal():
    """Called without arguments, print_to_pdf has empty params."""
    command = PageCommands.print_to_pdf()
    assert command['method'] == PageMethod.PRINT_TO_PDF
    assert command['params'] == {}


def test_print_to_pdf_with_basic_params():
    """Orientation, scale and paper size are forwarded to the params."""
    command = PageCommands.print_to_pdf(
        landscape=True,
        scale=1.5,
        paper_width=8.5,
        paper_height=11.0,
    )
    assert command['method'] == PageMethod.PRINT_TO_PDF
    params = command['params']
    assert params['landscape'] is True
    assert params['scale'] == 1.5
    assert params['paperWidth'] == 8.5
    assert params['paperHeight'] == 11.0


def test_print_to_pdf_with_all_params():
    """Every print_to_pdf argument maps to its camelCase params key."""
    header_html = '<div>Header</div>'
    footer_html = '<div>Footer</div>'
    command = PageCommands.print_to_pdf(
        landscape=False,
        display_header_footer=True,
        print_background=True,
        scale=1.0,
        paper_width=8.5,
        paper_height=11.0,
        margin_top=0.5,
        margin_bottom=0.5,
        margin_left=0.5,
        margin_right=0.5,
        page_ranges='1-5',
        header_template=header_html,
        footer_template=footer_html,
        prefer_css_page_size=True,
        transfer_mode=TransferMode.RETURN_AS_BASE64,
        generate_tagged_pdf=True,
        generate_document_outline=False,
    )
    assert command['method'] == PageMethod.PRINT_TO_PDF
    params = command['params']
    # Layout flags and page geometry.
    assert params['landscape'] is False
    assert params['displayHeaderFooter'] is True
    assert params['printBackground'] is True
    assert params['scale'] == 1.0
    assert params['paperWidth'] == 8.5
    assert params['paperHeight'] == 11.0
    # Margins.
    assert params['marginTop'] == 0.5
    assert params['marginBottom'] == 0.5
    assert params['marginLeft'] == 0.5
    assert params['marginRight'] == 0.5
    # Page selection and templates.
    assert params['pageRanges'] == '1-5'
    assert params['headerTemplate'] == header_html
    assert params['footerTemplate'] == footer_html
    # Output options.
    assert params['preferCSSPageSize'] is True
    assert params['transferMode'] == TransferMode.RETURN_AS_BASE64
    assert params['generateTaggedPDF'] is True
    assert params['generateDocumentOutline'] is False


def test_reload_minimal():
    """Called without arguments, reload carries an empty params dict."""
    command = PageCommands.reload()
    assert command['method'] == PageMethod.RELOAD
    assert command['params'] == {}


def test_reload_with_all_params():
    """Cache flag, on-load script and loader id are all forwarded."""
    on_load_script = 'console.log("reloaded");'
    command = PageCommands.reload(
        ignore_cache=True,
        script_to_evaluate_on_load=on_load_script,
        loader_id='loader123',
    )
    assert command['method'] == PageMethod.RELOAD
    params = command['params']
    assert params['ignoreCache'] is True
    assert params['scriptToEvaluateOnLoad'] == on_load_script
    assert params['loaderId'] == 'loader123'


def test_reset_navigation_history():
    """reset_navigation_history yields a method and no params key."""
    command = PageCommands.reset_navigation_history()
    assert command['method'] == PageMethod.RESET_NAVIGATION_HISTORY
    assert 'params' not in command


def test_remove_script_to_evaluate_on_new_document():
    """The script identifier is emitted under ``identifier``."""
    command = PageCommands.remove_script_to_evaluate_on_new_document(
        identifier='script123',
    )
    expected_method = PageMethod.REMOVE_SCRIPT_TO_EVALUATE_ON_NEW_DOCUMENT
    assert command['method'] == expected_method
    params = command['params']
    assert params['identifier'] == 'script123'


def test_set_bypass_csp():
    """The ``enabled`` flag is carried through to the command params."""
    command = PageCommands.set_bypass_csp(enabled=True)
    assert command['method'] == PageMethod.SET_BYPASS_CSP
    params = command['params']
    assert params['enabled'] is True


def test_set_document_content():
    """Frame id and HTML markup are forwarded to the params."""
    markup = '<html><body>Test</body></html>'
    command = PageCommands.set_document_content(
        frame_id='frame123',
        html=markup,
    )
    assert command['method'] == PageMethod.SET_DOCUMENT_CONTENT
    params = command['params']
    assert params['frameId'] == 'frame123'
    assert params['html'] == markup


def test_set_intercept_file_chooser_dialog():
    """The ``enabled`` flag is carried through to the command params."""
    command = PageCommands.set_intercept_file_chooser_dialog(enabled=True)
    assert command['method'] == PageMethod.SET_INTERCEPT_FILE_CHOOSER_DIALOG
    params = command['params']
    assert params['enabled'] is True


def test_set_lifecycle_events_enabled():
    """The ``enabled`` flag is carried through to the command params."""
    command = PageCommands.set_lifecycle_events_enabled(enabled=True)
    assert command['method'] == PageMethod.SET_LIFECYCLE_EVENTS_ENABLED
    params = command['params']
    assert params['enabled'] is True


def test_stop_loading():
    """stop_loading yields a command with a method and no params key."""
    command = PageCommands.stop_loading()
    assert command['method'] == PageMethod.STOP_LOADING
    assert 'params' not in command


def test_add_compilation_cache():
    """Script URL and cache data are forwarded to the params."""
    script_url = 'https://example.com/script.js'
    command = PageCommands.add_compilation_cache(
        url=script_url,
        data='compiled_data_here',
    )
    assert command['method'] == PageMethod.ADD_COMPILATION_CACHE
    params = command['params']
    assert params['url'] == script_url
    assert params['data'] == 'compiled_data_here'


def test_capture_snapshot():
    """The snapshot format string is emitted under ``format``."""
    command = PageCommands.capture_snapshot(format='mhtml')
    assert command['method'] == PageMethod.CAPTURE_SNAPSHOT
    params = command['params']
    assert params['format'] == 'mhtml'


def test_clear_compilation_cache():
    """clear_compilation_cache yields a method and no params key."""
    command = PageCommands.clear_compilation_cache()
    assert command['method'] == PageMethod.CLEAR_COMPILATION_CACHE
    assert 'params' not in command


def test_crash():
    """crash yields a command with a method and no params key."""
    command = PageCommands.crash()
    assert command['method'] == PageMethod.CRASH
    assert 'params' not in command


def test_generate_test_report_minimal():
    """With only a message given, it appears under ``message``."""
    command = PageCommands.generate_test_report(message='Test message')
    assert command['method'] == PageMethod.GENERATE_TEST_REPORT
    params = command['params']
    assert params['message'] == 'Test message'


def test_generate_test_report_with_group():
    """Message and the optional group are both forwarded."""
    command = PageCommands.generate_test_report(
        message='Test message',
        group='test_group',
    )
    assert command['method'] == PageMethod.GENERATE_TEST_REPORT
    params = command['params']
    assert params['message'] == 'Test message'
    assert params['group'] == 'test_group'


def test_get_ad_script_ancestry_ids():
    """The frame id is emitted as ``frameId``."""
    command = PageCommands.get_ad_script_ancestry_ids(frame_id='frame123')
    assert command['method'] == PageMethod.GET_AD_SCRIPT_ANCESTRY_IDS
    params = command['params']
    assert params['frameId'] == 'frame123'


def test_get_app_id_minimal():
    """Called without arguments, get_app_id has empty params."""
    command = PageCommands.get_app_id()
    assert command['method'] == PageMethod.GET_APP_ID
    assert command['params'] == {}


def test_get_app_id_with_params():
    """App id and recommended id map to ``appId`` and ``recommendedId``."""
    command = PageCommands.get_app_id(
        app_id='app123',
        recommended_id='rec456',
    )
    assert command['method'] == PageMethod.GET_APP_ID
    params = command['params']
    assert params['appId'] == 'app123'
    assert params['recommendedId'] == 'rec456'


def test_get_installability_errors():
    """get_installability_errors yields a method and no params key."""
    command = PageCommands.get_installability_errors()
    assert command['method'] == PageMethod.GET_INSTALLABILITY_ERRORS
    assert 'params' not in command


def test_get_origin_trials():
    """The frame id is emitted as ``frameId``."""
    command = PageCommands.get_origin_trials(frame_id='frame123')
    assert command['method'] == PageMethod.GET_ORIGIN_TRIALS
    params = command['params']
    assert params['frameId'] == 'frame123'


def test_get_permissions_policy_state():
    """The frame id is emitted as ``frameId``."""
    command = PageCommands.get_permissions_policy_state(frame_id='frame123')
    assert command['method'] == PageMethod.GET_PERMISSIONS_POLICY_STATE
    params = command['params']
    assert params['frameId'] == 'frame123'


def test_get_resource_content():
    """Frame id and resource URL are forwarded to the params."""
    resource_url = 'https://example.com/resource.js'
    command = PageCommands.get_resource_content(
        frame_id='frame123',
        url=resource_url,
    )
    assert command['method'] == PageMethod.GET_RESOURCE_CONTENT
    params = command['params']
    assert params['frameId'] == 'frame123'
    assert params['url'] == resource_url


def test_get_resource_tree():
    """get_resource_tree yields a command with a method and no params key."""
    command = PageCommands.get_resource_tree()
    assert command['method'] == PageMethod.GET_RESOURCE_TREE
    assert 'params' not in command


def test_produce_compilation_cache():
    """The list of script descriptors is forwarded under ``scripts``."""
    eager_script = {'url': 'https://example.com/script1.js', 'eager': True}
    lazy_script = {'url': 'https://example.com/script2.js', 'eager': False}
    script_list = [eager_script, lazy_script]
    command = PageCommands.produce_compilation_cache(scripts=script_list)
    assert command['method'] == PageMethod.PRODUCE_COMPILATION_CACHE
    params = command['params']
    assert params['scripts'] == script_list


def test_screencast_frame_ack():
    """The session id is emitted as ``sessionId``."""
    command = PageCommands.screencast_frame_ack(session_id='session123')
    assert command['method'] == PageMethod.SCREENCAST_FRAME_ACK
    params = command['params']
    assert params['sessionId'] == 'session123'


def test_search_in_resource_minimal():
    """Frame id, URL and query are forwarded when no options are given."""
    resource_url = 'https://example.com/resource.js'
    command = PageCommands.search_in_resource(
        frame_id='frame123',
        url=resource_url,
        query='function',
    )
    assert command['method'] == PageMethod.SEARCH_IN_RESOURCE
    params = command['params']
    assert params['frameId'] == 'frame123'
    assert params['url'] == resource_url
    assert params['query'] == 'function'


def test_search_in_resource_with_options():
    """Case-sensitivity and regex flags accompany the search arguments."""
    resource_url = 'https://example.com/resource.js'
    pattern = 'function.*test'
    command = PageCommands.search_in_resource(
        frame_id='frame123',
        url=resource_url,
        query=pattern,
        case_sensitive=True,
        is_regex=True,
    )
    assert command['method'] == PageMethod.SEARCH_IN_RESOURCE
    params = command['params']
    assert params['frameId'] == 'frame123'
    assert params['url'] == resource_url
    assert params['query'] == pattern
    assert params['caseSensitive'] is True
    assert params['isRegex'] is True


def test_set_ad_blocking_enabled():
    """The ``enabled`` flag is carried through to the command params."""
    command = PageCommands.set_ad_blocking_enabled(enabled=True)
    assert command['method'] == PageMethod.SET_AD_BLOCKING_ENABLED
    params = command['params']
    assert params['enabled'] is True


def test_set_font_families():
    """Default families and per-script overrides are both forwarded."""
    families = {
        'standard': 'Arial',
        'serif': 'Times New Roman',
        'sansSerif': 'Helvetica',
        'cursive': 'Comic Sans MS',
        'fantasy': 'Impact',
        'math': 'Latin Modern Math',
    }
    per_script = [{'script': 'Latn', 'fontFamilies': families}]
    command = PageCommands.set_font_families(
        font_families=families,
        for_scripts=per_script,
    )
    assert command['method'] == PageMethod.SET_FONT_FAMILIES
    params = command['params']
    assert params['fontFamilies'] == families
    assert params['forScripts'] == per_script


def test_set_font_sizes():
    """The font-size mapping is forwarded under ``fontSizes``."""
    sizes = {'standard': 16, 'fixed': 14}
    command = PageCommands.set_font_sizes(font_sizes=sizes)
    assert command['method'] == PageMethod.SET_FONT_SIZES
    params = command['params']
    assert params['fontSizes'] == sizes


def test_set_prerendering_allowed():
    """Test set_prerendering_allowed method.

    The ``is_allowed`` argument must reach the command params as the boolean
    ``True`` under the ``isAllowed`` key.
    """
    result = PageCommands.set_prerendering_allowed(is_allowed=True)
    assert result['method'] == PageMethod.SET_PRERENDERING_ALLOWED
    # Identity check (not ``== True``) so truthy look-alikes such as 1 fail,
    # matching how the other boolean params in this module are asserted.
    assert result['params']['isAllowed'] is True


def test_set_rph_registration_mode():
    """The auto-response mode is forwarded under ``mode``."""
    from pydoll.protocol.page.methods import AutoResponseMode

    chosen_mode = AutoResponseMode.AUTO_ACCEPT
    command = PageCommands.set_rph_registration_mode(mode=chosen_mode)
    assert command['method'] == PageMethod.SET_RPH_REGISTRATION_MODE
    params = command['params']
    assert params['mode'] == AutoResponseMode.AUTO_ACCEPT


def test_set_spc_transaction_mode():
    """The auto-response mode is forwarded under ``mode``."""
    from pydoll.protocol.page.methods import AutoResponseMode

    chosen_mode = AutoResponseMode.AUTO_REJECT
    command = PageCommands.set_spc_transaction_mode(mode=chosen_mode)
    assert command['method'] == PageMethod.SET_SPC_TRANSACTION_MODE
    params = command['params']
    assert params['mode'] == AutoResponseMode.AUTO_REJECT


def test_set_web_lifecycle_state():
    """The lifecycle state is forwarded under ``state``."""
    command = PageCommands.set_web_lifecycle_state(state=WebLifecycleState.FROZEN)
    assert command['method'] == PageMethod.SET_WEB_LIFECYCLE_STATE
    params = command['params']
    assert params['state'] == WebLifecycleState.FROZEN


def test_start_screencast_minimal():
    """With only a format given, it appears under ``format``."""
    command = PageCommands.start_screencast(format=ScreencastFormat.JPEG)
    assert command['method'] == PageMethod.START_SCREENCAST
    params = command['params']
    assert params['format'] == ScreencastFormat.JPEG


def test_start_screencast_with_all_params():
    """Format, quality, size limits and frame stride are all forwarded."""
    command = PageCommands.start_screencast(
        format=ScreencastFormat.PNG,
        quality=80,
        max_width=1920,
        max_height=1080,
        every_nth_frame=2,
    )
    assert command['method'] == PageMethod.START_SCREENCAST
    params = command['params']
    assert params['format'] == ScreencastFormat.PNG
    assert params['quality'] == 80
    assert params['maxWidth'] == 1920
    assert params['maxHeight'] == 1080
    assert params['everyNthFrame'] == 2


def test_stop_screencast():
    """stop_screencast yields a command with a method and no params key."""
    command = PageCommands.stop_screencast()
    assert command['method'] == PageMethod.STOP_SCREENCAST
    assert 'params' not in command


def test_wait_for_debugger():
    """wait_for_debugger yields a command with a method and no params key."""
    command = PageCommands.wait_for_debugger()
    assert command['method'] == PageMethod.WAIT_FOR_DEBUGGER
    assert 'params' not in command


================================================
FILE: tests/test_commands/test_runtime_commands.py
================================================
"""
Tests for RuntimeCommands class.

This module contains comprehensive tests for all RuntimeCommands methods,
verifying that they generate the correct CDP commands with proper parameters.
"""

from pydoll.commands.runtime_commands import RuntimeCommands
from pydoll.protocol.runtime.methods import RuntimeMethod


def test_add_binding_minimal():
    """With only a name given, it appears under ``name``."""
    command = RuntimeCommands.add_binding(name='testBinding')
    assert command['method'] == RuntimeMethod.ADD_BINDING
    params = command['params']
    assert params['name'] == 'testBinding'


def test_add_binding_with_context():
    """The context name is emitted as ``executionContextName``."""
    command = RuntimeCommands.add_binding(
        name='testBinding',
        execution_context_name='main',
    )
    assert command['method'] == RuntimeMethod.ADD_BINDING
    params = command['params']
    assert params['name'] == 'testBinding'
    assert params['executionContextName'] == 'main'


def test_await_promise_minimal():
    """The promise object id is emitted as ``promiseObjectId``."""
    command = RuntimeCommands.await_promise(promise_object_id='promise123')
    assert command['method'] == RuntimeMethod.AWAIT_PROMISE
    params = command['params']
    assert params['promiseObjectId'] == 'promise123'


def test_await_promise_with_all_params():
    """Promise id and both boolean options are forwarded."""
    command = RuntimeCommands.await_promise(
        promise_object_id='promise123',
        return_by_value=True,
        generate_preview=False,
    )
    assert command['method'] == RuntimeMethod.AWAIT_PROMISE
    params = command['params']
    assert params['promiseObjectId'] == 'promise123'
    assert params['returnByValue'] is True
    assert params['generatePreview'] is False


def test_call_function_on_minimal():
    """With only a declaration given, it is emitted as ``functionDeclaration``."""
    declaration = 'function() { return this.value; }'
    command = RuntimeCommands.call_function_on(function_declaration=declaration)
    assert command['method'] == RuntimeMethod.CALL_FUNCTION_ON
    params = command['params']
    assert params['functionDeclaration'] == declaration


def test_call_function_on_with_object_id():
    """The target object id accompanies the function declaration."""
    declaration = 'function() { return this.value; }'
    command = RuntimeCommands.call_function_on(
        function_declaration=declaration,
        object_id='obj123',
    )
    assert command['method'] == RuntimeMethod.CALL_FUNCTION_ON
    params = command['params']
    assert params['functionDeclaration'] == declaration
    assert params['objectId'] == 'obj123'


def test_call_function_on_with_all_params():
    """Every call_function_on argument maps to its camelCase params key."""
    declaration = 'function(a, b) { return a + b; }'
    call_args = [{'value': 42}, {'value': 'test string'}]
    serialization = {'serialization': 'deep', 'maxDepth': 5}
    command = RuntimeCommands.call_function_on(
        function_declaration=declaration,
        object_id='obj123',
        arguments=call_args,
        silent=True,
        return_by_value=False,
        generate_preview=True,
        user_gesture=False,
        await_promise=True,
        execution_context_id='ctx456',
        object_group='testGroup',
        throw_on_side_effect=False,
        unique_context_id='unique789',
        serialization_options=serialization,
    )
    assert command['method'] == RuntimeMethod.CALL_FUNCTION_ON
    params = command['params']
    # What to call and with which arguments.
    assert params['functionDeclaration'] == declaration
    assert params['objectId'] == 'obj123'
    assert params['arguments'] == call_args
    # Boolean evaluation options.
    assert params['silent'] is True
    assert params['returnByValue'] is False
    assert params['generatePreview'] is True
    assert params['userGesture'] is False
    assert params['awaitPromise'] is True
    # Context selection and remaining options.
    assert params['executionContextId'] == 'ctx456'
    assert params['objectGroup'] == 'testGroup'
    assert params['throwOnSideEffect'] is False
    assert params['uniqueContextId'] == 'unique789'
    assert params['serializationOptions'] == serialization


def test_compile_script_minimal():
    """Verify compile_script with only an expression and source URL forwards both values."""
    source = '2 + 2'
    url = 'https://example.com/script.js'
    command = RuntimeCommands.compile_script(expression=source, source_url=url)

    assert command['method'] == RuntimeMethod.COMPILE_SCRIPT
    params = command['params']
    assert params['expression'] == source
    assert params['sourceURL'] == url


def test_compile_script_with_all_params():
    """Verify compile_script forwards expression, URL, persistence flag and context id."""
    source = 'function test() { return 42; }'
    url = 'https://example.com/script.js'

    command = RuntimeCommands.compile_script(
        expression=source,
        source_url=url,
        persist_script=True,
        execution_context_id='ctx123',
    )

    assert command['method'] == RuntimeMethod.COMPILE_SCRIPT
    params = command['params']
    assert params['expression'] == source
    assert params['sourceURL'] == url
    assert params['persistScript'] is True
    assert params['executionContextId'] == 'ctx123'


def test_disable():
    """Verify disable yields the DISABLE method and carries no 'params' entry."""
    command = RuntimeCommands.disable()

    assert command['method'] == RuntimeMethod.DISABLE
    assert 'params' not in command


def test_enable():
    """Verify enable yields the ENABLE method and carries no 'params' entry."""
    command = RuntimeCommands.enable()

    assert command['method'] == RuntimeMethod.ENABLE
    assert 'params' not in command


def test_evaluate_minimal():
    """Verify evaluate with only an expression forwards that expression."""
    source = '2 + 2'
    command = RuntimeCommands.evaluate(expression=source)

    assert command['method'] == RuntimeMethod.EVALUATE
    assert command['params']['expression'] == source


def test_evaluate_with_basic_params():
    """Verify evaluate forwards the expression plus return_by_value and silent flags."""
    source = 'document.title'
    command = RuntimeCommands.evaluate(expression=source, return_by_value=True, silent=False)

    assert command['method'] == RuntimeMethod.EVALUATE
    params = command['params']
    assert params['expression'] == source
    assert params['returnByValue'] is True
    assert params['silent'] is False


def test_evaluate_with_all_params():
    """Verify evaluate forwards every supplied argument under its CDP key."""
    source = 'window.location.href'
    serialization = {'serialization': 'json', 'maxDepth': 3}

    command = RuntimeCommands.evaluate(
        expression=source,
        object_group='testGroup',
        include_command_line_api=True,
        silent=False,
        context_id='ctx123',
        return_by_value=False,
        generate_preview=True,
        user_gesture=False,
        await_promise=True,
        throw_on_side_effect=False,
        timeout=5000.0,
        disable_breaks=True,
        repl_mode=False,
        allow_unsafe_eval_blocked_by_csp=False,
        unique_context_id='unique456',
        serialization_options=serialization,
    )

    assert command['method'] == RuntimeMethod.EVALUATE

    # Read the payload only after the method check so a failure surfaces in the same order.
    params = command['params']
    assert params['expression'] == source
    assert params['objectGroup'] == 'testGroup'
    assert params['includeCommandLineAPI'] is True
    assert params['silent'] is False
    assert params['contextId'] == 'ctx123'
    assert params['returnByValue'] is False
    assert params['generatePreview'] is True
    assert params['userGesture'] is False
    assert params['awaitPromise'] is True
    assert params['throwOnSideEffect'] is False
    assert params['timeout'] == 5000.0
    assert params['disableBreaks'] is True
    assert params['replMode'] is False
    assert params['allowUnsafeEvalBlockedByCSP'] is False
    assert params['uniqueContextId'] == 'unique456'
    assert params['serializationOptions'] == serialization


def test_get_properties_minimal():
    """Verify get_properties with only an object id forwards that id."""
    target_object = 'obj123'
    command = RuntimeCommands.get_properties(object_id=target_object)

    assert command['method'] == RuntimeMethod.GET_PROPERTIES
    assert command['params']['objectId'] == target_object


def test_get_properties_with_all_params():
    """Verify get_properties forwards the object id and all four boolean options."""
    command = RuntimeCommands.get_properties(
        object_id='obj123',
        own_properties=True,
        accessor_properties_only=False,
        generate_preview=True,
        non_indexed_properties_only=False,
    )

    assert command['method'] == RuntimeMethod.GET_PROPERTIES
    params = command['params']
    assert params['objectId'] == 'obj123'
    assert params['ownProperties'] is True
    assert params['accessorPropertiesOnly'] is False
    assert params['generatePreview'] is True
    assert params['nonIndexedPropertiesOnly'] is False


def test_global_lexical_scope_names_minimal():
    """Verify global_lexical_scope_names without arguments yields empty params."""
    command = RuntimeCommands.global_lexical_scope_names()

    assert command['method'] == RuntimeMethod.GLOBAL_LEXICAL_SCOPE_NAMES
    params = command['params']
    assert params == {}


def test_global_lexical_scope_names_with_context():
    """Verify global_lexical_scope_names forwards the execution context id."""
    context = 'ctx123'
    command = RuntimeCommands.global_lexical_scope_names(execution_context_id=context)

    assert command['method'] == RuntimeMethod.GLOBAL_LEXICAL_SCOPE_NAMES
    assert command['params']['executionContextId'] == context


def test_query_objects_minimal():
    """Verify query_objects with only a prototype object id forwards that id."""
    prototype = 'proto123'
    command = RuntimeCommands.query_objects(prototype_object_id=prototype)

    assert command['method'] == RuntimeMethod.QUERY_OBJECTS
    assert command['params']['prototypeObjectId'] == prototype


def test_query_objects_with_group():
    """Verify query_objects forwards both the prototype object id and the object group."""
    command = RuntimeCommands.query_objects(prototype_object_id='proto123', object_group='testGroup')

    assert command['method'] == RuntimeMethod.QUERY_OBJECTS
    params = command['params']
    assert params['prototypeObjectId'] == 'proto123'
    assert params['objectGroup'] == 'testGroup'


def test_release_object():
    """Verify release_object forwards the object id."""
    target_object = 'obj123'
    command = RuntimeCommands.release_object(object_id=target_object)

    assert command['method'] == RuntimeMethod.RELEASE_OBJECT
    assert command['params']['objectId'] == target_object


def test_release_object_group():
    """Verify release_object_group forwards the object group name."""
    group = 'testGroup'
    command = RuntimeCommands.release_object_group(object_group=group)

    assert command['method'] == RuntimeMethod.RELEASE_OBJECT_GROUP
    assert command['params']['objectGroup'] == group


def test_remove_binding():
    """Verify remove_binding forwards the binding name."""
    binding = 'testBinding'
    command = RuntimeCommands.remove_binding(name=binding)

    assert command['method'] == RuntimeMethod.REMOVE_BINDING
    assert command['params']['name'] == binding


def test_run_script_minimal():
    """Verify run_script with only a script id forwards that id."""
    script = 'script123'
    command = RuntimeCommands.run_script(script_id=script)

    assert command['method'] == RuntimeMethod.RUN_SCRIPT
    assert command['params']['scriptId'] == script


def test_run_script_with_all_params():
    """Verify run_script forwards every supplied argument under its CDP key."""
    command = RuntimeCommands.run_script(
        script_id='script123',
        execution_context_id='ctx456',
        object_group='testGroup',
        silent=True,
        include_command_line_api=False,
        return_by_value=True,
        generate_preview=False,
        await_promise=True,
    )

    assert command['method'] == RuntimeMethod.RUN_SCRIPT
    params = command['params']
    assert params['scriptId'] == 'script123'
    assert params['executionContextId'] == 'ctx456'
    assert params['objectGroup'] == 'testGroup'
    assert params['silent'] is True
    assert params['includeCommandLineAPI'] is False
    assert params['returnByValue'] is True
    assert params['generatePreview'] is False
    assert params['awaitPromise'] is True


def test_set_async_call_stack_depth():
    """Verify set_async_call_stack_depth forwards the maximum depth."""
    depth = 10
    command = RuntimeCommands.set_async_call_stack_depth(max_depth=depth)

    assert command['method'] == RuntimeMethod.SET_ASYNC_CALL_STACK_DEPTH
    assert command['params']['maxDepth'] == depth


def test_set_custom_object_formatter_enabled():
    """Verify set_custom_object_formatter_enabled forwards the enabled flag."""
    command = RuntimeCommands.set_custom_object_formatter_enabled(enabled=True)

    assert command['method'] == RuntimeMethod.SET_CUSTOM_OBJECT_FORMATTER_ENABLED
    params = command['params']
    assert params['enabled'] is True


def test_set_max_call_stack_size_to_capture():
    """Verify set_max_call_stack_size_to_capture forwards the requested size."""
    stack_size = 100
    command = RuntimeCommands.set_max_call_stack_size_to_capture(size=stack_size)

    assert command['method'] == RuntimeMethod.SET_MAX_CALL_STACK_SIZE_TO_CAPTURE
    assert command['params']['size'] == stack_size


def test_evaluate_simple_expression():
    """Verify evaluate forwards a simple arithmetic expression unchanged."""
    source = 'Math.PI * 2'
    command = RuntimeCommands.evaluate(expression=source)

    assert command['method'] == RuntimeMethod.EVALUATE
    assert command['params']['expression'] == source


def test_call_function_on_with_arguments():
    """Verify call_function_on forwards the argument list and return_by_value flag."""
    declaration = 'function(a, b) { return a * b; }'
    call_args = [{'value': 10}, {'value': 20}]

    command = RuntimeCommands.call_function_on(
        function_declaration=declaration,
        object_id='obj123',
        arguments=call_args,
        return_by_value=True,
    )

    assert command['method'] == RuntimeMethod.CALL_FUNCTION_ON
    params = command['params']
    assert params['functionDeclaration'] == declaration
    assert params['objectId'] == 'obj123'
    assert params['arguments'] == call_args
    assert params['returnByValue'] is True


def test_get_properties_own_only():
    """Verify get_properties forwards own_properties=True and generate_preview=False."""
    command = RuntimeCommands.get_properties(
        object_id='obj123', own_properties=True, generate_preview=False
    )

    assert command['method'] == RuntimeMethod.GET_PROPERTIES
    params = command['params']
    assert params['objectId'] == 'obj123'
    assert params['ownProperties'] is True
    assert params['generatePreview'] is False


def test_evaluate_with_context():
    """Verify evaluate forwards the context id and the command-line API flag."""
    source = 'this.document.title'
    command = RuntimeCommands.evaluate(
        expression=source, context_id='ctx123', include_command_line_api=True
    )

    assert command['method'] == RuntimeMethod.EVALUATE
    params = command['params']
    assert params['expression'] == source
    assert params['contextId'] == 'ctx123'
    assert params['includeCommandLineAPI'] is True


def test_compile_script_with_source_url():
    """Verify compile_script forwards a custom-scheme source URL and persist_script=False."""
    source = 'const x = 42; console.log(x);'
    url = 'test://script.js'
    command = RuntimeCommands.compile_script(expression=source, source_url=url, persist_script=False)

    assert command['method'] == RuntimeMethod.COMPILE_SCRIPT
    params = command['params']
    assert params['expression'] == source
    assert params['sourceURL'] == url
    assert params['persistScript'] is False


================================================
FILE: tests/test_commands/test_storage_commands.py
================================================
"""
Tests for StorageCommands class.

This module contains comprehensive tests for all StorageCommands methods,
verifying that they generate the correct CDP commands with proper parameters.
"""

from pydoll.commands.storage_commands import StorageCommands
from pydoll.protocol.storage.methods import StorageMethod


def test_clear_cookies_minimal():
    """Verify clear_cookies without arguments yields empty params."""
    command = StorageCommands.clear_cookies()

    assert command['method'] == StorageMethod.CLEAR_COOKIES
    params = command['params']
    assert params == {}


def test_clear_cookies_with_context():
    """Verify clear_cookies forwards the browser context id."""
    context = 'context123'
    command = StorageCommands.clear_cookies(browser_context_id=context)

    assert command['method'] == StorageMethod.CLEAR_COOKIES
    assert command['params']['browserContextId'] == context


def test_clear_data_for_origin():
    """Verify clear_data_for_origin forwards the origin and storage types string."""
    site = 'https://example.com'
    kinds = 'cookies,local_storage'
    command = StorageCommands.clear_data_for_origin(origin=site, storage_types=kinds)

    assert command['method'] == StorageMethod.CLEAR_DATA_FOR_ORIGIN
    params = command['params']
    assert params['origin'] == site
    assert params['storageTypes'] == kinds


def test_clear_data_for_storage_key():
    """Verify clear_data_for_storage_key forwards the storage key and storage types string."""
    key = 'storage_key_123'
    kinds = 'indexeddb,cache_storage'
    command = StorageCommands.clear_data_for_storage_key(storage_key=key, storage_types=kinds)

    assert command['method'] == StorageMethod.CLEAR_DATA_FOR_STORAGE_KEY
    params = command['params']
    assert params['storageKey'] == key
    assert params['storageTypes'] == kinds


def test_get_cookies_minimal():
    """Verify get_cookies without arguments yields empty params."""
    command = StorageCommands.get_cookies()

    assert command['method'] == StorageMethod.GET_COOKIES
    params = command['params']
    assert params == {}


def test_get_cookies_with_context():
    """Verify get_cookies forwards the browser context id."""
    context = 'context456'
    command = StorageCommands.get_cookies(browser_context_id=context)

    assert command['method'] == StorageMethod.GET_COOKIES
    assert command['params']['browserContextId'] == context


def test_get_storage_key_for_frame():
    """Verify get_storage_key_for_frame forwards the frame id."""
    frame = 'frame123'
    command = StorageCommands.get_storage_key_for_frame(frame_id=frame)

    assert command['method'] == StorageMethod.GET_STORAGE_KEY_FOR_FRAME
    assert command['params']['frameId'] == frame


def test_get_usage_and_quota():
    """Verify get_usage_and_quota forwards the origin."""
    site = 'https://example.com'
    command = StorageCommands.get_usage_and_quota(origin=site)

    assert command['method'] == StorageMethod.GET_USAGE_AND_QUOTA
    assert command['params']['origin'] == site


def test_set_cookies_minimal():
    """Verify set_cookies forwards a two-cookie list unchanged."""
    first = {'name': 'cookie1', 'value': 'value1', 'domain': 'example.com'}
    second = {'name': 'cookie2', 'value': 'value2', 'domain': 'example.com'}
    jar = [first, second]

    command = StorageCommands.set_cookies(cookies=jar)

    assert command['method'] == StorageMethod.SET_COOKIES
    assert command['params']['cookies'] == jar


def test_set_cookies_with_context():
    """Verify set_cookies forwards the cookie list together with the browser context id."""
    jar = [{'name': 'test', 'value': 'value', 'domain': 'test.com'}]
    context = 'context789'

    command = StorageCommands.set_cookies(cookies=jar, browser_context_id=context)

    assert command['method'] == StorageMethod.SET_COOKIES
    params = command['params']
    assert params['cookies'] == jar
    assert params['browserContextId'] == context


def test_set_protected_audience_k_anonymity():
    """Verify set_protected_audience_k_anonymity forwards owner, name and hashes."""
    hash_list = ['hash1', 'hash2', 'hash3']

    command = StorageCommands.set_protected_audience_k_anonymity(
        owner='https://example.com', name='test_group', hashes=hash_list
    )

    assert command['method'] == StorageMethod.SET_PROTECTED_AUDIENCE_K_ANONYMITY
    params = command['params']
    assert params['owner'] == 'https://example.com'
    assert params['name'] == 'test_group'
    assert params['hashes'] == hash_list


def test_track_cache_storage_for_origin():
    """Verify track_cache_storage_for_origin forwards the origin."""
    site = 'https://example.com'
    command = StorageCommands.track_cache_storage_for_origin(origin=site)

    assert command['method'] == StorageMethod.TRACK_CACHE_STORAGE_FOR_ORIGIN
    assert command['params']['origin'] == site


def test_track_cache_storage_for_storage_key():
    """Verify track_cache_storage_for_storage_key forwards the storage key."""
    key = 'key123'
    command = StorageCommands.track_cache_storage_for_storage_key(storage_key=key)

    assert command['method'] == StorageMethod.TRACK_CACHE_STORAGE_FOR_STORAGE_KEY
    assert command['params']['storageKey'] == key


def test_track_indexed_db_for_origin():
    """Verify track_indexed_db_for_origin forwards the origin."""
    site = 'https://test.com'
    command = StorageCommands.track_indexed_db_for_origin(origin=site)

    assert command['method'] == StorageMethod.TRACK_INDEXED_DB_FOR_ORIGIN
    assert command['params']['origin'] == site


def test_track_indexed_db_for_storage_key():
    """Verify track_indexed_db_for_storage_key forwards the storage key."""
    key = 'key456'
    command = StorageCommands.track_indexed_db_for_storage_key(storage_key=key)

    assert command['method'] == StorageMethod.TRACK_INDEXED_DB_FOR_STORAGE_KEY
    assert command['params']['storageKey'] == key


def test_untrack_cache_storage_for_origin():
    """Verify untrack_cache_storage_for_origin forwards the origin."""
    site = 'https://example.org'
    command = StorageCommands.untrack_cache_storage_for_origin(origin=site)

    assert command['method'] == StorageMethod.UNTRACK_CACHE_STORAGE_FOR_ORIGIN
    assert command['params']['origin'] == site


def test_untrack_cache_storage_for_storage_key():
    """Verify untrack_cache_storage_for_storage_key forwards the storage key."""
    key = 'key789'
    command = StorageCommands.untrack_cache_storage_for_storage_key(storage_key=key)

    assert command['method'] == StorageMethod.UNTRACK_CACHE_STORAGE_FOR_STORAGE_KEY
    assert command['params']['storageKey'] == key


def test_untrack_indexed_db_for_origin():
    """Verify untrack_indexed_db_for_origin forwards the origin."""
    site = 'https://test.org'
    command = StorageCommands.untrack_indexed_db_for_origin(origin=site)

    assert command['method'] == StorageMethod.UNTRACK_INDEXED_DB_FOR_ORIGIN
    assert command['params']['origin'] == site


def test_untrack_indexed_db_for_storage_key():
    """Verify untrack_indexed_db_for_storage_key forwards the storage key."""
    key = 'key000'
    command = StorageCommands.untrack_indexed_db_for_storage_key(storage_key=key)

    assert command['method'] == StorageMethod.UNTRACK_INDEXED_DB_FOR_STORAGE_KEY
    assert command['params']['storageKey'] == key


def test_clear_shared_storage_entries():
    """Verify clear_shared_storage_entries forwards the owner origin."""
    owner = 'https://owner.com'
    command = StorageCommands.clear_shared_storage_entries(owner_origin=owner)

    assert command['method'] == StorageMethod.CLEAR_SHARED_STORAGE_ENTRIES
    assert command['params']['ownerOrigin'] == owner


def test_clear_trust_tokens():
    """Verify clear_trust_tokens forwards the issuer origin."""
    issuer = 'https://issuer.com'
    command = StorageCommands.clear_trust_tokens(issuer_origin=issuer)

    assert command['method'] == StorageMethod.CLEAR_TRUST_TOKENS
    assert command['params']['issuerOrigin'] == issuer


def test_delete_shared_storage_entry():
    """Verify delete_shared_storage_entry forwards the owner origin and entry key."""
    owner = 'https://owner.com'
    entry_key = 'test_key'
    command = StorageCommands.delete_shared_storage_entry(owner_origin=owner, key=entry_key)

    assert command['method'] == StorageMethod.DELETE_SHARED_STORAGE_ENTRY
    params = command['params']
    assert params['ownerOrigin'] == owner
    assert params['key'] == entry_key


def test_delete_storage_bucket():
    """Verify delete_storage_bucket forwards the bucket descriptor unchanged."""
    bucket_spec = {'storageKey': 'key123', 'name': 'test_bucket'}

    command = StorageCommands.delete_storage_bucket(bucket=bucket_spec)

    assert command['method'] == StorageMethod.DELETE_STORAGE_BUCKET
    assert command['params']['bucket'] == bucket_spec


def test_get_affected_urls_for_third_party_cookie_metadata():
    """Verify the command forwards the first-party URL and the third-party URL list."""
    first_party = 'https://first.com'
    third_parties = ['https://third1.com', 'https://third2.com']

    command = StorageCommands.get_affected_urls_for_third_party_cookie_metadata(
        first_party_url=first_party, third_party_urls=third_parties
    )

    assert command['method'] == StorageMethod.GET_AFFECTED_URLS_FOR_THIRD_PARTY_COOKIE_METADATA
    params = command['params']
    assert params['firstPartyUrl'] == first_party
    assert params['thirdPartyUrls'] == third_parties


def test_get_interest_group_details():
    """Verify get_interest_group_details forwards the owner origin and group name."""
    owner = 'https://owner.com'
    group_name = 'interest_group_1'
    command = StorageCommands.get_interest_group_details(owner_origin=owner, name=group_name)

    assert command['method'] == StorageMethod.GET_INTEREST_GROUP_DETAILS
    params = command['params']
    assert params['ownerOrigin'] == owner
    assert params['name'] == group_name


def test_get_related_website_sets():
    """Verify get_related_website_sates maps to GET_RELATED_WEBSITE_SETS (method only)."""
    command = StorageCommands.get_related_website_sets()
    method = command['method']
    assert method == StorageMethod.GET_RELATED_WEBSITE_SETS


def test_get_shared_storage_entries():
    """Verify get_shared_storage_entries forwards the owner origin."""
    owner = 'https://shared.com'
    command = StorageCommands.get_shared_storage_entries(owner_origin=owner)

    assert command['method'] == StorageMethod.GET_SHARED_STORAGE_ENTRIES
    assert command['params']['ownerOrigin'] == owner


def test_get_shared_storage_metadata():
    """Verify get_shared_storage_metadata forwards the owner origin."""
    owner = 'https://metadata.com'
    command = StorageCommands.get_shared_storage_metadata(owner_origin=owner)

    assert command['method'] == StorageMethod.GET_SHARED_STORAGE_METADATA
    assert command['params']['ownerOrigin'] == owner


def test_get_trust_tokens():
    """Verify get_trust_tokens yields the GET_TRUST_TOKENS method with empty params."""
    command = StorageCommands.get_trust_tokens()

    assert command['method'] == StorageMethod.GET_TRUST_TOKENS
    params = command['params']
    assert params == {}


def test_override_quota_for_origin_minimal():
    """Verify override_quota_for_origin with only an origin forwards that origin."""
    site = 'https://quota.com'
    command = StorageCommands.override_quota_for_origin(origin=site)

    assert command['method'] == StorageMethod.OVERRIDE_QUOTA_FOR_ORIGIN
    assert command['params']['origin'] == site


def test_override_quota_for_origin_with_size():
    """Verify override_quota_for_origin forwards both the origin and the quota size."""
    site = 'https://quota.com'
    quota = 1024000.0
    command = StorageCommands.override_quota_for_origin(origin=site, quota_size=quota)

    assert command['method'] == StorageMethod.OVERRIDE_QUOTA_FOR_ORIGIN
    params = command['params']
    assert params['origin'] == site
    assert params['quotaSize'] == quota


def test_reset_shared_storage_budget():
    """Verify reset_shared_storage_budget forwards the owner origin."""
    owner = 'https://budget.com'
    command = StorageCommands.reset_shared_storage_budget(owner_origin=owner)

    assert command['method'] == StorageMethod.RESET_SHARED_STORAGE_BUDGET
    assert command['params']['ownerOrigin'] == owner


def test_run_bounce_tracking_mitigations():
    """Verify run_bounce_tracking_mitigations yields its method with empty params."""
    command = StorageCommands.run_bounce_tracking_mitigations()

    assert command['method'] == StorageMethod.RUN_BOUNCE_TRACKING_MITIGATIONS
    params = command['params']
    assert params == {}


def test_send_pending_attribution_reports():
    """Verify send_pending_attribution_reports yields its method with empty params."""
    command = StorageCommands.send_pending_attribution_reports()

    assert command['method'] == StorageMethod.SEND_PENDING_ATTRIBUTION_REPORTS
    params = command['params']
    assert params == {}


def test_set_attribution_reporting_local_testing_mode():
    """Verify set_attribution_reporting_local_testing_mode forwards enabled=True."""
    command = StorageCommands.set_attribution_reporting_local_testing_mode(enabled=True)

    assert command['method'] == StorageMethod.SET_ATTRIBUTION_REPORTING_LOCAL_TESTING_MODE
    params = command['params']
    assert params['enabled'] is True


def test_set_attribution_reporting_tracking():
    """Verify set_attribution_reporting_tracking forwards enable=False."""
    command = StorageCommands.set_attribution_reporting_tracking(enable=False)

    assert command['method'] == StorageMethod.SET_ATTRIBUTION_REPORTING_TRACKING
    params = command['params']
    assert params['enable'] is False


def test_set_interest_group_auction_tracking():
    """Verify set_interest_group_auction_tracking forwards enable=True."""
    command = StorageCommands.set_interest_group_auction_tracking(enable=True)

    assert command['method'] == StorageMethod.SET_INTEREST_GROUP_AUCTION_TRACKING
    params = command['params']
    assert params['enable'] is True


def test_set_interest_group_tracking():
    """Verify set_interest_group_tracking forwards enable=False."""
    command = StorageCommands.set_interest_group_tracking(enable=False)

    assert command['method'] == StorageMethod.SET_INTEREST_GROUP_TRACKING
    params = command['params']
    assert params['enable'] is False


def test_set_shared_storage_entry_minimal():
    """Verify set_shared_storage_entry forwards the owner origin, key and value."""
    owner = 'https://storage.com'
    entry_key = 'test_key'
    entry_value = 'test_value'

    command = StorageCommands.set_shared_storage_entry(
        owner_origin=owner, key=entry_key, value=entry_value
    )

    assert command['method'] == StorageMethod.SET_SHARED_STORAGE_ENTRY
    params = command['params']
    assert params['ownerOrigin'] == owner
    assert params['key'] == entry_key
    assert params['value'] == entry_value


def test_set_shared_storage_entry_with_ignore():
    """Verify set_shared_storage_entry also forwards ignore_if_present=True."""
    owner = 'https://storage.com'
    entry_key = 'test_key'
    entry_value = 'test_value'

    command = StorageCommands.set_shared_storage_entry(
        owner_origin=owner, key=entry_key, value=entry_value, ignore_if_present=True
    )

    assert command['method'] == StorageMethod.SET_SHARED_STORAGE_ENTRY
    params = command['params']
    assert params['ownerOrigin'] == owner
    assert params['key'] == entry_key
    assert params['value'] == entry_value
    assert params['ignoreIfPresent'] is True


def test_set_shared_storage_tracking():
    """Verify set_shared_storage_tracking forwards enable=True."""
    command = StorageCommands.set_shared_storage_tracking(enable=True)

    assert command['method'] == StorageMethod.SET_SHARED_STORAGE_TRACKING
    params = command['params']
    assert params['enable'] is True


def test_set_storage_bucket_tracking():
    """Verify set_storage_bucket_tracking forwards the storage key and enable=False."""
    key = 'bucket_key_123'
    command = StorageCommands.set_storage_bucket_tracking(storage_key=key, enable=False)

    assert command['method'] == StorageMethod.SET_STORAGE_BUCKET_TRACKING
    params = command['params']
    assert params['storageKey'] == key
    assert params['enable'] is False


def test_clear_data_for_origin_all_types():
    """Verify clear_data_for_origin forwards the 'all' storage types value."""
    site = 'https://example.com'
    kinds = 'all'
    command = StorageCommands.clear_data_for_origin(origin=site, storage_types=kinds)

    assert command['method'] == StorageMethod.CLEAR_DATA_FOR_ORIGIN
    params = command['params']
    assert params['origin'] == site
    assert params['storageTypes'] == kinds


def test_set_cookies_complex():
    """Verify set_cookies forwards a cookie carrying path, secure, httpOnly and sameSite."""
    session_cookie = {
        'name': 'session_id',
        'value': 'abc123',
        'domain': 'example.com',
        'path': '/',
        'secure': True,
        'httpOnly': True,
        'sameSite': 'Strict',
    }
    jar = [session_cookie]

    command = StorageCommands.set_cookies(cookies=jar)

    assert command['method'] == StorageMethod.SET_COOKIES
    assert command['params']['cookies'] == jar


================================================
FILE: tests/test_commands/test_target_commands.py
================================================
"""
Tests for TargetCommands class.

This module contains comprehensive tests for all TargetCommands methods,
verifying that they generate the correct CDP commands with proper parameters.
"""

from pydoll.commands.target_commands import TargetCommands
from pydoll.protocol.browser.types import WindowState
from pydoll.protocol.target.methods import TargetMethod


def test_activate_target():
    """Verify activate_target forwards the target id."""
    target = 'target123'
    command = TargetCommands.activate_target(target_id=target)

    assert command['method'] == TargetMethod.ACTIVATE_TARGET
    assert command['params']['targetId'] == target


def test_attach_to_target_minimal():
    """Verify attach_to_target with only a target id forwards that id."""
    target = 'target456'
    command = TargetCommands.attach_to_target(target_id=target)

    assert command['method'] == TargetMethod.ATTACH_TO_TARGET
    assert command['params']['targetId'] == target


def test_attach_to_target_with_flatten():
    """Verify attach_to_target forwards the target id together with flatten=True."""
    target = 'target456'
    command = TargetCommands.attach_to_target(target_id=target, flatten=True)

    assert command['method'] == TargetMethod.ATTACH_TO_TARGET
    params = command['params']
    assert params['targetId'] == target
    assert params['flatten'] is True


def test_close_target():
    """Verify close_target forwards the target id."""
    target = 'target789'
    command = TargetCommands.close_target(target_id=target)

    assert command['method'] == TargetMethod.CLOSE_TARGET
    assert command['params']['targetId'] == target


def test_create_browser_context_minimal():
    """Verify create_browser_context without arguments yields empty params."""
    command = TargetCommands.create_browser_context()

    assert command['method'] == TargetMethod.CREATE_BROWSER_CONTEXT
    params = command['params']
    assert params == {}


def test_create_browser_context_with_all_params():
    """Verify create_browser_context forwards dispose flag, proxy settings and origins."""
    proxy = 'socks5://192.168.1.100:1080'
    bypass = '*.example.com,localhost'
    trusted_origins = ['https://example.com', 'https://test.com']

    command = TargetCommands.create_browser_context(
        dispose_on_detach=True,
        proxy_server=proxy,
        proxy_bypass_list=bypass,
        origins_with_universal_network_access=trusted_origins,
    )

    assert command['method'] == TargetMethod.CREATE_BROWSER_CONTEXT
    params = command['params']
    assert params['disposeOnDetach'] is True
    assert params['proxyServer'] == proxy
    assert params['proxyBypassList'] == bypass
    assert params['originsWithUniversalNetworkAccess'] == trusted_origins


def test_create_target_minimal():
    """Verify create_target with only a URL forwards that URL."""
    page_url = 'https://example.com'
    command = TargetCommands.create_target(url=page_url)

    assert command['method'] == TargetMethod.CREATE_TARGET
    assert command['params']['url'] == page_url


def test_create_target_with_position_and_size():
    """Verify create_target forwards the URL along with left, top, width and height."""
    page_url = 'https://test.com'
    command = TargetCommands.create_target(url=page_url, left=100, top=200, width=800, height=600)

    assert command['method'] == TargetMethod.CREATE_TARGET
    params = command['params']
    assert params['url'] == page_url
    assert params['left'] == 100
    assert params['top'] == 200
    assert params['width'] == 800
    assert params['height'] == 600


def test_create_target_with_window_state():
    """Verify create_target forwards the URL and the MAXIMIZED window state."""
    page_url = 'https://example.com'
    command = TargetCommands.create_target(url=page_url, window_state=WindowState.MAXIMIZED)

    assert command['method'] == TargetMethod.CREATE_TARGET
    params = command['params']
    assert params['url'] == page_url
    assert params['windowState'] == WindowState.MAXIMIZED


def test_create_target_with_all_params():
    """Verify create_target forwards every supplied argument under its CDP key."""
    page_url = 'https://full-test.com'

    command = TargetCommands.create_target(
        url=page_url,
        left=50,
        top=100,
        width=1200,
        height=800,
        window_state=WindowState.NORMAL,
        browser_context_id='context123',
        enable_begin_frame_control=True,
        new_window=False,
        background=True,
        for_tab=False,
        hidden=True,
    )

    assert command['method'] == TargetMethod.CREATE_TARGET

    # Read the payload only after the method check so a failure surfaces in the same order.
    params = command['params']
    assert params['url'] == page_url
    assert params['left'] == 50
    assert params['top'] == 100
    assert params['width'] == 1200
    assert params['height'] == 800
    assert params['windowState'] == WindowState.NORMAL
    assert params['browserContextId'] == 'context123'
    assert params['enableBeginFrameControl'] is True
    assert params['newWindow'] is False
    assert params['background'] is True
    assert params['forTab'] is False
    assert params['hidden'] is True


def test_detach_from_target_minimal():
    """detach_from_target called with no arguments produces empty params."""
    command = TargetCommands.detach_from_target()
    assert command['method'] == TargetMethod.DETACH_FROM_TARGET
    assert command['params'] == {}


def test_detach_from_target_with_session():
    """detach_from_target forwards ``session_id`` as ``sessionId``."""
    command = TargetCommands.detach_from_target(session_id='session123')
    assert command['method'] == TargetMethod.DETACH_FROM_TARGET

    params = command['params']
    assert params['sessionId'] == 'session123'


def test_dispose_browser_context():
    """dispose_browser_context forwards the context id as ``browserContextId``."""
    command = TargetCommands.dispose_browser_context(
        browser_context_id='context456',
    )
    assert command['method'] == TargetMethod.DISPOSE_BROWSER_CONTEXT

    params = command['params']
    assert params['browserContextId'] == 'context456'


def test_get_browser_contexts():
    """get_browser_contexts builds a command with empty params."""
    command = TargetCommands.get_browser_contexts()
    assert command['method'] == TargetMethod.GET_BROWSER_CONTEXTS
    assert command['params'] == {}


def test_get_targets_minimal():
    """get_targets called with no arguments produces empty params."""
    command = TargetCommands.get_targets()
    assert command['method'] == TargetMethod.GET_TARGETS
    assert command['params'] == {}


def test_get_targets_with_filter():
    """get_targets passes the ``filter`` list through to the params."""
    target_filter = [{'type': 'page'}, {'type': 'worker'}]
    command = TargetCommands.get_targets(filter=target_filter)
    assert command['method'] == TargetMethod.GET_TARGETS

    params = command['params']
    assert params['filter'] == target_filter


def test_set_auto_attach_minimal():
    """set_auto_attach with only ``auto_attach`` sets ``autoAttach`` to True."""
    command = TargetCommands.set_auto_attach(auto_attach=True)
    assert command['method'] == TargetMethod.SET_AUTO_ATTACH

    params = command['params']
    assert params['autoAttach'] is True


def test_set_auto_attach_with_all_params():
    """set_auto_attach maps every supplied keyword onto its camelCase param."""
    target_filter = [{'type': 'page'}]
    command = TargetCommands.set_auto_attach(
        auto_attach=False,
        wait_for_debugger_on_start=True,
        flatten=False,
        filter=target_filter,
    )
    assert command['method'] == TargetMethod.SET_AUTO_ATTACH

    params = command['params']
    # Flags are compared by identity, the filter list by equality.
    assert params['autoAttach'] is False
    assert params['waitForDebuggerOnStart'] is True
    assert params['flatten'] is False
    assert params['filter'] == target_filter


def test_set_discover_targets_minimal():
    """set_discover_targets with only ``discover`` sets the flag to True."""
    command = TargetCommands.set_discover_targets(discover=True)
    assert command['method'] == TargetMethod.SET_DISCOVER_TARGETS

    params = command['params']
    assert params['discover'] is True


def test_set_discover_targets_with_filter():
    """set_discover_targets forwards both ``discover`` and ``filter``."""
    target_filter = [{'type': 'service_worker'}]
    command = TargetCommands.set_discover_targets(
        discover=False,
        filter=target_filter,
    )
    assert command['method'] == TargetMethod.SET_DISCOVER_TARGETS

    params = command['params']
    assert params['discover'] is False
    assert params['filter'] == target_filter


def test_attach_to_browser_target():
    """attach_to_browser_target forwards ``session_id`` as ``sessionId``."""
    command = TargetCommands.attach_to_browser_target(
        session_id='browser_session123',
    )
    assert command['method'] == TargetMethod.ATTACH_TO_BROWSER_TARGET

    params = command['params']
    assert params['sessionId'] == 'browser_session123'


def test_get_target_info():
    """get_target_info forwards ``target_id`` as ``targetId``."""
    command = TargetCommands.get_target_info(target_id='info_target123')
    assert command['method'] == TargetMethod.GET_TARGET_INFO

    params = command['params']
    assert params['targetId'] == 'info_target123'


def test_set_remote_locations():
    """set_remote_locations passes the list of host/port entries through."""
    remote_locations = [
        {'host': 'remote1.example.com', 'port': 9222},
        {'host': 'remote2.example.com', 'port': 9223},
    ]
    command = TargetCommands.set_remote_locations(locations=remote_locations)
    assert command['method'] == TargetMethod.SET_REMOTE_LOCATIONS

    params = command['params']
    assert params['locations'] == remote_locations


def test_create_target_about_blank():
    """create_target keeps an empty URL as-is.

    The CDP ``Target.createTarget`` documentation describes an empty URL
    string as meaning about:blank, hence the test name.
    """
    command = TargetCommands.create_target(url='')
    assert command['method'] == TargetMethod.CREATE_TARGET

    params = command['params']
    assert params['url'] == ''


def test_create_target_new_window():
    """create_target forwards ``new_window`` together with the window size."""
    command = TargetCommands.create_target(
        url='https://newwindow.com',
        new_window=True,
        width=1024,
        height=768,
    )
    assert command['method'] == TargetMethod.CREATE_TARGET

    params = command['params']
    assert params['url'] == 'https://newwindow.com'
    assert params['newWindow'] is True
    assert params['width'] == 1024
    assert params['height'] == 768


def test_create_target_background():
    """create_target forwards the ``background`` flag."""
    command = TargetCommands.create_target(
        url='https://background.com',
        background=True,
    )
    assert command['method'] == TargetMethod.CREATE_TARGET

    params = command['params']
    assert params['url'] == 'https://background.com'
    assert params['background'] is True


def test_create_target_for_tab():
    """create_target forwards ``for_tab`` as ``forTab``."""
    command = TargetCommands.create_target(
        url='https://tab.com',
        for_tab=True,
    )
    assert command['method'] == TargetMethod.CREATE_TARGET

    params = command['params']
    assert params['url'] == 'https://tab.com'
    assert params['forTab'] is True


def test_create_target_hidden():
    """create_target forwards the ``hidden`` flag."""
    command = TargetCommands.create_target(
        url='https://hidden.com',
        hidden=True,
    )
    assert command['method'] == TargetMethod.CREATE_TARGET

    params = command['params']
    assert params['url'] == 'https://hidden.com'
    assert params['hidden'] is True


def test_create_browser_context_with_proxy():
    """create_browser_context forwards the proxy server and bypass list."""
    command = TargetCommands.create_browser_context(
        proxy_server='http://proxy.example.com:8080',
        proxy_bypass_list='localhost,127.0.0.1',
    )
    assert command['method'] == TargetMethod.CREATE_BROWSER_CONTEXT

    params = command['params']
    assert params['proxyServer'] == 'http://proxy.example.com:8080'
    assert params['proxyBypassList'] == 'localhost,127.0.0.1'


def test_create_target_with_context():
    """create_target forwards ``browser_context_id`` as ``browserContextId``."""
    command = TargetCommands.create_target(
        url='https://context-test.com',
        browser_context_id='isolated_context',
    )
    assert command['method'] == TargetMethod.CREATE_TARGET

    params = command['params']
    assert params['url'] == 'https://context-test.com'
    assert params['browserContextId'] == 'isolated_context'


def test_set_auto_attach_disabled():
    """set_auto_attach keeps explicit False values for both flags."""
    command = TargetCommands.set_auto_attach(
        auto_attach=False,
        wait_for_debugger_on_start=False,
    )
    assert command['method'] == TargetMethod.SET_AUTO_ATTACH

    params = command['params']
    assert params['autoAttach'] is False
    assert params['waitForDebuggerOnStart'] is False


================================================
FILE: tests/test_connection_handler.py
================================================
import asyncio
import json
from unittest.mock import AsyncMock, MagicMock

import pytest
import pytest_asyncio
import websockets
from websockets.protocol import State

from pydoll import exceptions
from pydoll.connection import ConnectionHandler


@pytest_asyncio.fixture
async def connection_handler():
    """Provide a ConnectionHandler whose websocket is a mock in the OPEN state."""
    open_socket = AsyncMock()
    open_socket.state = State.OPEN

    handler = ConnectionHandler(connection_port=9222)
    handler._ws_connection = open_socket
    return handler


@pytest_asyncio.fixture
async def connection_handler_closed():
    """Provide a ConnectionHandler whose mocked websocket is in the CLOSED state.

    The address resolver and connector are mocks as well, so no real
    network access is needed by tests using this fixture.
    """
    closed_socket = AsyncMock()
    closed_socket.state = State.CLOSED

    handler = ConnectionHandler(
        connection_port=9222,
        ws_address_resolver=AsyncMock(return_value='ws://localhost:9222'),
        ws_connector=AsyncMock(),
    )
    handler._ws_connection = closed_socket
    return handler


@pytest_asyncio.fixture
async def connection_handler_with_page_id():
    """Provide a closed-socket ConnectionHandler bound to page id ``ABCD``."""
    closed_socket = AsyncMock()
    closed_socket.state = State.CLOSED

    handler = ConnectionHandler(
        page_id='ABCD',
        connection_port=9222,
        ws_address_resolver=AsyncMock(return_value='ws://localhost:9222'),
        ws_connector=AsyncMock(),
    )
    handler._ws_connection = closed_socket
    return handler


@pytest.mark.asyncio
async def test_resolve_ws_address_priority_ws_address_over_port_and_page():
    """An explicit ``ws_address`` wins over the port, page id and resolver."""
    explicit_address = 'ws://host:9999/devtools/page/REAL'
    fallback_resolver = AsyncMock(
        return_value='ws://host:9333/devtools/browser/ALT'
    )
    handler = ConnectionHandler(
        connection_port=9333,
        page_id='SHOULD_NOT_BE_USED',
        ws_address=explicit_address,
        ws_address_resolver=fallback_resolver,
        ws_connector=AsyncMock(),
    )

    # The explicit address must be returned regardless of the other inputs.
    assert await handler._resolve_ws_address() == explicit_address


@pytest.mark.asyncio
async def test_ping_success(connection_handler):
    """ping() returns True when the websocket ping completes normally."""
    connection_handler._ws_connection.ping = AsyncMock()
    is_alive = await connection_handler.ping()
    assert is_alive is True


@pytest.mark.asyncio
async def test_ping_failure(connection_handler):
    """ping() returns False when the websocket ping raises."""
    failing_ping = AsyncMock(side_effect=Exception('Ping failed'))
    connection_handler._ws_connection.ping = failing_ping
    is_alive = await connection_handler.ping()
    assert is_alive is False


@pytest.mark.asyncio
async def test_execute_command_success(connection_handler):
    """execute_command returns the decoded JSON response of the command."""
    command = {'id': 1, 'method': 'SomeMethod'}
    raw_response = json.dumps({'id': 1, 'result': 'success'})

    connection_handler._ws_connection.send = AsyncMock()

    # Hand the handler a future that already holds the raw response.
    resolved_future = asyncio.Future()
    resolved_future.set_result(raw_response)
    connection_handler._command_manager.create_command_future = MagicMock(
        return_value=resolved_future
    )

    outcome = await connection_handler.execute_command(command)
    assert outcome == {'id': 1, 'result': 'success'}


@pytest.mark.asyncio
async def test_execute_command_timeout(connection_handler):
    """execute_command raises CommandExecutionTimeout if no response arrives."""
    command = {'id': 2, 'method': 'TimeoutMethod'}

    connection_handler._ws_connection.send = AsyncMock()
    # A future that is never resolved stands in for a missing response.
    never_resolved = MagicMock(return_value=asyncio.Future())
    connection_handler._command_manager.create_command_future = never_resolved

    with pytest.raises(exceptions.CommandExecutionTimeout):
        await connection_handler.execute_command(command, timeout=0.1)


@pytest.mark.asyncio
async def test_execute_command_connection_closed_exception(connection_handler):
    """A ConnectionClosed raised by send surfaces as WebSocketConnectionClosed."""
    closed_error = websockets.ConnectionClosed(
        1000, 'Normal Closure', rcvd_then_sent=True
    )
    connection_handler._ws_connection.send = AsyncMock(side_effect=closed_error)
    connection_handler._ws_connection.close = AsyncMock()

    # Stand-in receive task that reports it is still running.
    pending_task = AsyncMock(spec=asyncio.Task)
    pending_task.done = MagicMock(return_value=False)
    connection_handler._receive_task = pending_task

    command = {
        'id': 1,
        'method': 'SomeMethod',
    }
    with pytest.raises(exceptions.WebSocketConnectionClosed):
        await connection_handler.execute_command(command)


@pytest.mark.asyncio
async def test_register_callback(connection_handler):
    """register_callback returns the id produced by the events handler."""
    stub_register = MagicMock(return_value=123)
    connection_handler._events_handler.register_callback = stub_register

    registered_id = await connection_handler.register_callback(
        'event', lambda x: x
    )
    assert registered_id == 123


@pytest.mark.asyncio
async def test_remove_callback(connection_handler):
    """remove_callback returns the value reported by the events handler."""
    stub_remove = MagicMock(return_value=True)
    connection_handler._events_handler.remove_callback = stub_remove

    removed = await connection_handler.remove_callback(123)
    assert removed is True


@pytest.mark.asyncio
async def test_clear_callbacks(connection_handler):
    """clear_callbacks delegates once to the events handler and returns None."""
    stub_clear = MagicMock(return_value=None)
    connection_handler._events_handler.clear_callbacks = stub_clear

    outcome = await connection_handler.clear_callbacks()

    connection_handler._events_handler.clear_callbacks.assert_called_once()
    assert outcome is None


@pytest.mark.asyncio
async def test_close(connection_handler):
    """close() clears callbacks, closes the socket, and tolerates ConnectionClosed."""
    connection_handler._ws_connection.close = AsyncMock()
    connection_handler.clear_callbacks = AsyncMock()

    await connection_handler.close()

    connection_handler.clear_callbacks.assert_awaited_once()
    connection_handler._ws_connection.close.assert_awaited_once()

    # A second close on an already-closed socket must not raise.
    already_closed = websockets.ConnectionClosed(
        1000, 'Normal Closure', rcvd_then_sent=True
    )
    connection_handler._ws_connection.close.side_effect = already_closed
    await connection_handler.close()


@pytest.mark.asyncio
async def test_execute_command_connection_closed(connection_handler_closed):
    """execute_command reconnects through the connector when the socket is closed."""
    handler = connection_handler_closed

    # The connector hands back the fixture's mocked websocket on reconnect.
    reconnector = AsyncMock(return_value=handler._ws_connection)
    handler._ws_connector = reconnector

    command = {'id': 1, 'method': 'SomeMethod'}
    raw_response = json.dumps({'id': 1, 'result': 'success'})

    handler._ws_connection.send = AsyncMock()
    resolved_future = asyncio.Future()
    resolved_future.set_result(raw_response)
    handler._command_manager.create_command_future = MagicMock(
        return_value=resolved_future
    )

    outcome = await handler.execute_command(command)

    reconnector.assert_awaited_once()  # Checks that a reconnect was attempted
    handler._ws_connection.send.assert_awaited_once_with(json.dumps(command))
    assert outcome == {'id': 1, 'result': 'success'}


@pytest.mark.asyncio
async def test__is_command_response_true(connection_handler):
    """A message carrying an integer ``id`` is recognized as a command response."""
    message = {'id': 1, 'method': 'SomeMethod'}
    verdict = connection_handler._is_command_response(message)
    assert verdict is True


@pytest.mark.asyncio
async def test__is_command_response_false(connection_handler):
    """A message whose ``id`` is a string is not treated as a command response."""
    message = {'id': 'string', 'method': 'SomeMethod'}
    verdict = connection_handler._is_command_response(message)
    assert verdict is False


@pytest.mark.asyncio
async def test__resolve_ws_address_with_page_id(
    connection_handler_with_page_id,
):
    """A handler configured with a page id resolves to the page-level address."""
    resolved = await connection_handler_with_page_id._resolve_ws_address()
    assert resolved == 'ws://localhost:9222/devtools/page/ABCD'


@pytest.mark.asyncio
async def test__incoming_messages(connection_handler):
    """_incoming_messages yields the raw text received from the websocket."""
    raw_message = '{"id": 1, "method": "SomeMethod"}'
    connection_handler._ws_connection.recv = AsyncMock(
        return_value=raw_message
    )

    message_stream = connection_handler._incoming_messages()
    first_message = await anext(message_stream)
    assert first_message == '{"id": 1, "method": "SomeMethod"}'


@pytest.mark.asyncio
async def test__process_single_message(connection_handler):
    """A message with an id resolves the matching command with the raw text."""
    raw_message = '{"id": 1, "method": "SomeMethod"}'
    resolver_stub = MagicMock()
    connection_handler._command_manager.resolve_command = resolver_stub

    await connection_handler._process_single_message(raw_message)

    connection_handler._command_manager.resolve_command.assert_called_once_with(
        1, raw_message
    )


@pytest.mark.asyncio
async def test__process_single_message_invalid_command(connection_handler):
    """Input that is not valid JSON is processed without error and yields None."""
    malformed = 'not a valid JSON'
    outcome = await connection_handler._process_single_message(malformed)
    assert outcome is None


@pytest.mark.asyncio
async def test__process_single_message_event(connection_handler):
    """A message without an id is handed to the events handler as an event."""
    event = {'method': 'SomeEvent'}
    raw_event = json.dumps(event)
    connection_handler._events_handler.process_event = AsyncMock()

    await connection_handler._process_single_message(raw_event)

    connection_handler._events_handler.process_event.assert_called_once_with(
        event
    )


@pytest.mark.asyncio
async def test__process_single_message_event_with_callback(connection_handler):
    """A registered callback receives the decoded event exactly once."""
    event = {'method': 'SomeEvent'}
    listener = MagicMock(return_value=None)

    await connection_handler.register_callback('SomeEvent', listener)
    await connection_handler._process_single_message(json.dumps(event))

    listener.assert_called_once_with(event)


@pytest.mark.asyncio
async def test__receive_events_flow(connection_handler):
    """_receive_events routes commands and events to their respective handlers."""

    async def scripted_messages():
        # One command response followed by one event.
        yield '{"id": 1, "method": "TestCommand"}'
        yield '{"method": "TestEvent"}'

    connection_handler._incoming_messages = scripted_messages
    connection_handler._handle_command_message = AsyncMock()
    connection_handler._handle_event_message = AsyncMock()

    await connection_handler._receive_events()

    expected_command = {
        'id': 1,
        'method': 'TestCommand',
    }
    expected_event = {'method': 'TestEvent'}
    connection_handler._handle_command_message.assert_awaited_once_with(
        expected_command
    )
    connection_handler._handle_event_message.assert_awaited_once_with(
        expected_event
    )


@pytest.mark.asyncio
async def test__receive_events_connection_closed(connection_handler):
    """_receive_events returns quietly when the stream raises ConnectionClosed."""

    async def closed_stream():
        raise websockets.ConnectionClosed(
            1000, 'Normal Closure', rcvd_then_sent=True
        )
        yield  # Unreachable; makes this function an async generator

    connection_handler._incoming_messages = closed_stream
    await connection_handler._receive_events()


@pytest.mark.asyncio
async def test__receive_events_unexpected_exception(connection_handler):
    """Errors other than ConnectionClosed propagate out of _receive_events."""

    async def broken_stream():
        raise ValueError('Unexpected error in async generator')
        yield  # Unreachable; makes this function an async generator

    connection_handler._incoming_messages = broken_stream

    expected_message = 'Unexpected error in async generator'
    with pytest.raises(ValueError, match=expected_message):
        await connection_handler._receive_events()


@pytest.mark.asyncio
async def test__aenter__(connection_handler):
    """__aenter__ returns the handler itself."""
    entered = await connection_handler.__aenter__()
    assert entered is connection_handler


@pytest.mark.asyncio
async def test__aexit__(connection_handler):
    """__aexit__ clears callbacks and closes the websocket once each."""
    await connection_handler.register_callback('SomeEvent', MagicMock())

    # Replace both collaborators so their awaits can be counted.
    connection_handler.clear_callbacks = AsyncMock()
    connection_handler._ws_connection.close = AsyncMock()

    await connection_handler.__aexit__(None, None, None)

    connection_handler.clear_callbacks.assert_awaited_once()
    connection_handler._ws_connection.close.assert_awaited_once()


def test__repr__(connection_handler):
    """The repr of a handler names the class and its connection port."""
    rendered = connection_handler.__repr__()
    assert rendered == 'ConnectionHandler(port=9222)'


def test__str__(connection_handler):
    """The str of a handler names the class and its connection port."""
    rendered = connection_handler.__str__()
    assert rendered == 'ConnectionHandler(port=9222)'


================================================
FILE: tests/test_core_integration.py
================================================
"""Integration tests for core WebElement/Tab behaviors (non-iframe)."""

import asyncio
from pathlib import Path

import pytest

from pydoll.browser.chromium import Chrome
from pydoll.elements.web_element import WebElement


class TestCoreFindQuery:
    """Element lookup via find() and query() on the simple core test page."""

    @pytest.mark.asyncio
    async def test_find_by_common_selectors(self, ci_chrome_options):
        """find() locates elements by id, class name, name and tag name."""
        page_path = Path(__file__).parent / 'pages' / 'test_core_simple.html'
        page_url = f'file://{page_path.absolute()}'

        async with Chrome(options=ci_chrome_options) as browser:
            tab = await browser.start()
            await tab.go_to(page_url)
            await asyncio.sleep(0.5)

            # Lookup by id.
            heading_el = await tab.find(id='main-heading')
            assert heading_el is not None
            assert isinstance(heading_el, WebElement)
            assert heading_el.get_attribute('id') == 'main-heading'

            # Lookup by class name returns the first matching element.
            item_el = await tab.find(class_name='item')
            assert item_el is not None
            item_classes = item_el.get_attribute('class') or ''
            assert 'item' in item_classes

            # Lookup by the name attribute.
            username_el = await tab.find(name='username')
            assert username_el is not None
            assert username_el.get_attribute('id') == 'text-input'

            # Lookup by tag name returns the first button.
            button_el = await tab.find(tag_name='button')
            assert button_el is not None
            assert button_el.get_attribute('id') == 'btn-1'

    @pytest.mark.asyncio
    async def test_query_css_and_xpath(self, ci_chrome_options):
        """query() handles CSS and XPath; find(xpath=...) works relative to a node."""
        page_path = Path(__file__).parent / 'pages' / 'test_core_simple.html'
        page_url = f'file://{page_path.absolute()}'

        async with Chrome(options=ci_chrome_options) as browser:
            tab = await browser.start()
            await tab.go_to(page_url)
            await asyncio.sleep(0.5)

            # CSS selector matching all list items.
            list_items = await tab.query('.list-item', find_all=True)
            assert list_items is not None
            assert len(list_items) == 3

            # XPath evaluated from the document root.
            absolute_span = await tab.query(
                '//*[@id="deep-section"]//span[@id="deep-span"]'
            )
            assert absolute_span is not None
            absolute_text = await absolute_span.text
            assert 'Deep nested element' in absolute_text

            # XPath evaluated relative to a container element.
            section_el = await tab.find(id='deep-section')
            relative_span = await section_el.find(
                xpath='.//span[@id="deep-span"]'
            )
            assert relative_span is not None
            relative_text = await relative_span.text
            assert 'Deep nested element' in relative_text


class TestCoreClickAndInput:
    """Clicking, text insertion, clearing and option selection on the simple page."""

    @pytest.mark.asyncio
    async def test_click_increments_counter(self, ci_chrome_options):
        """Each click on the button bumps the displayed counter by one."""
        page_path = Path(__file__).parent / 'pages' / 'test_core_simple.html'
        page_url = f'file://{page_path.absolute()}'

        async with Chrome(options=ci_chrome_options) as browser:
            tab = await browser.start()
            await tab.go_to(page_url)
            await asyncio.sleep(0.5)

            clicker = await tab.find(id='btn-1')
            count_el = await tab.find(id='btn-1-count')

            # Counter starts at zero before any click.
            initial_text = await count_el.text
            assert initial_text.strip() == '0'

            # Two consecutive clicks, checking the counter after each one.
            for expected_count in ('1', '2'):
                await clicker.click()
                await asyncio.sleep(0.2)
                shown_text = await count_el.text
                assert shown_text.strip() == expected_count

    @pytest.mark.asyncio
    async def test_insert_text_input_and_textarea(self, ci_chrome_options):
        """insert_text is followed by a check of the ``value`` attribute."""
        page_path = Path(__file__).parent / 'pages' / 'test_core_simple.html'
        page_url = f'file://{page_path.absolute()}'

        async with Chrome(options=ci_chrome_options) as browser:
            tab = await browser.start()
            await tab.go_to(page_url)
            await asyncio.sleep(0.5)

            # Single-line input.
            text_input = await tab.find(id='text-input')
            await text_input.insert_text('Hello')
            await asyncio.sleep(0.1)
            input_value = text_input.get_attribute('value') or ''
            assert 'Hello' in input_value

            # Multi-line textarea.
            text_area = await tab.find(id='text-area')
            await text_area.insert_text('World')
            await asyncio.sleep(0.1)
            area_value = text_area.get_attribute('value') or ''
            assert 'World' in area_value

    @pytest.mark.asyncio
    async def test_clear_input_and_textarea(self, ci_chrome_options):
        """clear() empties an input and a textarea that already hold text."""
        page_path = Path(__file__).parent / 'pages' / 'test_core_simple.html'
        page_url = f'file://{page_path.absolute()}'

        async with Chrome(options=ci_chrome_options) as browser:
            tab = await browser.start()
            await tab.go_to(page_url)
            await asyncio.sleep(0.5)

            # Input: fill, clear, confirm empty, then fill again.
            text_input = await tab.find(id='text-input')
            await text_input.insert_text('old value')
            await asyncio.sleep(0.1)

            await text_input.clear()
            await asyncio.sleep(0.1)
            script_reply = await text_input.execute_script(
                'return this.value', return_by_value=True
            )
            assert script_reply['result']['result']['value'] == ''

            await text_input.insert_text('new value')
            await asyncio.sleep(0.1)
            script_reply = await text_input.execute_script(
                'return this.value', return_by_value=True
            )
            assert script_reply['result']['result']['value'] == 'new value'

            # Textarea: fill, clear, confirm empty.
            text_area = await tab.find(id='text-area')
            await text_area.insert_text('old message')
            await asyncio.sleep(0.1)

            await text_area.clear()
            await asyncio.sleep(0.1)
            script_reply = await text_area.execute_script(
                'return this.value', return_by_value=True
            )
            assert script_reply['result']['result']['value'] == ''

    @pytest.mark.asyncio
    async def test_select_option_click(self, ci_chrome_options):
        """Clicking an <option> changes the value reported by its <select>."""
        page_path = Path(__file__).parent / 'pages' / 'test_core_simple.html'
        page_url = f'file://{page_path.absolute()}'

        async with Chrome(options=ci_chrome_options) as browser:
            tab = await browser.start()
            await tab.go_to(page_url)
            await asyncio.sleep(0.5)

            dropdown = await tab.find(id='simple-select')
            assert dropdown is not None

            # Pick the option whose value is 'beta'.
            beta_option = await dropdown.find(xpath='.//option[@value="beta"]')
            await beta_option.click()
            await asyncio.sleep(0.2)

            # Read the selected value back through JavaScript.
            script_reply = await dropdown.execute_script(
                'return this.value', return_by_value=True
            )
            selected_value = script_reply['result']['result']['value']
            assert selected_value == 'beta'


class TestCoreTypeText:
    """Integration tests for type_text (keyboard-based input)."""

    @pytest.mark.asyncio
    async def test_type_text_into_input(self, ci_chrome_options):
        """Typed characters end up in the input's value."""
        page_path = Path(__file__).parent / 'pages' / 'test_core_simple.html'
        page_url = f'file://{page_path.absolute()}'

        async with Chrome(options=ci_chrome_options) as browser:
            tab = await browser.start()
            await tab.go_to(page_url)
            await asyncio.sleep(0.5)

            text_input = await tab.find(id='text-input')
            await text_input.type_text('hello123')
            await asyncio.sleep(0.3)

            script_reply = await text_input.execute_script(
                'return this.value', return_by_value=True
            )
            assert script_reply['result']['result']['value'] == 'hello123'

    @pytest.mark.asyncio
    async def test_type_text_humanized_into_input(self, ci_chrome_options):
        """type_text with humanize=True leaves a plausible value in the input."""
        page_path = Path(__file__).parent / 'pages' / 'test_core_simple.html'
        page_url = f'file://{page_path.absolute()}'

        async with Chrome(options=ci_chrome_options) as browser:
            tab = await browser.start()
            await tab.go_to(page_url)
            await asyncio.sleep(0.5)

            text_input = await tab.find(id='text-input')
            await text_input.type_text('Test!', humanize=True)
            await asyncio.sleep(0.3)

            script_reply = await text_input.execute_script(
                'return this.value', return_by_value=True
            )
            typed_value = script_reply['result']['result']['value']
            # Humanized typing may introduce and then correct typos, so only
            # a lower bound on the final length is asserted rather than an
            # exact match with the requested text.
            assert len(typed_value) >= 3

    @pytest.mark.asyncio
    async def test_type_text_symbols_and_punctuation(self, ci_chrome_options):
        """An e-mail style string with ``@`` and ``.`` is typed verbatim."""
        page_path = Path(__file__).parent / 'pages' / 'test_core_simple.html'
        page_url = f'file://{page_path.absolute()}'

        async with Chrome(options=ci_chrome_options) as browser:
            tab = await browser.start()
            await tab.go_to(page_url)
            await asyncio.sleep(0.5)

            text_input = await tab.find(id='text-input')
            wanted_text = 'user@example.com'
            await text_input.type_text(wanted_text)
            await asyncio.sleep(0.3)

            script_reply = await text_input.execute_script(
                'return this.value', return_by_value=True
            )
            assert script_reply['result']['result']['value'] == wanted_text

    @pytest.mark.asyncio
    @pytest.mark.parametrize(
        'text,label',
        [
            ('abcdefghijklmnopqrstuvwxyz', 'lowercase'),
            ('ABCDEFGHIJKLMNOPQRSTUVWXYZ', 'uppercase'),
            ('0123456789', 'digits'),
            ('-=[];\',./', 'punctuation_unshifted'),
            ('!@#$%^&*()_+{}|:"<>?~', 'punctuation_shifted'),
        ],
    )
    async def test_type_text_all_character_groups(self, ci_chrome_options, text, label):
        """Each parametrized character group is typed exactly as given."""
        page_path = Path(__file__).parent / 'pages' / 'test_core_simple.html'
        page_url = f'file://{page_path.absolute()}'

        async with Chrome(options=ci_chrome_options) as browser:
            tab = await browser.start()
            await tab.go_to(page_url)
            await asyncio.sleep(0.5)

            text_input = await tab.find(id='text-input')
            await text_input.type_text(text)
            await asyncio.sleep(0.3)

            script_reply = await text_input.execute_script(
                'return this.value', return_by_value=True
            )
            typed_value = script_reply['result']['result']['value']
            assert typed_value == text, f'Failed for {label}: {text!r}'


================================================
FILE: tests/test_decorators.py
================================================
"""Tests for the retry decorator."""

import asyncio
import pytest
import pytest_asyncio
from unittest.mock import AsyncMock, MagicMock, call

from pydoll.decorators import retry, RetryConfig
from pydoll.exceptions import (
    ElementNotFound,
    WaitElementTimeout,
    NetworkError,
    PydollException,
)


class TestRetryConfigInitialization:
    """Construction of RetryConfig with default and explicit arguments."""

    def test_default_initialization(self):
        """A bare RetryConfig() exposes the expected default attribute values."""
        cfg = RetryConfig()
        assert cfg.max_retries == 5
        assert cfg.exceptions == Exception
        assert cfg.on_retry is None
        assert cfg.delay == 0
        assert cfg.exponential_backoff is False

    def test_custom_initialization(self):
        """Explicit constructor arguments are stored unchanged on the config."""
        retry_hook = AsyncMock()
        retryable = [ElementNotFound, NetworkError]
        cfg = RetryConfig(
            max_retries=3,
            exceptions=retryable,
            on_retry=retry_hook,
            delay=2.0,
            exponential_backoff=True,
        )
        assert cfg.max_retries == 3
        assert cfg.exceptions == [ElementNotFound, NetworkError]
        assert cfg.on_retry == retry_hook
        assert cfg.delay == 2.0
        assert cfg.exponential_backoff is True


class TestRetryConfigCalculateDelay:
    """Behavior of RetryConfig.calculate_delay for the supported delay modes."""

    def test_no_delay(self):
        """A zero base delay yields zero for the sampled attempt numbers."""
        cfg = RetryConfig(delay=0)
        for attempt in (1, 5):
            assert cfg.calculate_delay(attempt) == 0

    def test_constant_delay(self):
        """Without exponential backoff the delay stays at the base value."""
        cfg = RetryConfig(delay=2.0, exponential_backoff=False)
        for attempt in (0, 1, 2):
            assert cfg.calculate_delay(attempt) == 2.0

    def test_exponential_backoff(self):
        """With exponential backoff the delay doubles on each attempt."""
        cfg = RetryConfig(delay=1.0, exponential_backoff=True)
        # Expected value at attempt n is 1 * 2^n.
        doubling_delays = (1.0, 2.0, 4.0, 8.0)
        for attempt, expected in enumerate(doubling_delays):
            assert cfg.calculate_delay(attempt) == expected


class TestRetryConfigIsMatchingException:
    """Exercise RetryConfig.is_matching_exception against different filters."""

    def test_single_exception_match(self):
        """A single exception class matches its own instances only."""
        matcher = RetryConfig(exceptions=ElementNotFound).is_matching_exception

        assert matcher(ElementNotFound("test"))
        assert not matcher(NetworkError("test"))

    def test_list_exception_match(self):
        """A list of classes matches instances of any listed class."""
        matcher = RetryConfig(
            exceptions=[ElementNotFound, NetworkError]
        ).is_matching_exception

        for listed in (ElementNotFound, NetworkError):
            assert matcher(listed("test"))
        assert not matcher(WaitElementTimeout("test"))

    def test_parent_exception_match(self):
        """Filtering on PydollException matches the pydoll errors checked, not ValueError."""
        matcher = RetryConfig(exceptions=PydollException).is_matching_exception

        for pydoll_error in (ElementNotFound, NetworkError):
            assert matcher(pydoll_error("test"))
        assert not matcher(ValueError("test"))


class TestRetryConfigCallCallback:
    """Exercise RetryConfig.call_callback with and without an on_retry hook."""

    @pytest.mark.asyncio
    async def test_no_callback(self):
        """With on_retry=None the call completes without raising."""
        hookless = RetryConfig(on_retry=None)
        await hookless.call_callback(None)

    @pytest.mark.asyncio
    async def test_callback_with_instance(self):
        """The hook is awaited exactly once with the instance passed in."""
        hook = AsyncMock()
        owner = MagicMock()

        await RetryConfig(on_retry=hook).call_callback(owner)

        hook.assert_called_once_with(owner)

    @pytest.mark.asyncio
    async def test_callback_without_instance(self):
        """A hook that takes no parameters is still invoked."""
        invocations = []

        async def simple_callback():
            # Zero-parameter hook: records that it ran.
            invocations.append(True)

        config = RetryConfig(on_retry=simple_callback)
        await config.call_callback(MagicMock())

        assert invocations


class TestRetryDecoratorBasic:
    """Core behaviour of the retry decorator: success, retry, pass-through, exhaustion."""

    @pytest.mark.asyncio
    async def test_successful_execution_no_retry(self):
        """A function that succeeds immediately runs exactly once."""
        attempts = []

        @retry(max_retries=3, exceptions=[ElementNotFound])
        async def successful_function():
            attempts.append(None)
            return "success"

        assert await successful_function() == "success"
        assert len(attempts) == 1

    @pytest.mark.asyncio
    async def test_retry_on_matching_exception(self):
        """A matching exception triggers retries until the call succeeds."""
        attempts = []

        @retry(max_retries=2, exceptions=[ElementNotFound], delay=0)
        async def failing_function():
            attempts.append(None)
            if len(attempts) >= 3:
                return "success"
            raise ElementNotFound("Element not found")

        assert await failing_function() == "success"
        # max_retries=2 -> 1 original attempt + 2 retries
        assert len(attempts) == 3

    @pytest.mark.asyncio
    async def test_no_retry_on_non_matching_exception(self):
        """An exception outside the configured list propagates after one attempt."""
        attempts = []

        @retry(max_retries=3, exceptions=[ElementNotFound], delay=0)
        async def failing_function():
            attempts.append(None)
            raise NetworkError("Network error")

        with pytest.raises(NetworkError):
            await failing_function()

        assert len(attempts) == 1

    @pytest.mark.asyncio
    async def test_exhaust_all_retries(self):
        """A function that always fails is attempted max_retries + 1 times, then raises."""
        attempts = []

        @retry(max_retries=2, exceptions=[ElementNotFound], delay=0)
        async def always_failing():
            attempts.append(None)
            raise ElementNotFound("Always fails")

        with pytest.raises(ElementNotFound):
            await always_failing()

        # max_retries=2 -> 1 original attempt + 2 retries
        assert len(attempts) == 3


class TestRetryDecoratorWithMultipleExceptions:
    """Retry behaviour when several exception types are configured."""

    @pytest.mark.asyncio
    async def test_retry_on_any_listed_exception(self):
        """Each listed exception type triggers a retry; the fourth attempt succeeds."""
        # Failures to produce, in order: (label to record, exception class, message).
        failure_script = (
            ("ElementNotFound", ElementNotFound, "First error"),
            ("NetworkError", NetworkError, "Second error"),
            ("WaitElementTimeout", WaitElementTimeout, "Third error"),
        )
        exceptions_raised = []

        @retry(
            max_retries=3,
            exceptions=[ElementNotFound, NetworkError, WaitElementTimeout],
            delay=0
        )
        async def multi_exception_function():
            step = len(exceptions_raised)
            if step >= len(failure_script):
                return "success"
            label, error_type, message = failure_script[step]
            exceptions_raised.append(label)
            raise error_type(message)

        outcome = await multi_exception_function()

        assert outcome == "success"
        # max_retries=3 -> 4 attempts total; three failures precede the success
        assert len(exceptions_raised) == 3


class TestRetryDecoratorWithDelay:
    """Test retry with delay between attempts.

    Timestamps are taken from the running event loop's clock; assertions only
    place lower bounds on the gaps between attempts.
    """

    @pytest.mark.asyncio
    async def test_constant_delay(self):
        """Test constant delay between retries."""
        call_times = []

        @retry(max_retries=2, exceptions=[ElementNotFound], delay=0.1)
        async def delayed_function():
            # get_running_loop() is the preferred way to reach the loop from
            # inside a coroutine (get_event_loop() has policy-dependent behaviour).
            call_times.append(asyncio.get_running_loop().time())
            if len(call_times) < 3:
                raise ElementNotFound("Retry")
            return "success"

        await delayed_function()

        # max_retries=2 means 3 attempts (1 original + 2 retries)
        assert len(call_times) == 3
        # Check delays between calls (should be ~0.1s)
        # Allow 50ms tolerance for timing
        assert call_times[1] - call_times[0] >= 0.05
        assert call_times[2] - call_times[1] >= 0.05

    @pytest.mark.asyncio
    async def test_exponential_backoff(self):
        """Test exponential backoff increases delay."""
        call_times = []

        @retry(
            max_retries=3,
            exceptions=[ElementNotFound],
            delay=0.1,
            exponential_backoff=True
        )
        async def exponential_function():
            call_times.append(asyncio.get_running_loop().time())
            if len(call_times) < 4:
                raise ElementNotFound("Retry")
            return "success"

        await exponential_function()

        # max_retries=3 means 4 attempts (1 original + 3 retries)
        assert len(call_times) == 4
        # First delay: ~0.1s (2^0 * 0.1)
        # Second delay: ~0.2s (2^1 * 0.1)
        # Third delay: ~0.4s (2^2 * 0.1)
        delay1 = call_times[1] - call_times[0]
        delay2 = call_times[2] - call_times[1]
        delay3 = call_times[3] - call_times[2]

        # Each delay should roughly double (with tolerance)
        assert delay2 > delay1 * 1.5
        assert delay3 > delay2 * 1.5


class TestRetryDecoratorWithCallback:
    """Retry behaviour when an on_retry callback is supplied."""

    @pytest.mark.asyncio
    async def test_callback_called_on_retry(self):
        """The callback runs once per retry, not for the original attempt."""
        hook_runs = []
        attempts = []

        async def retry_callback():
            hook_runs.append(None)

        @retry(
            max_retries=2,
            exceptions=[ElementNotFound],
            on_retry=retry_callback,
            delay=0
        )
        async def function_with_callback():
            attempts.append(None)
            if len(attempts) >= 3:
                return "success"
            raise ElementNotFound("Retry")

        await function_with_callback()

        # max_retries=2 -> 3 attempts; the callback precedes retry 1 and retry 2
        assert len(attempts) == 3
        assert len(hook_runs) == 2

    @pytest.mark.asyncio
    async def test_callback_receives_instance(self):
        """On a decorated method, the callback is handed the owning instance."""
        class TestClass:
            def __init__(self):
                self.call_count = 0
                self.callback_count = 0
                self.instance_received = None

            async def recovery_callback(self):
                # Remember which object the decorator passed in.
                self.instance_received = self
                self.callback_count += 1

            @retry(
                max_retries=2,
                exceptions=[ElementNotFound],
                on_retry=recovery_callback,
                delay=0
            )
            async def method_with_callback(self):
                self.call_count += 1
                if self.call_count >= 3:
                    return "success"
                raise ElementNotFound("Retry")

        subject = TestClass()
        outcome = await subject.method_with_callback()

        assert outcome == "success"
        # max_retries=2 -> 3 attempts, so the callback ran twice
        assert subject.callback_count == 2
        assert subject.instance_received is subject


class TestRetryDecoratorEdgeCases:
    """Boundary values of max_retries and the exception_to_raise option."""

    @pytest.mark.asyncio
    async def test_zero_retries_succeeds(self):
        """max_retries=0 still performs the single original attempt."""
        attempts = []

        @retry(max_retries=0, exceptions=[ElementNotFound], delay=0)
        async def zero_retry_function():
            attempts.append(None)
            return "success"

        assert await zero_retry_function() == "success"
        # max_retries=0 -> exactly one attempt
        assert len(attempts) == 1

    @pytest.mark.asyncio
    async def test_zero_retries_fails_immediately(self):
        """max_retries=0 propagates the failure after one attempt."""
        attempts = []

        @retry(max_retries=0, exceptions=[ElementNotFound], delay=0)
        async def zero_retry_function():
            attempts.append(None)
            raise ElementNotFound("Fail")

        with pytest.raises(ElementNotFound):
            await zero_retry_function()

        # max_retries=0 -> exactly one attempt, no retries
        assert len(attempts) == 1

    @pytest.mark.asyncio
    async def test_one_retry_succeeds_on_second_attempt(self):
        """max_retries=1 allows one retry, which succeeds here."""
        attempts = []

        @retry(max_retries=1, exceptions=[ElementNotFound], delay=0)
        async def one_retry_function():
            attempts.append(None)
            if len(attempts) != 1:
                return "success"
            raise ElementNotFound("Fail")

        assert await one_retry_function() == "success"
        # max_retries=1 -> 1 original attempt + 1 retry
        assert len(attempts) == 2

    @pytest.mark.asyncio
    async def test_exception_to_raise_parameter(self):
        """After retries are exhausted, exception_to_raise replaces the original error."""
        attempts = []
        replacement = NetworkError("Custom error message")

        @retry(
            max_retries=1,
            exceptions=[ElementNotFound],
            delay=0,
            exception_to_raise=replacement
        )
        async def function_with_custom_exception():
            attempts.append(None)
            raise ElementNotFound("Original error")

        with pytest.raises(NetworkError) as caught:
            await function_with_custom_exception()

        assert str(caught.value) == "Custom error message"
        # max_retries=1 -> 1 original attempt + 1 retry
        assert len(attempts) == 2


class TestRetryDecoratorWithClassMethods:
    """The retry decorator applied to methods defined on classes."""

    @pytest.mark.asyncio
    async def test_instance_method(self):
        """A decorated instance method retries and keeps mutating the same instance."""
        class Counter:
            def __init__(self):
                self.count = 0

            @retry(max_retries=2, exceptions=[ElementNotFound], delay=0)
            async def increment(self):
                self.count += 1
                if self.count >= 3:
                    return self.count
                raise ElementNotFound("Retry")

        subject = Counter()
        final_value = await subject.increment()

        # max_retries=2 -> 1 original attempt + 2 retries
        assert final_value == 3
        assert subject.count == 3

    @pytest.mark.asyncio
    async def test_method_with_arguments(self):
        """Positional arguments reach the wrapped method unchanged."""
        class Calculator:
            @retry(max_retries=3, exceptions=[ValueError], delay=0)
            async def divide(self, a: int, b: int):
                if b == 0:
                    raise ValueError("Division by zero")
                return a / b

        quotient = await Calculator().divide(10, 2)
        assert quotient == 5.0

    @pytest.mark.asyncio
    async def test_method_with_state_restoration(self):
        """An on_retry callback can repair instance state before the next attempt."""
        class StatefulClass:
            def __init__(self):
                self.state = "initial"
                self.attempts = 0

            async def restore_state(self):
                self.state = "restored"

            @retry(
                max_retries=2,
                exceptions=[ElementNotFound],
                on_retry=restore_state,
                delay=0
            )
            async def process(self):
                self.attempts += 1
                if self.attempts >= 3:
                    return "success"
                # Failing attempts leave the object "broken" until the callback runs.
                self.state = "broken"
                raise ElementNotFound("Retry")

        subject = StatefulClass()
        outcome = await subject.process()

        assert outcome == "success"
        # max_retries=2 -> 1 original attempt + 2 retries
        assert subject.attempts == 3
        assert subject.state == "restored"


class TestRetryConfigHandleDelay:
    """Test handle_delay method.

    Elapsed time is measured with the running event loop's clock.
    """

    @pytest.mark.asyncio
    async def test_handle_delay_no_delay(self):
        """Test handle_delay with zero delay."""
        config = RetryConfig(delay=0)

        # get_running_loop() is the preferred accessor inside a coroutine;
        # get_event_loop() has policy-dependent behaviour.
        loop = asyncio.get_running_loop()
        start_time = loop.time()
        await config.handle_delay(1)
        end_time = loop.time()

        # Should be nearly instant
        assert end_time - start_time < 0.01

    @pytest.mark.asyncio
    async def test_handle_delay_with_delay(self):
        """Test handle_delay waits for specified time."""
        config = RetryConfig(delay=0.1, exponential_backoff=False)

        loop = asyncio.get_running_loop()
        start_time = loop.time()
        await config.handle_delay(1)
        end_time = loop.time()

        # Should wait approximately 0.1 seconds; only a 50ms lower bound is
        # enforced to tolerate timer granularity.
        assert end_time - start_time >= 0.05


class TestRetryDecoratorRealWorldScenarios:
    """End-to-end style scenarios combining retries, callbacks and delays."""

    @pytest.mark.asyncio
    async def test_network_retry_scenario(self):
        """A client reconnects via on_retry and succeeds on the third attempt."""
        class NetworkClient:
            def __init__(self):
                self.reconnect_count = 0
                self.attempt_count = 0

            async def reconnect(self):
                """Stand-in for reconnection logic."""
                await asyncio.sleep(0.01)
                self.reconnect_count += 1

            @retry(
                max_retries=2,
                exceptions=[NetworkError],
                on_retry=reconnect,
                delay=0.05,
                exponential_backoff=True
            )
            async def fetch_data(self, url: str):
                self.attempt_count += 1
                # The first two attempts fail; the third returns data.
                if self.attempt_count >= 3:
                    return f"Data from {url}"
                raise NetworkError(f"Connection failed (attempt {self.attempt_count})")

        client = NetworkClient()
        payload = await client.fetch_data("https://example.com")

        assert payload == "Data from https://example.com"
        # max_retries=2 -> 1 original attempt + 2 retries
        assert client.attempt_count == 3
        # One reconnect before each of the two retries
        assert client.reconnect_count == 2

    @pytest.mark.asyncio
    async def test_element_search_retry_scenario(self):
        """An element lookup succeeds once on_retry has refreshed the page."""
        class PageScraper:
            def __init__(self):
                self.search_count = 0
                self.page_refreshed = False

            async def refresh_page(self):
                """Stand-in for a page refresh."""
                await asyncio.sleep(0.01)
                self.page_refreshed = True

            @retry(
                max_retries=2,
                exceptions=[ElementNotFound, WaitElementTimeout],
                on_retry=refresh_page,
                delay=0.05
            )
            async def find_element(self, selector: str):
                self.search_count += 1
                if self.page_refreshed:
                    return f"Element: {selector}"
                raise ElementNotFound(f"Element '{selector}' not found")

        scraper = PageScraper()
        found = await scraper.find_element("#content")

        assert found == "Element: #content"
        # Up to 3 attempts are allowed; the refresh makes the 2nd one succeed
        assert scraper.search_count == 2
        assert scraper.page_refreshed is True


================================================
FILE: tests/test_events.py
================================================
from pydoll.protocol.browser.events import BrowserEvent
from pydoll.protocol.dom.events import DomEvent
from pydoll.protocol.fetch.events import FetchEvent
from pydoll.protocol.input.events import InputEvent
from pydoll.protocol.network.events import NetworkEvent
from pydoll.protocol.page.events import PageEvent
from pydoll.protocol.runtime.events import RuntimeEvent
from pydoll.protocol.storage.events import StorageEvent
from pydoll.protocol.target.events import TargetEvent


def test_browser_events():
    """Check the listed BrowserEvent members against their 'Browser.*' event strings."""
    expected = (
        (BrowserEvent.DOWNLOAD_PROGRESS, 'Browser.downloadProgress'),
        (BrowserEvent.DOWNLOAD_WILL_BEGIN, 'Browser.downloadWillBegin'),
    )
    for member, event_string in expected:
        assert member == event_string


def test_dom_events():
    """Check the listed DomEvent members against their 'DOM.*' event strings."""
    expected = (
        (DomEvent.ATTRIBUTE_MODIFIED, 'DOM.attributeModified'),
        (DomEvent.ATTRIBUTE_REMOVED, 'DOM.attributeRemoved'),
        (DomEvent.CHARACTER_DATA_MODIFIED, 'DOM.characterDataModified'),
        (DomEvent.CHILD_NODE_COUNT_UPDATED, 'DOM.childNodeCountUpdated'),
        (DomEvent.CHILD_NODE_INSERTED, 'DOM.childNodeInserted'),
        (DomEvent.CHILD_NODE_REMOVED, 'DOM.childNodeRemoved'),
        (DomEvent.DOCUMENT_UPDATED, 'DOM.documentUpdated'),
        (DomEvent.SET_CHILD_NODES, 'DOM.setChildNodes'),
        (DomEvent.DISTRIBUTED_NODES_UPDATED, 'DOM.distributedNodesUpdated'),
        (DomEvent.INLINE_STYLE_INVALIDATED, 'DOM.inlineStyleInvalidated'),
        (DomEvent.PSEUDO_ELEMENT_ADDED, 'DOM.pseudoElementAdded'),
        (DomEvent.PSEUDO_ELEMENT_REMOVED, 'DOM.pseudoElementRemoved'),
        (DomEvent.SCROLLABLE_FLAG_UPDATED, 'DOM.scrollableFlagUpdated'),
        (DomEvent.SHADOW_ROOT_POPPED, 'DOM.shadowRootPopped'),
        (DomEvent.SHADOW_ROOT_PUSHED, 'DOM.shadowRootPushed'),
        (DomEvent.TOP_LAYER_ELEMENTS_UPDATED, 'DOM.topLayerElementsUpdated'),
    )
    for member, event_string in expected:
        assert member == event_string


def test_fetch_events():
    """Check the listed FetchEvent members against their 'Fetch.*' event strings."""
    expected = (
        (FetchEvent.AUTH_REQUIRED, 'Fetch.authRequired'),
        (FetchEvent.REQUEST_PAUSED, 'Fetch.requestPaused'),
    )
    for member, event_string in expected:
        assert member == event_string


def test_input_events():
    """Check InputEvent.DRAG_INTERCEPTED against its 'Input.*' event string."""
    drag_intercepted = InputEvent.DRAG_INTERCEPTED
    assert drag_intercepted == 'Input.dragIntercepted'


def test_network_events():
    """Check the listed NetworkEvent members against their 'Network.*' event strings."""
    expected = (
        (NetworkEvent.DATA_RECEIVED, 'Network.dataReceived'),
        (NetworkEvent.EVENT_SOURCE_MESSAGE_RECEIVED, 'Network.eventSourceMessageReceived'),
        (NetworkEvent.LOADING_FAILED, 'Network.loadingFailed'),
        (NetworkEvent.LOADING_FINISHED, 'Network.loadingFinished'),
        (NetworkEvent.REQUEST_SERVED_FROM_CACHE, 'Network.requestServedFromCache'),
        (NetworkEvent.REQUEST_WILL_BE_SENT, 'Network.requestWillBeSent'),
        (NetworkEvent.RESPONSE_RECEIVED, 'Network.responseReceived'),
        (NetworkEvent.WEBSOCKET_CLOSED, 'Network.webSocketClosed'),
        (NetworkEvent.WEBSOCKET_CREATED, 'Network.webSocketCreated'),
        (NetworkEvent.WEBSOCKET_FRAME_ERROR, 'Network.webSocketFrameError'),
        (NetworkEvent.WEBSOCKET_FRAME_RECEIVED, 'Network.webSocketFrameReceived'),
        (NetworkEvent.WEBSOCKET_FRAME_SENT, 'Network.webSocketFrameSent'),
        (NetworkEvent.WEBSOCKET_HANDSHAKE_RESPONSE_RECEIVED, 'Network.webSocketHandshakeResponseReceived'),
        (NetworkEvent.WEBSOCKET_WILL_SEND_HANDSHAKE_REQUEST, 'Network.webSocketWillSendHandshakeRequest'),
        (NetworkEvent.WEBTRANSPORT_CLOSED, 'Network.webTransportClosed'),
        (NetworkEvent.WEBTRANSPORT_CONNECTION_ESTABLISHED, 'Network.webTransportConnectionEstablished'),
        (NetworkEvent.WEBTRANSPORT_CREATED, 'Network.webTransportCreated'),
        (NetworkEvent.DIRECT_TCP_SOCKET_ABORTED, 'Network.directTCPSocketAborted'),
        (NetworkEvent.DIRECT_TCP_SOCKET_CHUNK_RECEIVED, 'Network.directTCPSocketChunkReceived'),
        (NetworkEvent.DIRECT_TCP_SOCKET_CHUNK_SENT, 'Network.directTCPSocketChunkSent'),
        (NetworkEvent.DIRECT_TCP_SOCKET_CLOSED, 'Network.directTCPSocketClosed'),
        (NetworkEvent.DIRECT_TCP_SOCKET_CREATED, 'Network.directTCPSocketCreated'),
        (NetworkEvent.DIRECT_TCP_SOCKET_OPENED, 'Network.directTCPSocketOpened'),
        (NetworkEvent.DIRECT_UDP_SOCKET_ABORTED, 'Network.directUDPSocketAborted'),
        (NetworkEvent.DIRECT_UDP_SOCKET_CHUNK_RECEIVED, 'Network.directUDPSocketChunkReceived'),
        (NetworkEvent.DIRECT_UDP_SOCKET_CHUNK_SENT, 'Network.directUDPSocketChunkSent'),
        (NetworkEvent.DIRECT_UDP_SOCKET_CLOSED, 'Network.directUDPSocketClosed'),
        (NetworkEvent.DIRECT_UDP_SOCKET_CREATED, 'Network.directUDPSocketCreated'),
        (NetworkEvent.DIRECT_UDP_SOCKET_OPENED, 'Network.directUDPSocketOpened'),
        (NetworkEvent.POLICY_UPDATED, 'Network.policyUpdated'),
        (NetworkEvent.REPORTING_API_ENDPOINTS_CHANGED_FOR_ORIGIN, 'Network.reportingApiEndpointsChangedForOrigin'),
        (NetworkEvent.REPORTING_API_REPORT_ADDED, 'Network.reportingApiReportAdded'),
        (NetworkEvent.REPORTING_API_REPORT_UPDATED, 'Network.reportingApiReportUpdated'),
        (NetworkEvent.REQUEST_WILL_BE_SENT_EXTRA_INFO, 'Network.requestWillBeSentExtraInfo'),
        (NetworkEvent.RESOURCE_CHANGED_PRIORITY, 'Network.resourceChangedPriority'),
        (NetworkEvent.RESPONSE_RECEIVED_EARLY_HINTS, 'Network.responseReceivedEarlyHints'),
        (NetworkEvent.RESPONSE_RECEIVED_EXTRA_INFO, 'Network.responseReceivedExtraInfo'),
        (NetworkEvent.SIGNED_EXCHANGE_RECEIVED, 'Network.signedExchangeReceived'),
        (NetworkEvent.SUBRESOURCE_WEB_BUNDLE_INNER_RESPONSE_ERROR, 'Network.subresourceWebBundleInnerResponseError'),
        (NetworkEvent.SUBRESOURCE_WEB_BUNDLE_INNER_RESPONSE_PARSED, 'Network.subresourceWebBundleInnerResponseParsed'),
        (NetworkEvent.SUBRESOURCE_WEB_BUNDLE_METADATA_ERROR, 'Network.subresourceWebBundleMetadataError'),
        (NetworkEvent.SUBRESOURCE_WEB_BUNDLE_METADATA_RECEIVED, 'Network.subresourceWebBundleMetadataReceived'),
        (NetworkEvent.TRUST_TOKEN_OPERATION_DONE, 'Network.trustTokenOperationDone'),
    )
    for member, event_string in expected:
        assert member == event_string


def test_page_events():
    """Check the listed PageEvent members against their 'Page.*' event strings."""
    expected = (
        (PageEvent.DOM_CONTENT_EVENT_FIRED, 'Page.domContentEventFired'),
        (PageEvent.FILE_CHOOSER_OPENED, 'Page.fileChooserOpened'),
        (PageEvent.FRAME_ATTACHED, 'Page.frameAttached'),
        (PageEvent.FRAME_DETACHED, 'Page.frameDetached'),
        (PageEvent.FRAME_NAVIGATED, 'Page.frameNavigated'),
        (PageEvent.INTERSTITIAL_HIDDEN, 'Page.interstitialHidden'),
        (PageEvent.INTERSTITIAL_SHOWN, 'Page.interstitialShown'),
        (PageEvent.JAVASCRIPT_DIALOG_CLOSED, 'Page.javascriptDialogClosed'),
        (PageEvent.JAVASCRIPT_DIALOG_OPENING, 'Page.javascriptDialogOpening'),
        (PageEvent.LIFECYCLE_EVENT, 'Page.lifecycleEvent'),
        (PageEvent.LOAD_EVENT_FIRED, 'Page.loadEventFired'),
        (PageEvent.WINDOW_OPEN, 'Page.windowOpen'),
        (PageEvent.BACK_FORWARD_CACHE_NOT_USED, 'Page.backForwardCacheNotUsed'),
        (PageEvent.COMPILATION_CACHE_PRODUCED, 'Page.compilationCacheProduced'),
        (PageEvent.DOCUMENT_OPENED, 'Page.documentOpened'),
        (PageEvent.FRAME_REQUESTED_NAVIGATION, 'Page.frameRequestedNavigation'),
        (PageEvent.FRAME_RESIZED, 'Page.frameResized'),
        (PageEvent.FRAME_STARTED_LOADING, 'Page.frameStartedLoading'),
        (PageEvent.FRAME_STARTED_NAVIGATING, 'Page.frameStartedNavigating'),
        (PageEvent.FRAME_STOPPED_LOADING, 'Page.frameStoppedLoading'),
        (PageEvent.FRAME_SUBTREE_WILL_BE_DETACHED, 'Page.frameSubtreeWillBeDetached'),
        (PageEvent.NAVIGATED_WITHIN_DOCUMENT, 'Page.navigatedWithinDocument'),
        (PageEvent.SCREENCAST_FRAME, 'Page.screencastFrame'),
        (PageEvent.SCREENCAST_VISIBILITY_CHANGED, 'Page.screencastVisibilityChanged'),
    )
    for member, event_string in expected:
        assert member == event_string


def test_runtime_events():
    """Check the listed RuntimeEvent members against their 'Runtime.*' event strings."""
    expected = (
        (RuntimeEvent.CONSOLE_API_CALLED, 'Runtime.consoleAPICalled'),
        (RuntimeEvent.EXCEPTION_REVOKED, 'Runtime.exceptionRevoked'),
        (RuntimeEvent.EXCEPTION_THROWN, 'Runtime.exceptionThrown'),
        (RuntimeEvent.EXECUTION_CONTEXT_CREATED, 'Runtime.executionContextCreated'),
        (RuntimeEvent.EXECUTION_CONTEXT_DESTROYED, 'Runtime.executionContextDestroyed'),
        (RuntimeEvent.EXECUTION_CONTEXTS_CLEARED, 'Runtime.executionContextsCleared'),
        (RuntimeEvent.INSPECT_REQUESTED, 'Runtime.inspectRequested'),
        (RuntimeEvent.BINDING_CALLED, 'Runtime.bindingCalled'),
    )
    for member, event_string in expected:
        assert member == event_string


def test_storage_events():
    """Check the listed StorageEvent members against their 'Storage.*' event strings."""
    expected = (
        (StorageEvent.CACHE_STORAGE_CONTENT_UPDATED, 'Storage.cacheStorageContentUpdated'),
        (StorageEvent.CACHE_STORAGE_LIST_UPDATED, 'Storage.cacheStorageListUpdated'),
        (StorageEvent.INDEXED_DB_CONTENT_UPDATED, 'Storage.indexedDBContentUpdated'),
        (StorageEvent.INDEXED_DB_LIST_UPDATED, 'Storage.indexedDBListUpdated'),
        (StorageEvent.INTEREST_GROUP_ACCESSED, 'Storage.interestGroupAccessed'),
        (StorageEvent.INTEREST_GROUP_AUCTION_EVENT_OCCURRED, 'Storage.interestGroupAuctionEventOccurred'),
        (StorageEvent.INTEREST_GROUP_AUCTION_NETWORK_REQUEST_CREATED, 'Storage.interestGroupAuctionNetworkRequestCreated'),
        (StorageEvent.SHARED_STORAGE_ACCESSED, 'Storage.sharedStorageAccessed'),
        (StorageEvent.SHARED_STORAGE_WORKLET_OPERATION_EXECUTION_FINISHED, 'Storage.sharedStorageWorkletOperationExecutionFinished'),
        (StorageEvent.STORAGE_BUCKET_CREATED_OR_UPDATED, 'Storage.storageBucketCreatedOrUpdated'),
        (StorageEvent.STORAGE_BUCKET_DELETED, 'Storage.storageBucketDeleted'),
        (StorageEvent.ATTRIBUTION_REPORTING_REPORT_SENT, 'Storage.attributionReportingReportSent'),
        (StorageEvent.ATTRIBUTION_REPORTING_SOURCE_REGISTERED, 'Storage.attributionReportingSourceRegistered'),
        (StorageEvent.ATTRIBUTION_REPORTING_TRIGGER_REGISTERED, 'Storage.attributionReportingTriggerRegistered'),
    )
    for member, event_string in expected:
        assert member == event_string


def test_target_events():
    """Check the listed TargetEvent members against their 'Target.*' event strings."""
    expected = (
        (TargetEvent.RECEIVED_MESSAGE_FROM_TARGET, 'Target.receivedMessageFromTarget'),
        (TargetEvent.TARGET_CRASHED, 'Target.targetCrashed'),
        (TargetEvent.TARGET_CREATED, 'Target.targetCreated'),
        (TargetEvent.TARGET_DESTROYED, 'Target.targetDestroyed'),
        (TargetEvent.TARGET_INFO_CHANGED, 'Target.targetInfoChanged'),
        (TargetEvent.ATTACHED_TO_TARGET, 'Target.attachedToTarget'),
        (TargetEvent.DETACHED_FROM_TARGET, 'Target.detachedFromTarget'),
    )
    for member, event_string in expected:
        assert member == event_string


def test_event_enums_integrity():
    """Test that every event value is a string carrying its domain prefix.

    For each event enum, every member's value must be a ``str`` and must start
    with ``'<Domain>.'`` (for example ``'DOM.'`` for ``DomEvent``). Duplicate
    detection is not performed here.
    """
    # Each enum class paired with the domain prefix its values must carry.
    domain_by_class = {
        BrowserEvent: 'Browser',
        DomEvent: 'DOM',
        FetchEvent: 'Fetch',
        InputEvent: 'Input',
        NetworkEvent: 'Network',
        PageEvent: 'Page',
        RuntimeEvent: 'Runtime',
        StorageEvent: 'Storage',
        TargetEvent: 'Target',
    }

    for event_class, domain_name in domain_by_class.items():
        for event in event_class:
            # The type check comes first so a non-string value fails with a
            # clear message instead of an AttributeError from startswith().
            assert isinstance(event.value, str), f"{event_class.__name__}.{event.name} should be a string"
            assert event.value.startswith(f'{domain_name}.'), \
                f"{event_class.__name__}.{event.name} should start with '{domain_name}.'"


def test_no_duplicate_events():
    """Test that there are no duplicate event values across all enums.

    On failure the assertion message lists the offending values so the
    colliding members can be located without re-running under a debugger.
    """
    event_classes = [
        BrowserEvent, DomEvent, FetchEvent, InputEvent, NetworkEvent,
        PageEvent, RuntimeEvent, StorageEvent, TargetEvent
    ]

    seen = set()
    duplicates = set()
    for event_class in event_classes:
        for event in event_class:
            # A value already seen (in this or an earlier enum) is a duplicate.
            if event.value in seen:
                duplicates.add(event.value)
            seen.add(event.value)

    assert not duplicates, f"Found duplicate event values: {sorted(duplicates)}"


def test_event_enum_completeness():
    """Every event enum must define at least one member."""
    for event_class in (
        BrowserEvent, DomEvent, FetchEvent, InputEvent, NetworkEvent,
        PageEvent, RuntimeEvent, StorageEvent, TargetEvent,
    ):
        # True as soon as iteration yields a first member.
        has_members = any(True for _ in event_class)
        assert has_members, f"{event_class.__name__} should have at least one event"


def test_event_naming_convention():
    """Member names of every event enum must be upper case."""
    enums_under_test = (
        BrowserEvent, DomEvent, FetchEvent, InputEvent, NetworkEvent,
        PageEvent, RuntimeEvent, StorageEvent, TargetEvent,
    )

    for event_class in enums_under_test:
        owner = event_class.__name__
        for event in event_class:
            member_name = event.name
            # str.isupper(): at least one cased character, none of them lowercase.
            assert member_name.isupper(), f"{owner}.{member_name} should be uppercase"
            # Explicit per-character check for stray lowercase letters.
            lowercase_chars = [ch for ch in member_name if ch.islower()]
            assert not lowercase_chars, \
                f"{owner}.{member_name} should not contain lowercase letters"


================================================
FILE: tests/test_exceptions.py
================================================
import pytest
from pydoll.exceptions import (
    # Base exceptions
    PydollException,
    ConnectionException,
    BrowserException,
    ProtocolException,
    ElementException,
    TimeoutException,
    ConfigurationException,
    DialogException,
    
    # Connection exceptions
    ConnectionFailed,
    ReconnectionFailed,
    WebSocketConnectionClosed,
    NetworkError,
    
    # Browser exceptions
    BrowserNotRunning,
    FailedToStartBrowser,
    UnsupportedOS,
    NoValidTabFound,
    
    # Protocol exceptions
    InvalidCommand,
    InvalidResponse,
    ResendCommandFailed,
    CommandExecutionTimeout,
    InvalidCallback,
    EventNotSupported,
    
    # Element exceptions
    ElementNotFound,
    ElementNotVisible,
    ElementNotInteractable,
    ClickIntercepted,
    ElementNotAFileInput,
    
    # Timeout exceptions
    PageLoadTimeout,
    WaitElementTimeout,
    
    # Configuration exceptions
    InvalidOptionsObject,
    InvalidBrowserPath,
    ArgumentAlreadyExistsInOptions,
    InvalidFileExtension,
    
    # Dialog exceptions
    NoDialogPresent,
    
    # IFrame exceptions
    NotAnIFrame,
    InvalidIFrame,
    IFrameNotFound,
)


class TestBaseExceptions:
    """Message checks for the root exception and the category base classes."""

    def test_pydoll_exception_default_message(self):
        """PydollException raised without arguments reports its default text."""
        with pytest.raises(PydollException) as caught:
            raise PydollException()
        assert str(caught.value) == 'An error occurred in Pydoll'

    def test_pydoll_exception_custom_message(self):
        """PydollException reports the message it was constructed with."""
        message = 'Custom error occurred'
        with pytest.raises(PydollException) as caught:
            raise PydollException(message)
        assert str(caught.value) == message

    def test_connection_exception_default(self):
        """ConnectionException raised without arguments reports its default text."""
        with pytest.raises(ConnectionException) as caught:
            raise ConnectionException()
        assert str(caught.value) == 'A connection error occurred'

    def test_connection_exception_custom(self):
        """ConnectionException reports the message it was constructed with."""
        message = 'Custom connection error'
        with pytest.raises(ConnectionException) as caught:
            raise ConnectionException(message)
        assert str(caught.value) == message

    def test_browser_exception_default(self):
        """BrowserException raised without arguments reports its default text."""
        with pytest.raises(BrowserException) as caught:
            raise BrowserException()
        assert str(caught.value) == 'A browser error occurred'

    def test_protocol_exception_default(self):
        """ProtocolException raised without arguments reports its default text."""
        with pytest.raises(ProtocolException) as caught:
            raise ProtocolException()
        assert str(caught.value) == 'A protocol error occurred'

    def test_element_exception_default(self):
        """ElementException raised without arguments reports its default text."""
        with pytest.raises(ElementException) as caught:
            raise ElementException()
        assert str(caught.value) == 'An element interaction error occurred'

    def test_timeout_exception_default(self):
        """TimeoutException raised without arguments reports its default text."""
        with pytest.raises(TimeoutException) as caught:
            raise TimeoutException()
        assert str(caught.value) == 'A timeout occurred'

    def test_configuration_exception_default(self):
        """ConfigurationException raised without arguments reports its default text."""
        with pytest.raises(ConfigurationException) as caught:
            raise ConfigurationException()
        assert str(caught.value) == 'A configuration error occurred'

    def test_dialog_exception_default(self):
        """DialogException raised without arguments reports its default text."""
        with pytest.raises(DialogException) as caught:
            raise DialogException()
        assert str(caught.value) == 'A dialog error occurred'


class TestConnectionExceptions:
    """Message checks for the connection exception family."""

    def test_connection_failed(self):
        """ConnectionFailed raised without arguments reports its default text."""
        with pytest.raises(ConnectionFailed) as caught:
            raise ConnectionFailed()
        assert str(caught.value) == 'Failed to connect to the browser'

    def test_reconnection_failed(self):
        """ReconnectionFailed raised without arguments reports its default text."""
        with pytest.raises(ReconnectionFailed) as caught:
            raise ReconnectionFailed()
        assert str(caught.value) == 'Failed to reconnect to the browser'

    def test_websocket_connection_closed(self):
        """WebSocketConnectionClosed raised without arguments reports its default text."""
        with pytest.raises(WebSocketConnectionClosed) as caught:
            raise WebSocketConnectionClosed()
        assert str(caught.value) == 'The WebSocket connection is closed'

    def test_websocket_connection_closed_custom(self):
        """WebSocketConnectionClosed reports the message it was constructed with."""
        message = 'Connection closed unexpectedly'
        with pytest.raises(WebSocketConnectionClosed) as caught:
            raise WebSocketConnectionClosed(message)
        assert str(caught.value) == message

    def test_network_error(self):
        """NetworkError raised without arguments reports its default text."""
        with pytest.raises(NetworkError) as caught:
            raise NetworkError()
        assert str(caught.value) == 'A network error occurred'


class TestBrowserExceptions:
    """Message checks for the browser exception family."""

    def test_browser_not_running(self):
        """BrowserNotRunning raised without arguments reports its default text."""
        with pytest.raises(BrowserNotRunning) as caught:
            raise BrowserNotRunning()
        assert str(caught.value) == 'The browser is not running'

    def test_failed_to_start_browser(self):
        """FailedToStartBrowser raised without arguments reports its default text."""
        with pytest.raises(FailedToStartBrowser) as caught:
            raise FailedToStartBrowser()
        assert str(caught.value) == 'Failed to start the browser'

    def test_failed_to_start_browser_custom(self):
        """FailedToStartBrowser reports the message it was constructed with."""
        message = 'Browser executable not found'
        with pytest.raises(FailedToStartBrowser) as caught:
            raise FailedToStartBrowser(message)
        assert str(caught.value) == message

    def test_unsupported_os(self):
        """UnsupportedOS raised without arguments reports its default text."""
        with pytest.raises(UnsupportedOS) as caught:
            raise UnsupportedOS()
        assert str(caught.value) == 'Unsupported OS'

    def test_unsupported_os_custom(self):
        """UnsupportedOS reports the message it was constructed with."""
        message = 'This OS is not supported: FreeBSD'
        with pytest.raises(UnsupportedOS) as caught:
            raise UnsupportedOS(message)
        assert str(caught.value) == message

    def test_no_valid_tab_found(self):
        """NoValidTabFound raised without arguments reports its default text."""
        with pytest.raises(NoValidTabFound) as caught:
            raise NoValidTabFound()
        assert str(caught.value) == 'No valid attached tab found'


class TestProtocolExceptions:
    """Message checks for the protocol exception family."""

    def test_invalid_command(self):
        """InvalidCommand raised without arguments reports its default text."""
        with pytest.raises(InvalidCommand) as caught:
            raise InvalidCommand()
        assert str(caught.value) == 'The command provided is invalid'

    def test_invalid_response(self):
        """InvalidResponse raised without arguments reports its default text."""
        with pytest.raises(InvalidResponse) as caught:
            raise InvalidResponse()
        assert str(caught.value) == 'The response received is invalid'

    def test_resend_command_failed(self):
        """ResendCommandFailed raised without arguments reports its default text."""
        with pytest.raises(ResendCommandFailed) as caught:
            raise ResendCommandFailed()
        assert str(caught.value) == 'Failed to resend the command'

    def test_command_execution_timeout(self):
        """CommandExecutionTimeout raised without arguments reports its default text."""
        with pytest.raises(CommandExecutionTimeout) as caught:
            raise CommandExecutionTimeout()
        assert str(caught.value) == 'The command execution timed out'

    def test_command_execution_timeout_custom(self):
        """CommandExecutionTimeout reports the message it was constructed with."""
        message = 'Command timed out after 30 seconds'
        with pytest.raises(CommandExecutionTimeout) as caught:
            raise CommandExecutionTimeout(message)
        assert str(caught.value) == message

    def test_invalid_callback(self):
        """InvalidCallback raised without arguments reports its default text."""
        with pytest.raises(InvalidCallback) as caught:
            raise InvalidCallback()
        assert str(caught.value) == 'The callback provided is invalid'

    def test_event_not_supported(self):
        """EventNotSupported reports a supplied message, else its default text."""
        # Explicit message first
        with pytest.raises(EventNotSupported) as caught:
            raise EventNotSupported('Custom error message')
        assert str(caught.value) == 'Custom error message'

        # Then the no-argument form
        with pytest.raises(EventNotSupported) as caught:
            raise EventNotSupported()
        assert str(caught.value) == 'The event is not supported'


class TestElementExceptions:
    """Message checks for the element exception family."""

    def test_element_not_found(self):
        """ElementNotFound raised without arguments reports its default text."""
        with pytest.raises(ElementNotFound) as caught:
            raise ElementNotFound()
        assert str(caught.value) == 'The specified element was not found'

    def test_element_not_found_custom(self):
        """ElementNotFound reports the message it was constructed with."""
        message = 'Button with ID "submit" not found'
        with pytest.raises(ElementNotFound) as caught:
            raise ElementNotFound(message)
        assert str(caught.value) == message

    def test_element_not_visible(self):
        """ElementNotVisible raised without arguments reports its default text."""
        with pytest.raises(ElementNotVisible) as caught:
            raise ElementNotVisible()
        assert str(caught.value) == 'The element is not visible'

    def test_element_not_interactable(self):
        """ElementNotInteractable raised without arguments reports its default text."""
        with pytest.raises(ElementNotInteractable) as caught:
            raise ElementNotInteractable()
        assert str(caught.value) == 'The element is not interactable'

    def test_click_intercepted(self):
        """ClickIntercepted raised without arguments reports its default text."""
        with pytest.raises(ClickIntercepted) as caught:
            raise ClickIntercepted()
        assert str(caught.value) == 'The click was intercepted'

    def test_click_intercepted_custom(self):
        """ClickIntercepted reports the message it was constructed with."""
        message = 'Click intercepted by overlay element'
        with pytest.raises(ClickIntercepted) as caught:
            raise ClickIntercepted(message)
        assert str(caught.value) == message

    def test_element_not_a_file_input(self):
        """ElementNotAFileInput raised without arguments reports its default text."""
        with pytest.raises(ElementNotAFileInput) as caught:
            raise ElementNotAFileInput()
        assert str(caught.value) == 'The element is not a file input'

    def test_element_not_a_file_input_custom(self):
        """ElementNotAFileInput reports the message it was constructed with."""
        message = 'Expected file input, got text input'
        with pytest.raises(ElementNotAFileInput) as caught:
            raise ElementNotAFileInput(message)
        assert str(caught.value) == message


class TestTimeoutExceptions:
    """Message checks for the timeout exception family."""

    def test_page_load_timeout(self):
        """PageLoadTimeout raised without arguments reports its default text."""
        with pytest.raises(PageLoadTimeout) as caught:
            raise PageLoadTimeout()
        assert str(caught.value) == 'Page load timed out'

    def test_page_load_timeout_custom(self):
        """PageLoadTimeout reports the message it was constructed with."""
        message = 'Page load timed out after 30 seconds'
        with pytest.raises(PageLoadTimeout) as caught:
            raise PageLoadTimeout(message)
        assert str(caught.value) == message

    def test_wait_element_timeout(self):
        """WaitElementTimeout raised without arguments reports its default text."""
        with pytest.raises(WaitElementTimeout) as caught:
            raise WaitElementTimeout()
        assert str(caught.value) == 'Timed out waiting for element to appear'

    def test_wait_element_timeout_custom(self):
        """WaitElementTimeout reports the message it was constructed with."""
        message = 'Element with selector "#button" did not appear within 10 seconds'
        with pytest.raises(WaitElementTimeout) as caught:
            raise WaitElementTimeout(message)
        assert str(caught.value) == message


class TestConfigurationExceptions:
    """Message checks for the configuration exception family."""

    def test_invalid_options_object(self):
        """InvalidOptionsObject raised without arguments reports its default text."""
        with pytest.raises(InvalidOptionsObject) as caught:
            raise InvalidOptionsObject()
        assert str(caught.value) == 'The options object provided is invalid'

    def test_invalid_options_object_custom(self):
        """InvalidOptionsObject reports the message it was constructed with."""
        message = 'Options must be a dictionary'
        with pytest.raises(InvalidOptionsObject) as caught:
            raise InvalidOptionsObject(message)
        assert str(caught.value) == message

    def test_invalid_browser_path(self):
        """InvalidBrowserPath raised without arguments reports its default text."""
        with pytest.raises(InvalidBrowserPath) as caught:
            raise InvalidBrowserPath()
        assert str(caught.value) == 'The browser path provided is invalid'

    def test_invalid_browser_path_custom(self):
        """InvalidBrowserPath reports the message it was constructed with."""
        message = 'Browser not found at /usr/bin/chrome'
        with pytest.raises(InvalidBrowserPath) as caught:
            raise InvalidBrowserPath(message)
        assert str(caught.value) == message

    def test_argument_already_exists_in_options(self):
        """ArgumentAlreadyExistsInOptions raised without arguments reports its default text."""
        with pytest.raises(ArgumentAlreadyExistsInOptions) as caught:
            raise ArgumentAlreadyExistsInOptions()
        assert str(caught.value) == 'The argument already exists in the options'

    def test_argument_already_exists_custom(self):
        """ArgumentAlreadyExistsInOptions reports the message it was constructed with."""
        message = 'Argument --headless already exists'
        with pytest.raises(ArgumentAlreadyExistsInOptions) as caught:
            raise ArgumentAlreadyExistsInOptions(message)
        assert str(caught.value) == message

    def test_invalid_file_extension(self):
        """InvalidFileExtension raised without arguments reports its default text."""
        with pytest.raises(InvalidFileExtension) as caught:
            raise InvalidFileExtension()
        assert str(caught.value) == 'The file extension provided is not supported'


class TestDialogExceptions:
    """Message checks for the dialog exception family."""

    def test_no_dialog_present(self):
        """NoDialogPresent raised without arguments reports its default text."""
        with pytest.raises(NoDialogPresent) as caught:
            raise NoDialogPresent()
        assert str(caught.value) == 'No dialog present on the page'

    def test_no_dialog_present_custom(self):
        """NoDialogPresent reports the message it was constructed with."""
        message = 'Expected alert dialog but none found'
        with pytest.raises(NoDialogPresent) as caught:
            raise NoDialogPresent(message)
        assert str(caught.value) == message


class TestIFrameExceptions:
    """Message checks for the iframe exception family."""

    def test_not_an_iframe(self):
        """NotAnIFrame raised without arguments reports its default text."""
        with pytest.raises(NotAnIFrame) as caught:
            raise NotAnIFrame()
        assert str(caught.value) == 'The element is not an iframe'

    def test_not_an_iframe_custom(self):
        """NotAnIFrame reports the message it was constructed with."""
        message = 'Expected iframe element, got div'
        with pytest.raises(NotAnIFrame) as caught:
            raise NotAnIFrame(message)
        assert str(caught.value) == message

    def test_invalid_iframe(self):
        """InvalidIFrame raised without arguments reports its default text."""
        with pytest.raises(InvalidIFrame) as caught:
            raise InvalidIFrame()
        assert str(caught.value) == 'The iframe is not valid'

    def test_invalid_iframe_custom(self):
        """InvalidIFrame reports the message it was constructed with."""
        message = 'IFrame has no src attribute'
        with pytest.raises(InvalidIFrame) as caught:
            raise InvalidIFrame(message)
        assert str(caught.value) == message

    def test_iframe_not_found(self):
        """IFrameNotFound raised without arguments reports its default text."""
        with pytest.raises(IFrameNotFound) as caught:
            raise IFrameNotFound()
        assert str(caught.value) == 'The iframe was not found'

    def test_iframe_not_found_custom(self):
        """IFrameNotFound reports the message it was constructed with."""
        message = 'IFrame with name "content" not found'
        with pytest.raises(IFrameNotFound) as caught:
            raise IFrameNotFound(message)
        assert str(caught.value) == message


class TestExceptionInheritance:
    """Verify the subclass relationships of the exception hierarchy."""

    def test_all_exceptions_inherit_from_pydoll_exception(self):
        """Every concrete exception must be a subclass of PydollException."""
        concrete_exceptions = (
            ConnectionFailed, ReconnectionFailed, WebSocketConnectionClosed, NetworkError,
            BrowserNotRunning, FailedToStartBrowser, UnsupportedOS, NoValidTabFound,
            InvalidCommand, InvalidResponse, ResendCommandFailed, CommandExecutionTimeout,
            InvalidCallback, EventNotSupported, ElementNotFound, ElementNotVisible,
            ElementNotInteractable, ClickIntercepted, ElementNotAFileInput,
            PageLoadTimeout, WaitElementTimeout, InvalidOptionsObject, InvalidBrowserPath,
            ArgumentAlreadyExistsInOptions, InvalidFileExtension, NoDialogPresent,
            NotAnIFrame, InvalidIFrame, IFrameNotFound,
        )

        for exc_type in concrete_exceptions:
            derives_from_root = issubclass(exc_type, PydollException)
            assert derives_from_root, f"{exc_type.__name__} should inherit from PydollException"

    def test_base_exception_categories(self):
        """Every category base class must be a subclass of PydollException."""
        category_bases = (
            ConnectionException, BrowserException, ProtocolException,
            ElementException, TimeoutException, ConfigurationException, DialogException,
        )

        for exc_type in category_bases:
            derives_from_root = issubclass(exc_type, PydollException)
            assert derives_from_root, f"{exc_type.__name__} should inherit from PydollException"

    def test_connection_exceptions_inherit_from_connection_exception(self):
        """Connection-specific exceptions must be subclasses of ConnectionException."""
        connection_family = (
            ConnectionFailed,
            ReconnectionFailed,
            WebSocketConnectionClosed,
            NetworkError,
        )

        for exc_type in connection_family:
            derives_from_category = issubclass(exc_type, ConnectionException)
            assert derives_from_category, f"{exc_type.__name__} should inherit from ConnectionException"


================================================
FILE: tests/test_find_elements_mixin.py
================================================
import pytest
import re
from unittest.mock import AsyncMock, MagicMock, patch

from pydoll.elements.mixins.find_elements_mixin import FindElementsMixin
from pydoll.elements.utils import SelectorParser
from pydoll.constants import By
from pydoll.exceptions import ElementNotFound, WaitElementTimeout


class MockFindElementsMixin(FindElementsMixin):
    """Bare-bones FindElementsMixin subclass used as a test double."""

    def __init__(self):
        # Starts without an object id; only some tests need one
        self._object_id = None
        # Async-capable mock standing in for the connection handler
        self._connection_handler = AsyncMock()


class TestBuildXPath:
    """Exercise FindElementsMixin._build_xpath over many selector combinations."""

    def test_build_xpath_single_id(self):
        """Only an id is supplied."""
        built = FindElementsMixin._build_xpath(id='test-id')
        assert built == '//*[@id="test-id"]'

    def test_build_xpath_single_class_name(self):
        """Only a class name is supplied."""
        built = FindElementsMixin._build_xpath(class_name='btn-primary')
        assert built == '//*[contains(concat(" ", normalize-space(@class), " "), " btn-primary ")]'

    def test_build_xpath_single_name(self):
        """Only a name attribute is supplied."""
        built = FindElementsMixin._build_xpath(name='username')
        assert built == '//*[@name="username"]'

    def test_build_xpath_single_tag_name(self):
        """Only a tag name is supplied."""
        built = FindElementsMixin._build_xpath(tag_name='button')
        assert built == '//button'

    def test_build_xpath_single_text(self):
        """Only text content is supplied."""
        built = FindElementsMixin._build_xpath(text='Click me')
        assert built == '//*[contains(text(), "Click me")]'

    def test_build_xpath_single_custom_attribute(self):
        """A single custom keyword attribute is supplied."""
        built = FindElementsMixin._build_xpath(data_testid='submit-btn')
        assert built == '//*[@data-testid="submit-btn"]'

    def test_build_xpath_id_and_class(self):
        """An id and a class name are combined in one predicate."""
        built = FindElementsMixin._build_xpath(id='main-btn', class_name='primary')
        assert built == (
            '//*[@id="main-btn" and contains(concat(" ", normalize-space(@class), " "), " primary ")]'
        )

    def test_build_xpath_tag_and_attributes(self):
        """A tag name is combined with several attributes."""
        built = FindElementsMixin._build_xpath(
            tag_name='input',
            id='email-field',
            name='email',
            type='email',
        )
        assert built == '//input[@id="email-field" and @name="email" and @type="email"]'

    def test_build_xpath_all_parameters(self):
        """Every supported parameter plus custom attributes is supplied at once."""
        built = FindElementsMixin._build_xpath(
            id='complex-element',
            class_name='form-control',
            name='user_input',
            tag_name='input',
            text='placeholder text',
            data_role='textbox',
            aria_label='User input field',
        )
        wanted = (
            '//input[@id="complex-element" and '
            'contains(concat(" ", normalize-space(@class), " "), " form-control ") and '
            '@name="user_input" and '
            'contains(text(), "placeholder text") and '
            '@data-role="textbox" and '
            '@aria-label="User input field"]'
        )
        assert built == wanted

    def test_build_xpath_text_with_quotes(self):
        """Text containing double quotes.

        NOTE(review): the expected string embeds the inner quotes verbatim,
        so this pins the current output rather than a well-formed XPath
        literal -- confirm this is intended.
        """
        built = FindElementsMixin._build_xpath(text='Say "Hello"')
        assert built == '//*[contains(text(), "Say "Hello"")]'

    def test_build_xpath_attribute_with_quotes(self):
        """Attribute value containing double quotes.

        NOTE(review): the expected string embeds the inner quotes verbatim,
        so this pins the current output rather than a well-formed XPath
        literal -- confirm this is intended.
        """
        built = FindElementsMixin._build_xpath(title='This is a "quoted" title')
        assert built == '//*[@title="This is a "quoted" title"]'

    def test_build_xpath_empty_values_ignored(self):
        """Empty-string and None values contribute nothing to the XPath."""
        built = FindElementsMixin._build_xpath(
            id='test-id',
            class_name='',  # empty string: expected to be dropped
            name=None,      # None: expected to be dropped
            tag_name='div',
        )
        assert built == '//div[@id="test-id"]'

    def test_build_xpath_class_name_with_spaces(self):
        """Edge case: a class name value that itself contains spaces."""
        built = FindElementsMixin._build_xpath(class_name='btn primary large')
        assert built == (
            '//*[contains(concat(" ", normalize-space(@class), " "), " btn primary large ")]'
        )

    def test_build_xpath_special_characters_in_attributes(self):
        """Attribute values containing special characters."""
        built = FindElementsMixin._build_xpath(
            data_value='test@example.com',
            aria_describedby='field-help-123',
        )
        assert built == '//*[@data-value="test@example.com" and @aria-describedby="field-help-123"]'

    def test_build_xpath_numeric_attribute_values(self):
        """Attribute values made of digits (passed as strings)."""
        built = FindElementsMixin._build_xpath(
            tabindex='0',
            maxlength='255',
        )
        assert built == '//*[@tabindex="0" and @maxlength="255"]'

    def test_build_xpath_no_parameters(self):
        """No parameters at all yields the match-everything selector."""
        built = FindElementsMixin._build_xpath()
        assert built == '//*'

    def test_build_xpath_only_tag_name(self):
        """Only a tag name is supplied (second tag value)."""
        built = FindElementsMixin._build_xpath(tag_name='span')
        assert built == '//span'

    def test_build_xpath_hyphenated_attributes(self):
        """Attribute names that already contain hyphens, passed via ** expansion."""
        hyphenated = {'data-test-id': 'submit-button', 'aria-label': 'Submit form'}
        built = FindElementsMixin._build_xpath(**hyphenated)
        assert built == '//*[@data-test-id="submit-button" and @aria-label="Submit form"]'


class TestGetExpressionType:
    """Exercise FindElementsMixin._get_expression_type classification."""

    def test_xpath_double_slash(self):
        """An expression starting with '//' is classified as XPath."""
        detected = FindElementsMixin._get_expression_type('//div')
        assert detected == By.XPATH

    def test_xpath_dot_double_slash(self):
        """An expression starting with './/' is classified as XPath."""
        detected = FindElementsMixin._get_expression_type('.//span')
        assert detected == By.XPATH

    def test_xpath_dot_slash(self):
        """An expression starting with './' is classified as XPath."""
        detected = FindElementsMixin._get_expression_type('./button')
        assert detected == By.XPATH

    def test_xpath_single_slash(self):
        """An expression starting with '/' is classified as XPath."""
        detected = FindElementsMixin._get_expression_type('/html/body')
        assert detected == By.XPATH

    def test_css_selector_default(self):
        """A plain CSS selector is classified as CSS."""
        detected = FindElementsMixin._get_expression_type('div.content > p')
        assert detected == By.CSS_SELECTOR

    def test_css_selector_attribute(self):
        """A CSS attribute selector is classified as CSS."""
        detected = FindElementsMixin._get_expression_type('input[type="text"]')
        assert detected == By.CSS_SELECTOR

    def test_css_selector_pseudo_class(self):
        """A CSS selector with a pseudo-class is classified as CSS."""
        detected = FindElementsMixin._get_expression_type('button:hover')
        assert detected == By.CSS_SELECTOR

    def test_css_selector_not_xpath(self):
        """A CSS class selector ('.x') is not mistaken for an XPath './x'."""
        css_kind = FindElementsMixin._get_expression_type('.button')
        assert css_kind == By.CSS_SELECTOR
        xpath_kind = FindElementsMixin._get_expression_type('./button')
        assert xpath_kind == By.XPATH

    def test_complex_xpath_expressions(self):
        """Longer XPath expressions with predicates are classified as XPath."""
        samples = (
            '//div[@class="content"]/p[contains(text(), "Hello")]',
            './/button[position()=1]',
            './/*[@id="test" and @class="active"]',
            '/html/body/div[1]/form/input[@type="submit"]',
        )
        for expression in samples:
            detected = FindElementsMixin._get_expression_type(expression)
            assert detected == By.XPATH

    def test_edge_case_expressions(self):
        """The empty string is classified as CSS."""
        detected = FindElementsMixin._get_expression_type('')
        assert detected == By.CSS_SELECTOR

    def test_xpath_with_parentheses_and_predicate(self):
        """Parenthesised XPath such as (//div)[last()] is classified as XPath."""
        samples = (
            '(//div)[last()]',
            '(//span[@class="btn"])[1]',
            '(/html/body/div)[position()=1]',
        )
        for expression in samples:
            detected = FindElementsMixin._get_expression_type(expression)
            assert detected == By.XPATH


class TestEnsureRelativeXPath:
    """Exercise FindElementsMixin._ensure_relative_xpath."""

    def test_absolute_xpath_becomes_relative(self):
        """A '//'-rooted expression comes back prefixed with a dot."""
        relative = FindElementsMixin._ensure_relative_xpath('//div[@id="test"]')
        assert relative == './/div[@id="test"]'

    def test_already_relative_xpath_unchanged(self):
        """A './/'-prefixed expression comes back as given."""
        relative = FindElementsMixin._ensure_relative_xpath('.//div[@id="test"]')
        assert relative == './/div[@id="test"]'

    def test_dot_slash_xpath_unchanged(self):
        """A './'-prefixed expression comes back as given."""
        relative = FindElementsMixin._ensure_relative_xpath('./button')
        assert relative == './button'

    def test_single_slash_xpath_becomes_relative(self):
        """A '/'-rooted expression comes back prefixed with a dot."""
        relative = FindElementsMixin._ensure_relative_xpath('/html/body/div')
        assert relative == './html/body/div'

    def test_empty_xpath(self):
        """The empty string comes back as a lone dot."""
        relative = FindElementsMixin._ensure_relative_xpath('')
        assert relative == '.'

    def test_complex_xpath_expressions(self):
        """Several predicate-bearing expressions, checked pairwise."""
        pairs = (
            ('//div[contains(@class, "test")]', './/div[contains(@class, "test")]'),
            ('.//span[@id="existing"]', './/span[@id="existing"]'),
            ('//*[@data-test="value"]', './/*[@data-test="value"]'),
            ('//button[text()="Submit"]', './/button[text()="Submit"]'),
        )

        for given, wanted in pairs:
            relative = FindElementsMixin._ensure_relative_xpath(given)
            assert relative == wanted


class TestGetByAndValue:
    """Exercise ``_get_by_and_value`` with keyword-based selectors.

    The method receives a keyword-to-``By`` lookup plus the selector keywords
    and returns a ``(by, value)`` pair; the tests check both members.
    """

    def setup_method(self):
        """Create a fresh mixin and the keyword-to-``By`` lookup for each test."""
        self.mixin = MockFindElementsMixin()
        self.by_map = dict(
            id=By.ID,
            class_name=By.CLASS_NAME,
            name=By.NAME,
            tag_name=By.TAG_NAME,
            xpath=By.XPATH,
        )

    def test_single_id_selector(self):
        """A lone ``id`` keyword maps straight to ``By.ID``."""
        strategy, selector = self.mixin._get_by_and_value(self.by_map, id='test-id')
        assert strategy == By.ID
        assert selector == 'test-id'

    def test_single_class_name_selector(self):
        """A lone ``class_name`` keyword maps straight to ``By.CLASS_NAME``."""
        strategy, selector = self.mixin._get_by_and_value(
            self.by_map, class_name='btn-primary'
        )
        assert strategy == By.CLASS_NAME
        assert selector == 'btn-primary'

    def test_single_name_selector(self):
        """A lone ``name`` keyword maps straight to ``By.NAME``."""
        strategy, selector = self.mixin._get_by_and_value(self.by_map, name='username')
        assert strategy == By.NAME
        assert selector == 'username'

    def test_single_tag_name_selector(self):
        """A lone ``tag_name`` keyword maps straight to ``By.TAG_NAME``."""
        strategy, selector = self.mixin._get_by_and_value(self.by_map, tag_name='button')
        assert strategy == By.TAG_NAME
        assert selector == 'button'

    def test_single_custom_attribute(self):
        """A keyword absent from the lookup is expressed as an XPath predicate."""
        strategy, selector = self.mixin._get_by_and_value(
            self.by_map, data_testid='submit-btn'
        )
        assert strategy == By.XPATH
        assert selector == '//*[@data-testid="submit-btn"]'

    def test_multiple_attributes_build_xpath(self):
        """Two standard keywords together are combined into a single XPath."""
        wanted = (
            '//*[@id="test-id" and '
            'contains(concat(" ", normalize-space(@class), " "), " btn-primary ")]'
        )
        strategy, selector = self.mixin._get_by_and_value(
            self.by_map, id='test-id', class_name='btn-primary'
        )
        assert strategy == By.XPATH
        assert selector == wanted

    def test_text_with_single_attribute_builds_xpath(self):
        """``text`` combined with another keyword yields an XPath."""
        wanted = '//*[@id="test-id" and contains(text(), "Click me")]'
        strategy, selector = self.mixin._get_by_and_value(
            self.by_map, id='test-id', text='Click me'
        )
        assert strategy == By.XPATH
        assert selector == wanted

    def test_text_alone_builds_xpath(self):
        """``text`` on its own yields an XPath."""
        strategy, selector = self.mixin._get_by_and_value(self.by_map, text='Submit')
        assert strategy == By.XPATH
        assert selector == '//*[contains(text(), "Submit")]'

    def test_empty_values_ignored(self):
        """Empty-string and ``None`` keywords do not count as criteria."""
        strategy, selector = self.mixin._get_by_and_value(
            self.by_map,
            id='test-id',
            class_name='',  # empty string must be skipped
            name=None,  # None must be skipped
        )
        assert strategy == By.ID
        assert selector == 'test-id'

    def test_all_empty_values_with_custom_attribute(self):
        """A custom attribute is still used when every standard keyword is empty."""
        strategy, selector = self.mixin._get_by_and_value(
            self.by_map, id='', class_name=None, data_role='button'
        )
        assert strategy == By.XPATH
        assert selector == '//*[@data-role="button"]'


class TestFindElementsMixinEdgeCases:
    """Test edge cases and error conditions in FindElementsMixin.

    Covers argument validation in ``find``, strategy selection in ``query``,
    the polling behaviour of ``find_or_wait_element`` (with the event-loop
    clock and ``asyncio.sleep`` patched), and a few ``_build_xpath`` corner
    cases.
    """

    def setup_method(self):
        """Set up test fixtures."""
        self.mixin = MockFindElementsMixin()

    @pytest.mark.asyncio
    async def test_find_no_criteria_raises_error(self):
        """Test that find with no criteria raises ValueError."""
        with pytest.raises(ValueError, match='At least one of the following arguments must be provided'):
            await self.mixin.find()

    @pytest.mark.asyncio
    async def test_find_empty_string_criteria_raises_error(self):
        """Test that find with only empty string criteria raises ValueError."""
        with pytest.raises(ValueError, match='At least one of the following arguments must be provided'):
            await self.mixin.find(id='', class_name='', name='', tag_name='', text='')

    @pytest.mark.asyncio
    async def test_find_none_criteria_raises_error(self):
        """Test that find with only None criteria raises ValueError."""
        with pytest.raises(ValueError, match='At least one of the following arguments must be provided'):
            await self.mixin.find(id=None, class_name=None, name=None, tag_name=None, text=None)

    @pytest.mark.asyncio
    async def test_find_with_custom_attributes_only(self):
        """Test find with only custom attributes works."""
        # Replace the low-level lookup so only the arguments it receives matter.
        self.mixin._find_element = AsyncMock(return_value=MagicMock())

        await self.mixin.find(data_testid='submit-button')

        # Should call _find_element with XPath
        self.mixin._find_element.assert_called_once()
        call_args = self.mixin._find_element.call_args[0]
        assert call_args[0] == By.XPATH
        assert '@data-testid="submit-button"' in call_args[1]

    @pytest.mark.asyncio
    async def test_query_empty_expression(self):
        """Test query with empty expression."""
        self.mixin._find_element = AsyncMock(return_value=MagicMock())

        await self.mixin.query('')

        # Should call _find_element with CSS_SELECTOR (default)
        self.mixin._find_element.assert_called_once()
        call_args = self.mixin._find_element.call_args[0]
        assert call_args[0] == By.CSS_SELECTOR
        assert call_args[1] == ''

    @pytest.mark.asyncio
    async def test_find_or_wait_element_timeout_zero(self):
        """Test find_or_wait_element with timeout=0 calls find immediately."""
        self.mixin._find_element = AsyncMock(return_value=MagicMock())

        await self.mixin.find_or_wait_element(By.ID, 'test-id', timeout=0)

        self.mixin._find_element.assert_called_once_with(By.ID, 'test-id', raise_exc=True)

    @pytest.mark.asyncio
    async def test_find_or_wait_element_timeout_success_on_retry(self):
        """Test find_or_wait_element succeeds on retry within timeout."""
        # First call returns None, second call returns element
        mock_element = MagicMock()
        self.mixin._find_element = AsyncMock(side_effect=[None, mock_element])

        with patch('asyncio.sleep') as mock_sleep, \
             patch('asyncio.get_event_loop') as mock_loop:
            # Mock time progression
            mock_loop.return_value.time.side_effect = [0, 0.5, 1.0]

            result = await self.mixin.find_or_wait_element(
                By.ID, 'test-id', timeout=2, raise_exc=False
            )

        assert result == mock_element
        assert self.mixin._find_element.call_count == 2
        mock_sleep.assert_called_once_with(0.5)

    @pytest.mark.asyncio
    async def test_find_or_wait_element_timeout_failure(self):
        """Test find_or_wait_element raises WaitElementTimeout."""
        self.mixin._find_element = AsyncMock(return_value=None)

        # asyncio.sleep is patched only to avoid real waiting; its calls are
        # not inspected, so the mock is left unbound.
        with patch('asyncio.sleep'), \
             patch('asyncio.get_event_loop') as mock_loop:
            # Mock time progression that exceeds timeout
            mock_loop.return_value.time.side_effect = [0, 0.5, 1.0, 1.5, 2.1]

            with pytest.raises(WaitElementTimeout):
                await self.mixin.find_or_wait_element(
                    By.ID, 'test-id', timeout=2, raise_exc=True
                )

    @pytest.mark.asyncio
    async def test_find_or_wait_element_timeout_failure_no_exception(self):
        """Test find_or_wait_element returns None when raise_exc=False."""
        self.mixin._find_element = AsyncMock(return_value=None)

        # asyncio.sleep is patched only to avoid real waiting; its calls are
        # not inspected, so the mock is left unbound.
        with patch('asyncio.sleep'), \
             patch('asyncio.get_event_loop') as mock_loop:
            # Mock time progression that exceeds timeout
            mock_loop.return_value.time.side_effect = [0, 0.5, 1.0, 1.5, 2.1]

            result = await self.mixin.find_or_wait_element(
                By.ID, 'test-id', timeout=2, raise_exc=False
            )

        assert result is None

    @pytest.mark.asyncio
    async def test_find_elements_with_timeout(self):
        """Test find with find_all=True and timeout."""
        mock_elements = [MagicMock(), MagicMock()]
        self.mixin._find_elements = AsyncMock(return_value=mock_elements)

        result = await self.mixin.find_or_wait_element(
            By.CLASS_NAME, 'item', timeout=1, find_all=True
        )

        assert result == mock_elements
        self.mixin._find_elements.assert_called_once()

    def test_regex_pattern_in_get_expression_type(self):
        """Test the regex pattern used in _get_expression_type.

        NOTE(review): the pattern is duplicated here rather than read from the
        implementation, so this only validates the local copy -- confirm it
        still mirrors ``_get_expression_type``.
        """
        xpath_pattern = r'^(//|\.//|\.\/|/)'

        # Test cases that should match
        xpath_expressions = [
            '//div',
            './/span',
            './button',
            '/html/body'
        ]

        for expr in xpath_expressions:
            assert re.match(xpath_pattern, expr), f"Pattern should match: {expr}"

        # Test cases that should not match
        non_xpath_expressions = [
            'div.class',
            '#id',
            '.class',
            'input[type="text"]',
            'button:hover'
        ]

        for expr in non_xpath_expressions:
            assert not re.match(xpath_pattern, expr), f"Pattern should not match: {expr}"

    def test_xpath_building_with_boolean_attributes(self):
        """Test XPath building with boolean-like attributes."""
        xpath = FindElementsMixin._build_xpath(
            required='true',
            disabled='false',
            checked='checked'
        )
        expected = '//*[@required="true" and @disabled="false" and @checked="checked"]'
        assert xpath == expected

    def test_xpath_building_preserves_attribute_order(self):
        """Test that XPath building maintains consistent attribute order.

        Builds the same selector several times, checks every condition is
        present in each result, and checks that all results are identical.
        """
        builds = [
            FindElementsMixin._build_xpath(
                id='test',
                class_name='btn',
                name='submit',
                data_role='button'
            )
            for _ in range(5)
        ]

        for xpath in builds:
            assert '@id="test"' in xpath
            assert 'contains(concat(" ", normalize-space(@class), " "), " btn ")' in xpath
            assert '@name="submit"' in xpath
            assert '@data-role="button"' in xpath

        # Identical keyword arguments must always serialize to the same
        # string; any reordering between calls would show up as a second
        # distinct value here.
        assert len(set(builds)) == 1

    def test_xpath_building_with_unicode_characters(self):
        """Test XPath building with Unicode characters."""
        xpath = FindElementsMixin._build_xpath(
            text='Olá mundo',
            title='Título com acentos',
            placeholder='Escreva aqui...'
        )
        expected = '//*[contains(text(), "Olá mundo") and @title="Título com acentos" and @placeholder="Escreva aqui..."]'
        assert xpath == expected

    def test_class_name_xpath_normalization(self):
        """Test that class name XPath uses proper normalization."""
        xpath = FindElementsMixin._build_xpath(class_name='test-class')

        # Should use normalize-space to handle multiple spaces
        assert 'normalize-space(@class)' in xpath
        # Should wrap with spaces to match exact class names
        assert '" test-class "' in xpath
        # Should use concat to add spaces
        assert 'concat(" "' in xpath


class TestUnderscoreToHyphenConversion:
    """Check that ``_build_xpath`` rewrites ``_`` as ``-`` in attribute names.

    Keyword names cannot contain hyphens, so callers spell ``data-test`` as
    ``data_test``; these tests pin the attribute names that end up in the
    generated XPath.
    """

    def test_single_underscore_to_hyphen(self):
        """One underscore in the keyword becomes one hyphen."""
        built = FindElementsMixin._build_xpath(data_test='submit-button')
        assert built == '//*[@data-test="submit-button"]'

    def test_multiple_underscores_to_hyphens(self):
        """Every underscore in a keyword is converted."""
        built = FindElementsMixin._build_xpath(data_test_id='submit-button')
        assert built == '//*[@data-test-id="submit-button"]'

    def test_aria_attributes_conversion(self):
        """``aria_*`` keywords are emitted as ``aria-*`` attributes."""
        built = FindElementsMixin._build_xpath(
            aria_label='Submit form', aria_describedby='helper-text'
        )
        for fragment in (
            '@aria-label="Submit form"',
            '@aria-describedby="helper-text"',
        ):
            assert fragment in built

    def test_data_attributes_conversion(self):
        """``data_*`` keywords are emitted as ``data-*`` attributes."""
        built = FindElementsMixin._build_xpath(
            data_testid='main-button', data_value='123', data_action='submit'
        )
        for fragment in (
            '@data-testid="main-button"',
            '@data-value="123"',
            '@data-action="submit"',
        ):
            assert fragment in built

    def test_mixed_underscore_and_hyphen_attributes(self):
        """Names that already contain hyphens pass through untouched."""
        # A hyphenated name can only be supplied through dict unpacking.
        hyphenated = {'already-hyphenated': 'value2'}
        built = FindElementsMixin._build_xpath(data_test='value1', **hyphenated)
        assert '@data-test="value1"' in built
        assert '@already-hyphenated="value2"' in built

    def test_combined_standard_and_custom_attributes(self):
        """Standard keywords and converted custom keywords coexist."""
        built = FindElementsMixin._build_xpath(
            id='main-element',
            class_name='btn',
            data_testid='submit-btn',
            aria_label='Submit button',
        )
        for fragment in (
            '@id="main-element"',
            'contains(concat(" ", normalize-space(@class), " "), " btn ")',
            '@data-testid="submit-btn"',
            '@aria-label="Submit button"',
        ):
            assert fragment in built

    def test_underscore_in_attribute_value_unchanged(self):
        """Only the attribute name is rewritten; the value keeps its underscores."""
        built = FindElementsMixin._build_xpath(data_test='some_value_with_underscores')
        assert built == '//*[@data-test="some_value_with_underscores"]'
        # The value must appear verbatim.
        assert 'some_value_with_underscores' in built

    def test_complex_attribute_names_conversion(self):
        """Framework-style keywords (ng, v, x-bind) are converted as well."""
        built = FindElementsMixin._build_xpath(
            ng_repeat='item in items', v_model='username', x_bind_value='someValue'
        )
        for fragment in (
            '@ng-repeat="item in items"',
            '@v-model="username"',
            '@x-bind-value="someValue"',
        ):
            assert fragment in built

    def test_single_character_segments(self):
        """Keywords made of one-letter segments are converted segment by segment."""
        built = FindElementsMixin._build_xpath(a_b_c='value1', x_y='value2')
        assert '@a-b-c="value1"' in built
        assert '@x-y="value2"' in built

    def test_no_underscores_unchanged(self):
        """Keywords without underscores are emitted under the same name."""
        built = FindElementsMixin._build_xpath(
            role='button', type='submit', disabled='true'
        )
        for fragment in ('@role="button"', '@type="submit"', '@disabled="true"'):
            assert fragment in built

    def test_trailing_and_leading_underscores(self):
        """Underscores at either end of the keyword are converted too."""
        built = FindElementsMixin._build_xpath(
            _private='value1', public_='value2', _both_='value3'
        )
        # Edge underscores are not special-cased: each one becomes a hyphen.
        for fragment in (
            '@-private="value1"',
            '@public-="value2"',
            '@-both-="value3"',
        ):
            assert fragment in built

    def test_conversion_with_text_parameter(self):
        """The ``text`` condition and a converted attribute appear together."""
        built = FindElementsMixin._build_xpath(
            text='Button text', data_testid='submit-btn'
        )
        assert 'contains(text(), "Button text")' in built
        assert '@data-testid="submit-btn"' in built

    def test_conversion_with_tag_name(self):
        """``tag_name`` sets the node test while attributes are still converted."""
        built = FindElementsMixin._build_xpath(
            tag_name='button', data_test='submit', aria_label='Submit form'
        )
        assert built.startswith('//button')
        assert '@data-test="submit"' in built
        assert '@aria-label="Submit form"' in built


class TestUnderscoreConversionWithGetByAndValue:
    """Check underscore-to-hyphen conversion when going through ``_get_by_and_value``."""

    def setup_method(self):
        """Create a fresh mixin and the keyword-to-``By`` lookup for each test."""
        self.mixin = MockFindElementsMixin()
        self.by_map = dict(
            id=By.ID,
            class_name=By.CLASS_NAME,
            name=By.NAME,
            tag_name=By.TAG_NAME,
            xpath=By.XPATH,
        )

    def test_custom_attribute_with_underscore(self):
        """A single custom keyword yields an XPath with the hyphenated name."""
        strategy, selector = self.mixin._get_by_and_value(
            self.by_map, data_testid='submit-button'
        )
        assert strategy == By.XPATH
        assert '@data-testid="submit-button"' in selector

    def test_multiple_custom_attributes_with_underscores(self):
        """Several custom keywords are all converted in the same XPath."""
        strategy, selector = self.mixin._get_by_and_value(
            self.by_map, data_test='value1', aria_label='value2', ng_model='value3'
        )
        assert strategy == By.XPATH
        for fragment in (
            '@data-test="value1"',
            '@aria-label="value2"',
            '@ng-model="value3"',
        ):
            assert fragment in selector

    def test_standard_and_custom_attributes_mixed(self):
        """A standard keyword plus custom keywords produce one combined XPath."""
        strategy, selector = self.mixin._get_by_and_value(
            self.by_map, id='main-btn', data_testid='submit', aria_label='Submit'
        )
        assert strategy == By.XPATH
        for fragment in (
            '@id="main-btn"',
            '@data-testid="submit"',
            '@aria-label="Submit"',
        ):
            assert fragment in selector


class TestFindElementsSymbolFiltering:
    """Check that Symbol-named properties are dropped from element query results."""

    def setup_method(self):
        """Create a fresh mixin for each test."""
        self.mixin = MockFindElementsMixin()

    @pytest.mark.asyncio
    async def test_find_elements_filters_symbol_properties(self):
        """Only the two index-named object entries become elements."""
        # Property listing with two indexed entries, one Symbol-named object
        # entry and the numeric ``length`` entry.
        listed_properties = [
            {'name': '0', 'value': {'type': 'object', 'objectId': 'el-1'}},
            {'name': '1', 'value': {'type': 'object', 'objectId': 'el-2'}},
            {'name': 'Symbol(Symbol.unscopables)', 'value': {'type': 'object', 'objectId': 'sym'}},
            {'name': 'length', 'value': {'type': 'number', 'value': 2}},
        ]
        lookup_reply = {'result': {'result': {'objectId': 'arr'}}}
        properties_reply = {'result': {'result': listed_properties}}
        node_reply = {'result': {'node': {'nodeName': 'A', 'attributes': []}}}

        # Replies are consumed in order: the lookup, the property listing,
        # then one node description per expected element.
        scripted_replies = [lookup_reply, properties_reply] + [node_reply] * 2
        self.mixin._connection_handler.execute_command.side_effect = scripted_replies

        found = await self.mixin._find_elements(By.CSS_SELECTOR, 'a')

        assert len(found) == 2


class TestParseIframeSegmentsXPath:
    """Exercise ``SelectorParser.parse_iframe_segments_xpath`` -- synchronous, no mocks."""

    # (expression, selectors expected after splitting at each iframe boundary)
    SPLIT_CASES = [
        # basic iframe crossing
        ('//iframe/body', ['//iframe', '//body']),
        # iframe with attribute predicate
        ('//iframe[@src*="example.com"]/body', ['//iframe[@src*="example.com"]', '//body']),
        # slashes inside a quoted attribute value
        ('//iframe[@src="url/with/slashes"]/body', ['//iframe[@src="url/with/slashes"]', '//body']),
        # iframe not at the root, simple
        ('//div/iframe/div', ['//div/iframe', '//div']),
        # iframe not at the root, with attributes
        ('//div[@class="wrapper"]/iframe/body', ['//div[@class="wrapper"]/iframe', '//body']),
        # case-insensitive tag, upper case
        ('//IFRAME/body', ['//IFRAME', '//body']),
        # case-insensitive tag, mixed case
        ('//IFrame/body', ['//IFrame', '//body']),
        # nested iframes
        ('//iframe/iframe/div', ['//iframe', '//iframe', '//div']),
        # nested iframes with attributes
        (
            '//iframe[@src="a"]/div/iframe[@id="inner"]/span',
            ['//iframe[@src="a"]', '//div/iframe[@id="inner"]', '//span'],
        ),
        # bracket characters inside a quoted attribute value
        ('//iframe[@src="a[1]/b"]/body', ['//iframe[@src="a[1]/b"]', '//body']),
        # several steps after the iframe
        ('//iframe[@src*="cloudflare"]/body/div', ['//iframe[@src*="cloudflare"]', '//body/div']),
        # contains() predicate whose string argument is "iframe"
        (
            '//iframe[contains(@src, "iframe")]/body',
            ['//iframe[contains(@src, "iframe")]', '//body'],
        ),
        # predicate with several conditions
        ('//iframe[@src="a" and @id="b"]/body', ['//iframe[@src="a" and @id="b"]', '//body']),
        # position() predicate
        ('//iframe[position()=1]/body', ['//iframe[position()=1]', '//body']),
        # not() predicate
        ('//iframe[not(@disabled)]/body', ['//iframe[not(@disabled)]', '//body']),
        # grouped expression
        ('(//iframe)[1]/body', ['(//iframe)[1]', '//body']),
    ]

    # Expressions that must come back as one unsplit segment.
    UNSPLIT_CASES = [
        '//iframe',
        '//iframe[@src="example.com"]',
        './/iframe',
        '//div[contains(@class, "iframe")]/p',
        '//div[@data-iframe="true"]/p',
        '//body/div/span',
        '//div[@title="This is an iframe container"]/span',
    ]

    @pytest.mark.parametrize('expression, expected_selectors', SPLIT_CASES)
    def test_splits(self, expression, expected_selectors):
        """Each parsed segment is an XPath pair matching the expected selector."""
        parsed = SelectorParser.parse_iframe_segments_xpath(expression)
        assert len(parsed) == len(expected_selectors)
        for position, wanted in enumerate(expected_selectors):
            strategy, selector = parsed[position]
            assert strategy == By.XPATH
            assert selector == wanted

    @pytest.mark.parametrize('expression', UNSPLIT_CASES)
    def test_no_split(self, expression):
        """The expression is returned as a single, unmodified XPath segment."""
        parsed = SelectorParser.parse_iframe_segments_xpath(expression)
        assert len(parsed) == 1
        only_segment = parsed[0]
        assert only_segment == (By.XPATH, expression)


class TestParseIframeSegmentsCSS:
    """Exercise ``SelectorParser.parse_iframe_segments_css`` -- synchronous, no mocks."""

    # (expression, selectors expected after splitting at each iframe boundary)
    SPLIT_CASES = [
        # basic ">" combinator
        ('iframe > body', ['iframe', 'body']),
        # iframe with attribute
        ('iframe[src*="example"] > body', ['iframe[src*="example"]', 'body']),
        # descendant (space) combinator
        ('iframe body', ['iframe', 'body']),
        # descendant combinator with attribute
        ('iframe[src*="..."] body', ['iframe[src*="..."]', 'body']),
        # case-insensitive tag, upper case
        ('IFRAME > body', ['IFRAME', 'body']),
        # case-insensitive tag, mixed case
        ('IFrame > body', ['IFrame', 'body']),
        # nested iframes
        ('iframe > iframe > div', ['iframe', 'iframe', 'div']),
        # pseudo-class on the iframe
        ('iframe:nth-child(2) > body', ['iframe:nth-child(2)', 'body']),
        # ">" inside a quoted attribute value
        (
            'iframe[src="value with > arrow"] > body',
            ['iframe[src="value with > arrow"]', 'body'],
        ),
        # attribute selector before the iframe
        ('[data-iframe] iframe > body', ['[data-iframe] iframe', 'body']),
        # several steps after the iframe
        (
            'iframe[src*="cloudflare"] > body > div.target',
            ['iframe[src*="cloudflare"]', 'body > div.target'],
        ),
        # simple prefix before the iframe
        ('div > iframe > div', ['div > iframe', 'div']),
        # descendant combinator with prefix
        ('div iframe > body', ['div iframe', 'body']),
        # child combinator with prefix
        ('div > iframe > body', ['div > iframe', 'body']),
        # nested iframes with attributes
        (
            'iframe[src*="a"] > div > iframe[id="inner"] > span',
            ['iframe[src*="a"]', 'div > iframe[id="inner"]', 'span'],
        ),
        # extra spaces around the combinator
        ('iframe  >  body', ['iframe', 'body']),
    ]

    # Expressions that must come back as one unsplit segment.
    UNSPLIT_CASES = [
        '.iframe > body',
        '#iframe > body',
        'div.iframe > body',
        ':not(iframe) > body',
        ':is(iframe, div) > body',
        'iframe[src*="..."]',
        'iframe',
        'div > span > p',
        '[data-type="iframe"] > body',
    ]

    @pytest.mark.parametrize('expression, expected_selectors', SPLIT_CASES)
    def test_splits(self, expression, expected_selectors):
        """Each parsed segment is a CSS pair matching the expected selector."""
        parsed = SelectorParser.parse_iframe_segments_css(expression)
        assert len(parsed) == len(expected_selectors)
        for position, wanted in enumerate(expected_selectors):
            strategy, selector = parsed[position]
            assert strategy == By.CSS_SELECTOR
            assert selector == wanted

    @pytest.mark.parametrize('expression', UNSPLIT_CASES)
    def test_no_split(self, expression):
        """The expression is returned as a single, unmodified CSS segment."""
        parsed = SelectorParser.parse_iframe_segments_css(expression)
        assert len(parsed) == 1
        only_segment = parsed[0]
        assert only_segment == (By.CSS_SELECTOR, expression)


class TestFindAcrossIframes:
    """Tests for _find_across_iframes and _attempt_find_across_iframes.

    The tests only call ``find_or_wait_element``: each one stubs
    ``_find_element`` (or ``_find_elements``) on the mixin and on mocked
    iframes, then checks which selector segment every stub received.
    """

    def setup_method(self):
        """Give every test a fresh mixin instance."""
        self.mixin = MockFindElementsMixin()

    @staticmethod
    def _iframe_resolving_to(found):
        """Return a mock iframe whose ``_find_element`` resolves to ``found``."""
        frame = MagicMock()
        frame.is_iframe = True
        frame._find_element = AsyncMock(return_value=found)
        return frame

    @pytest.mark.asyncio
    async def test_css_single_iframe_crossing(self):
        """CSS 'iframe > body': look up the iframe, then ``body`` inside it."""
        frame = self._iframe_resolving_to(MagicMock(name='body'))
        self.mixin._find_element = AsyncMock(return_value=frame)

        found = await self.mixin.find_or_wait_element(
            By.CSS_SELECTOR, 'iframe > body', timeout=0
        )

        # The page-level lookup receives only the iframe segment ...
        self.mixin._find_element.assert_called_once_with(
            By.CSS_SELECTOR, 'iframe', raise_exc=False
        )
        # ... and the iframe itself is asked for the remainder.
        frame._find_element.assert_called_once_with(
            By.CSS_SELECTOR, 'body', raise_exc=False
        )
        assert found is not None

    @pytest.mark.asyncio
    async def test_xpath_single_iframe_crossing(self):
        """XPath '//iframe/body': look up the iframe, then ``//body`` inside it."""
        frame = self._iframe_resolving_to(MagicMock(name='body'))
        self.mixin._find_element = AsyncMock(return_value=frame)

        found = await self.mixin.find_or_wait_element(
            By.XPATH, '//iframe/body', timeout=0
        )

        self.mixin._find_element.assert_called_once_with(
            By.XPATH, '//iframe', raise_exc=False
        )
        frame._find_element.assert_called_once_with(
            By.XPATH, '//body', raise_exc=False
        )
        assert found is not None

    @pytest.mark.asyncio
    async def test_nested_iframe_crossing(self):
        """CSS 'iframe > iframe > div': three segments, one lookup per level."""
        target_div = MagicMock(name='div')
        inner_frame = self._iframe_resolving_to(target_div)
        outer_frame = self._iframe_resolving_to(inner_frame)
        self.mixin._find_element = AsyncMock(return_value=outer_frame)

        found = await self.mixin.find_or_wait_element(
            By.CSS_SELECTOR, 'iframe > iframe > div', timeout=0
        )

        self.mixin._find_element.assert_called_once_with(
            By.CSS_SELECTOR, 'iframe', raise_exc=False
        )
        outer_frame._find_element.assert_called_once_with(
            By.CSS_SELECTOR, 'iframe', raise_exc=False
        )
        inner_frame._find_element.assert_called_once_with(
            By.CSS_SELECTOR, 'div', raise_exc=False
        )
        assert found is target_div

    @pytest.mark.asyncio
    async def test_xpath_iframe_not_at_root(self):
        """XPath '//div/iframe/div': the iframe sits below a div, not at the root."""
        target_div = MagicMock(name='inner_div')
        frame = self._iframe_resolving_to(target_div)
        self.mixin._find_element = AsyncMock(return_value=frame)

        found = await self.mixin.find_or_wait_element(
            By.XPATH, '//div/iframe/div', timeout=0
        )

        # Segment one keeps the prefix that leads to the iframe.
        self.mixin._find_element.assert_called_once_with(
            By.XPATH, '//div/iframe', raise_exc=False
        )
        # Segment two is evaluated inside the iframe.
        frame._find_element.assert_called_once_with(
            By.XPATH, '//div', raise_exc=False
        )
        assert found is target_div

    @pytest.mark.asyncio
    async def test_css_iframe_not_at_root(self):
        """CSS 'div > iframe > div': the iframe sits below a div, not at the root."""
        target_div = MagicMock(name='inner_div')
        frame = self._iframe_resolving_to(target_div)
        self.mixin._find_element = AsyncMock(return_value=frame)

        found = await self.mixin.find_or_wait_element(
            By.CSS_SELECTOR, 'div > iframe > div', timeout=0
        )

        # Segment one keeps the prefix that leads to the iframe.
        self.mixin._find_element.assert_called_once_with(
            By.CSS_SELECTOR, 'div > iframe', raise_exc=False
        )
        # Segment two is evaluated inside the iframe.
        frame._find_element.assert_called_once_with(
            By.CSS_SELECTOR, 'div', raise_exc=False
        )
        assert found is target_div

    @pytest.mark.asyncio
    async def test_find_all_last_segment(self):
        """With find_all=True the last segment goes through ``_find_elements``."""
        items = [MagicMock(), MagicMock()]
        # Only the plural finder is stubbed on this iframe.
        frame = MagicMock()
        frame.is_iframe = True
        frame._find_elements = AsyncMock(return_value=items)
        self.mixin._find_element = AsyncMock(return_value=frame)

        found = await self.mixin.find_or_wait_element(
            By.CSS_SELECTOR, 'iframe > .item', timeout=0, find_all=True
        )

        self.mixin._find_element.assert_called_once_with(
            By.CSS_SELECTOR, 'iframe', raise_exc=False
        )
        frame._find_elements.assert_called_once_with(
            By.CSS_SELECTOR, '.item', raise_exc=False
        )
        assert found == items

    @pytest.mark.asyncio
    async def test_timeout_retry_succeeds(self):
        """The iframe is missing on the first attempt and present on the second."""
        body = MagicMock(name='body')
        frame = self._iframe_resolving_to(body)
        # First page-level lookup yields nothing, the second yields the iframe.
        self.mixin._find_element = AsyncMock(side_effect=[None, frame])

        with patch('asyncio.sleep') as sleep_stub:
            with patch('asyncio.get_event_loop') as loop_stub:
                loop_stub.return_value.time.side_effect = [0, 0.5, 1.0]

                found = await self.mixin.find_or_wait_element(
                    By.CSS_SELECTOR, 'iframe > body', timeout=5
                )

        assert found is body
        sleep_stub.assert_called_once_with(0.5)

    @pytest.mark.asyncio
    async def test_timeout_expires_raises(self):
        """Every attempt fails, so WaitElementTimeout is raised."""
        self.mixin._find_element = AsyncMock(return_value=None)

        with patch('asyncio.sleep'), patch('asyncio.get_event_loop') as loop_stub:
            # The last clock reading (2.1) lies beyond the 2 second timeout.
            loop_stub.return_value.time.side_effect = [0, 0.5, 1.0, 1.5, 2.1]

            with pytest.raises(WaitElementTimeout, match='across iframes'):
                await self.mixin.find_or_wait_element(
                    By.CSS_SELECTOR, 'iframe > body', timeout=2
                )

    @pytest.mark.asyncio
    async def test_no_timeout_raises_element_not_found(self):
        """timeout=0 and no iframe found: ElementNotFound is raised."""
        self.mixin._find_element = AsyncMock(return_value=None)

        with pytest.raises(ElementNotFound, match='across iframes'):
            await self.mixin.find_or_wait_element(
                By.CSS_SELECTOR, 'iframe > body', timeout=0
            )

    @pytest.mark.asyncio
    async def test_raise_exc_false_returns_none(self):
        """raise_exc=False and nothing found: the call returns None."""
        self.mixin._find_element = AsyncMock(return_value=None)

        found = await self.mixin.find_or_wait_element(
            By.CSS_SELECTOR, 'iframe > body', timeout=0, raise_exc=False
        )

        assert found is None

    @pytest.mark.asyncio
    async def test_raise_exc_false_find_all_returns_empty(self):
        """raise_exc=False with find_all=True: the call returns an empty list."""
        self.mixin._find_element = AsyncMock(return_value=None)

        found = await self.mixin.find_or_wait_element(
            By.CSS_SELECTOR, 'iframe > body', timeout=0, find_all=True, raise_exc=False
        )

        assert found == []

    @pytest.mark.asyncio
    async def test_intermediate_not_iframe_returns_none_and_raises(self):
        """An intermediate match with is_iframe=False counts as not found."""
        not_a_frame = MagicMock()
        not_a_frame.is_iframe = False
        self.mixin._find_element = AsyncMock(return_value=not_a_frame)

        with pytest.raises(ElementNotFound):
            await self.mixin.find_or_wait_element(
                By.CSS_SELECTOR, 'iframe > body', timeout=0
            )

    @pytest.mark.asyncio
    async def test_regular_selector_no_iframe_passthrough(self):
        """'div > span' has no iframe step, so the selector is passed on whole."""
        self.mixin._find_element = AsyncMock(return_value=MagicMock())

        await self.mixin.find_or_wait_element(
            By.CSS_SELECTOR, 'div > span', timeout=0
        )

        # The original selector reaches _find_element untouched, raise_exc=True.
        self.mixin._find_element.assert_called_once_with(
            By.CSS_SELECTOR, 'div > span', raise_exc=True
        )


================================================
FILE: tests/test_har_recording_integration.py
================================================
"""Integration tests for HAR recording feature.

These tests open a real browser, serve a test page with JS-initiated
fetch requests via a local HTTP server, and verify the recorded HAR entries.
"""

import asyncio
import json
import socket
import threading
from http.server import HTTPServer, BaseHTTPRequestHandler
from pathlib import Path

import pytest

from pydoll.browser.chromium import Chrome
from pydoll.browser.requests.har_recorder import HarCapture


def _find_free_port():
    """Return a TCP port number on 127.0.0.1 that the OS just handed out."""
    probe = socket.socket(socket.AF_INET, socket.SOCK_STREAM)
    try:
        # Port 0 asks the OS to choose the port for us.
        probe.bind(('127.0.0.1', 0))
        _host, port = probe.getsockname()
        return port
    finally:
        probe.close()


class _TestAPIHandler(BaseHTTPRequestHandler):
    """Serve fixed, canned responses for the HAR integration tests.

    Routes: ``GET /api/users`` (JSON list), ``GET /api/data`` (plain text) and
    ``POST /api/submit`` (echoes the JSON request body). Any other GET or POST
    path is answered with 404. ``OPTIONS`` always answers 200.
    """

    def do_GET(self):
        """Answer the two known GET routes; everything else is a 404."""
        route = self.path
        if route == '/api/users':
            users = [{'id': 1, 'name': 'Alice'}, {'id': 2, 'name': 'Bob'}]
            self._respond(200, 'application/json', json.dumps(users))
            return
        if route == '/api/data':
            self._respond(200, 'text/plain', 'Hello from the test server')
            return
        self._respond(404, 'text/plain', 'Not Found')

    def do_POST(self):
        """Echo the JSON body posted to /api/submit back with status 201."""
        if self.path != '/api/submit':
            self._respond(404, 'text/plain', 'Not Found')
            return

        declared_length = int(self.headers.get('Content-Length', 0))
        raw_body = self.rfile.read(declared_length)
        # An empty body is echoed as null instead of being parsed.
        received = json.loads(raw_body.decode()) if raw_body else None
        payload = {'status': 'created', 'received': received}
        self._respond(201, 'application/json', json.dumps(payload))

    def _respond(self, status, content_type, body):
        """Send ``status``, the content type plus CORS headers, then ``body``."""
        self.send_response(status)
        response_headers = (
            ('Content-Type', content_type),
            ('Access-Control-Allow-Origin', '*'),
            ('Access-Control-Allow-Headers', 'Content-Type'),
        )
        for header_name, header_value in response_headers:
            self.send_header(header_name, header_value)
        self.end_headers()
        self.wfile.write(body.encode())

    def do_OPTIONS(self):
        """Answer an OPTIONS request with 200 and CORS headers, without a body."""
        self.send_response(200)
        preflight_headers = (
            ('Access-Control-Allow-Origin', '*'),
            ('Access-Control-Allow-Methods', 'GET, POST, OPTIONS'),
            ('Access-Control-Allow-Headers', 'Content-Type'),
        )
        for header_name, header_value in preflight_headers:
            self.send_header(header_name, header_value)
        self.end_headers()

    def log_message(self, format, *args):
        """Discard log messages instead of writing them out."""


@pytest.fixture(scope='module')
def api_server():
    """Start a local HTTP server for the test module and yield its base URL.

    The server runs ``_TestAPIHandler`` on 127.0.0.1 in a daemon thread.

    Yields:
        The base URL, in the form ``http://127.0.0.1:<port>``.
    """
    # Bind to port 0 so the OS assigns the port at bind time. Probing for a
    # free port first and binding afterwards leaves a window in which another
    # process can take the port.
    server = HTTPServer(('127.0.0.1', 0), _TestAPIHandler)
    port = server.server_address[1]
    thread = threading.Thread(target=server.serve_forever, daemon=True)
    thread.start()
    try:
        yield f'http://127.0.0.1:{port}'
    finally:
        # Stop serving, release the socket, then wait briefly for the thread.
        server.shutdown()
        server.server_close()
        thread.join(timeout=5)


@pytest.fixture(scope='module')
def test_page_path():
    """Locate ``pages/test_har_recording.html`` next to this test module."""
    tests_dir = Path(__file__).parent
    return tests_dir.joinpath('pages', 'test_har_recording.html')


async def _wait_for_requests_done(tab, timeout=15):
    """Poll the element with id 'status' until its text reads 'done'.

    Sleeps 0.5 seconds before each check and makes ``int(timeout / 0.5)``
    checks in total.

    Returns:
        True as soon as the status text equals 'done', False once every
        check has been used up.
    """
    checks_left = int(timeout / 0.5)
    while checks_left > 0:
        checks_left -= 1
        await asyncio.sleep(0.5)
        status_el = await tab.find(id='status')
        if (await status_el.text) == 'done':
            return True
    return False


class TestHarRecordIntegration:
    """Integration tests for tab.request.record()."""

    @staticmethod
    def _page_url(test_page_path, api_server):
        """Build the file:// URL of the test page with the API base as ?base=."""
        return f'file://{test_page_path.absolute()}?base={api_server}'

    @staticmethod
    async def _record_page_visit(tab, page_url):
        """Record while loading ``page_url`` and return the finished recording."""
        async with tab.request.record() as recording:
            await tab.go_to(page_url)
            assert await _wait_for_requests_done(tab), 'Page requests did not complete'
            await asyncio.sleep(1)
        return recording

    @staticmethod
    def _first_entry(entries, url_part, method=None):
        """Return the first entry whose URL contains ``url_part``, else None.

        When ``method`` is given, the entry's request method must equal it too.
        """
        for entry in entries:
            request = entry['request']
            if url_part not in request['url']:
                continue
            if method is not None and request['method'] != method:
                continue
            return entry
        return None

    @pytest.mark.asyncio
    async def test_record_captures_page_load(self, ci_chrome_options, api_server, test_page_path):
        """Recording captures the document load event."""
        page_url = self._page_url(test_page_path, api_server)

        async with Chrome(options=ci_chrome_options) as browser:
            tab = await browser.start()
            recording = await self._record_page_visit(tab, page_url)

            assert isinstance(recording, HarCapture)
            entries = recording.entries
            assert len(entries) >= 1

            # The document itself is loaded from a file:// URL.
            document_loads = [
                entry for entry in entries if entry['request']['url'].startswith('file://')
            ]
            assert len(document_loads) >= 1
            first_load_response = document_loads[0]['response']
            assert first_load_response['status'] == 200
            assert first_load_response['content']['mimeType'] == 'text/html'

    @pytest.mark.asyncio
    async def test_record_captures_fetch_requests(
        self, ci_chrome_options, api_server, test_page_path
    ):
        """Recording captures JS fetch() requests with correct URLs and methods."""
        page_url = self._page_url(test_page_path, api_server)

        async with Chrome(options=ci_chrome_options) as browser:
            tab = await browser.start()
            recording = await self._record_page_visit(tab, page_url)

            api_urls = [
                entry['request']['url']
                for entry in recording.entries
                if '/api/' in entry['request']['url']
            ]
            # 3 API requests + possible OPTIONS preflight for POST
            assert len(api_urls) >= 3

            for endpoint in ('/api/users', '/api/data', '/api/submit'):
                assert any(endpoint in url for url in api_urls)

    @pytest.mark.asyncio
    async def test_record_captures_response_bodies(
        self, ci_chrome_options, api_server, test_page_path
    ):
        """Recording captures response bodies for each request."""
        page_url = self._page_url(test_page_path, api_server)

        async with Chrome(options=ci_chrome_options) as browser:
            tab = await browser.start()
            recording = await self._record_page_visit(tab, page_url)

            entries = recording.entries
            users_entry = self._first_entry(entries, '/api/users')
            assert users_entry is not None
            users_body = users_entry['response']['content'].get('text', '')
            assert 'Alice' in users_body
            assert 'Bob' in users_body

            data_entry = self._first_entry(entries, '/api/data')
            assert data_entry is not None
            data_body = data_entry['response']['content'].get('text', '')
            assert 'Hello from the test server' in data_body

    @pytest.mark.asyncio
    async def test_record_captures_post_request(
        self, ci_chrome_options, api_server, test_page_path
    ):
        """Recording captures POST requests with body data."""
        page_url = self._page_url(test_page_path, api_server)

        async with Chrome(options=ci_chrome_options) as browser:
            tab = await browser.start()
            recording = await self._record_page_visit(tab, page_url)

            submit_entry = self._first_entry(recording.entries, '/api/submit', method='POST')
            assert submit_entry is not None
            assert submit_entry['response']['status'] == 201

            # The request body that was sent must be part of the entry.
            sent = submit_entry['request'].get('postData')
            assert sent is not None
            assert '"key"' in sent['text']

            # The response body should contain what the server echoed back.
            echoed = submit_entry['response']['content'].get('text', '')
            assert 'created' in echoed

    @pytest.mark.asyncio
    async def test_record_correct_status_codes(
        self, ci_chrome_options, api_server, test_page_path
    ):
        """Recording captures correct HTTP status codes."""
        page_url = self._page_url(test_page_path, api_server)

        async with Chrome(options=ci_chrome_options) as browser:
            tab = await browser.start()
            recording = await self._record_page_visit(tab, page_url)

            entries = recording.entries
            users_entry = self._first_entry(entries, '/api/users')
            assert users_entry is not None
            assert users_entry['response']['status'] == 200

            submit_entry = self._first_entry(entries, '/api/submit', method='POST')
            assert submit_entry is not None
            assert submit_entry['response']['status'] == 201

    @pytest.mark.asyncio
    async def test_record_body_sizes(self, ci_chrome_options, api_server, test_page_path):
        """Recording reports positive body sizes for a response with a body."""
        page_url = self._page_url(test_page_path, api_server)

        async with Chrome(options=ci_chrome_options) as browser:
            tab = await browser.start()
            recording = await self._record_page_visit(tab, page_url)

            users_entry = self._first_entry(recording.entries, '/api/users')
            assert users_entry is not None
            users_response = users_entry['response']
            # bodySize should be > 0 for successful requests with body
            assert users_response['bodySize'] > 0
            # content.size should be positive as well
            assert users_response['content']['size'] > 0


class TestHarSaveIntegration:
    """Integration tests for saving and loading HAR files."""

    @staticmethod
    def _page_url(test_page_path, api_server):
        """Build the file:// URL of the test page with the API base as ?base=."""
        return f'file://{test_page_path.absolute()}?base={api_server}'

    @staticmethod
    async def _record_page_visit(tab, page_url):
        """Record while loading ``page_url`` and return the finished recording."""
        async with tab.request.record() as recording:
            await tab.go_to(page_url)
            assert await _wait_for_requests_done(tab), 'Page requests did not complete'
            await asyncio.sleep(1)
        return recording

    @staticmethod
    def _load_har(har_path):
        """Read ``har_path`` as UTF-8 JSON and return the parsed document."""
        with open(har_path, encoding='utf-8') as har_file:
            return json.load(har_file)

    @pytest.mark.asyncio
    async def test_save_produces_valid_har(
        self, ci_chrome_options, api_server, test_page_path, tmp_path
    ):
        """Saved HAR file is valid JSON with HAR 1.2 structure."""
        page_url = self._page_url(test_page_path, api_server)

        async with Chrome(options=ci_chrome_options) as browser:
            tab = await browser.start()
            recording = await self._record_page_visit(tab, page_url)

            har_path = tmp_path / 'test_output.har'
            recording.save(har_path)

            assert har_path.exists()
            log = self._load_har(har_path)['log']

            assert log['version'] == '1.2'
            assert log['creator']['name'] == 'pydoll'
            assert isinstance(log['pages'], list)
            assert isinstance(log['entries'], list)
            assert len(log['entries']) >= 4

    @pytest.mark.asyncio
    async def test_save_entries_sorted_by_time(
        self, ci_chrome_options, api_server, test_page_path, tmp_path
    ):
        """Saved entries are sorted by startedDateTime."""
        page_url = self._page_url(test_page_path, api_server)

        async with Chrome(options=ci_chrome_options) as browser:
            tab = await browser.start()
            recording = await self._record_page_visit(tab, page_url)

            har_path = tmp_path / 'test_sorted.har'
            recording.save(har_path)
            har = self._load_har(har_path)

            started = [entry['startedDateTime'] for entry in har['log']['entries']]
            assert started == sorted(started)

    @pytest.mark.asyncio
    async def test_save_entries_have_required_fields(
        self, ci_chrome_options, api_server, test_page_path, tmp_path
    ):
        """Every entry has required HAR 1.2 fields."""
        entry_keys = ('startedDateTime', 'time', 'request', 'response', 'cache', 'timings')
        request_keys = (
            'method',
            'url',
            'httpVersion',
            'cookies',
            'headers',
            'queryString',
            'headersSize',
            'bodySize',
        )
        response_keys = (
            'status',
            'statusText',
            'httpVersion',
            'cookies',
            'headers',
            'content',
            'redirectURL',
            'headersSize',
            'bodySize',
        )
        timing_keys = ('blocked', 'dns', 'connect', 'ssl', 'send', 'wait', 'receive')

        page_url = self._page_url(test_page_path, api_server)

        async with Chrome(options=ci_chrome_options) as browser:
            tab = await browser.start()
            recording = await self._record_page_visit(tab, page_url)

            har_path = tmp_path / 'test_fields.har'
            recording.save(har_path)
            har = self._load_har(har_path)

            for entry in har['log']['entries']:
                # Required entry fields
                for key in entry_keys:
                    assert key in entry

                # Required request fields
                request = entry['request']
                for key in request_keys:
                    assert key in request

                # Required response fields
                response = entry['response']
                for key in response_keys:
                    assert key in response

                # Required timings fields
                timings = entry['timings']
                for key in timing_keys:
                    assert key in timings


================================================
FILE: tests/test_iframe_integration.py
================================================
"""Integration tests for iframe functionality in WebElement.

These tests use real HTML files and Chrome browser to test iframe interactions,
element finding, and DOM manipulation within iframes.
"""

import asyncio
from pathlib import Path

import pytest

from pydoll.browser.chromium import Chrome
from pydoll.elements.web_element import WebElement
from pydoll.exceptions import ElementNotFound, InvalidIFrame


class TestSimpleIframeIntegration:
    """Integration tests for simple iframe operations."""

    @staticmethod
    def _simple_page_url():
        """Return the file:// URL of pages/test_iframe_simple.html."""
        page = Path(__file__).parent.joinpath('pages', 'test_iframe_simple.html')
        return f'file://{page.absolute()}'

    @staticmethod
    async def _load_simple_iframe(browser, file_url):
        """Open ``file_url`` and return the element with id 'simple-iframe'."""
        tab = await browser.start()
        await tab.go_to(file_url)
        # Give the iframe a second to load before looking it up.
        await asyncio.sleep(1)
        return await tab.find(id='simple-iframe')

    @pytest.mark.asyncio
    async def test_find_element_in_iframe_by_id(self, ci_chrome_options):
        """Test finding an element inside an iframe by id."""
        file_url = self._simple_page_url()

        async with Chrome(options=ci_chrome_options) as browser:
            frame = await self._load_simple_iframe(browser, file_url)
            assert frame is not None
            assert frame.is_iframe

            # The iframe exposes a context with a frame and an execution context id.
            context = await frame.iframe_context
            assert context is not None
            assert context.frame_id is not None
            assert context.execution_context_id is not None

            # Look up an element that lives inside the iframe.
            heading = await frame.find(id='iframe-heading')
            assert heading is not None
            assert isinstance(heading, WebElement)

            heading_text = await heading.text
            assert 'Iframe Content' in heading_text

    @pytest.mark.asyncio
    async def test_find_multiple_elements_in_iframe(self, ci_chrome_options):
        """Test finding multiple elements inside an iframe."""
        file_url = self._simple_page_url()

        async with Chrome(options=ci_chrome_options) as browser:
            frame = await self._load_simple_iframe(browser, file_url)

            # All links inside the iframe share the 'iframe-link' class.
            links = await frame.query('.iframe-link', find_all=True)
            assert len(links) == 3

            # Their ids are numbered from 1 in the order they are returned.
            for position, link in enumerate(links, start=1):
                assert link.get_attribute('id') == f'iframe-link{position}'

    @pytest.mark.asyncio
    async def test_find_element_in_iframe_by_css_selector(self, ci_chrome_options):
        """Test finding elements in iframe using CSS selectors."""
        file_url = self._simple_page_url()

        async with Chrome(options=ci_chrome_options) as browser:
            frame = await self._load_simple_iframe(browser, file_url)

            # Class selector
            buttons = await frame.query('.action-btn', find_all=True)
            assert len(buttons) >= 2  # At least 2 visible buttons

            # Tag plus attribute selector
            text_inputs = await frame.query('input[type="text"]', find_all=True)
            assert len(text_inputs) >= 1

    @pytest.mark.asyncio
    async def test_find_element_in_iframe_by_xpath(self, ci_chrome_options):
        """Test finding elements in iframe using XPath."""
        file_url = self._simple_page_url()

        async with Chrome(options=ci_chrome_options) as browser:
            frame = await self._load_simple_iframe(browser, file_url)

            paragraph = await frame.find(xpath='//p[@id="iframe-paragraph"]')
            assert paragraph is not None

            paragraph_text = await paragraph.text
            assert 'content inside the iframe' in paragraph_text

    @pytest.mark.asyncio
    async def test_insert_text_in_iframe_input(self, ci_chrome_options):
        """Test inserting text into an input field inside an iframe."""
        file_url = self._simple_page_url()

        async with Chrome(options=ci_chrome_options) as browser:
            frame = await self._load_simple_iframe(browser, file_url)

            name_input = await frame.find(id='iframe-input')
            assert name_input is not None

            typed = 'Test User Name'
            await name_input.insert_text(typed)

            # The inserted text must show up in the input's value.
            assert typed in name_input.get_attribute('value')

    @pytest.mark.asyncio
    async def test_insert_text_in_iframe_textarea(self, ci_chrome_options):
        """Test inserting text into a textarea inside an iframe."""
        file_url = self._simple_page_url()

        async with Chrome(options=ci_chrome_options) as browser:
            frame = await self._load_simple_iframe(browser, file_url)

            textarea = await frame.find(id='iframe-textarea')
            assert textarea is not None

            # Insert new text (textarea initially empty)
            typed = 'This is a new test message'
            await textarea.insert_text(typed)

            # The inserted text must show up in the textarea's value.
            assert typed in textarea.get_attribute('value')

    @pytest.mark.asyncio
    async def test_click_button_in_iframe(self, ci_chrome_options):
        """Test clicking a button inside an iframe."""
        file_url = self._simple_page_url()

        async with Chrome(options=ci_chrome_options) as browser:
            frame = await self._load_simple_iframe(browser, file_url)

            button = await frame.find(id='iframe-button1')
            assert button is not None

            # The click only has to complete without raising.
            await button.click()
            await asyncio.sleep(0.5)

    @pytest.mark.asyncio
    async def test_get_inner_html_of_iframe(self, ci_chrome_options):
        """Test getting inner HTML of an iframe element."""
        file_url = self._simple_page_url()

        async with Chrome(options=ci_chrome_options) as browser:
            frame = await self._load_simple_iframe(browser, file_url)

            markup = await frame.inner_html
            assert markup is not None
            assert len(markup) > 0
            for fragment in ('iframe-heading', 'Iframe Content'):
                assert fragment in markup

    @pytest.mark.asyncio
    async def test_get_inner_html_of_element_in_iframe(self, ci_chrome_options):
        """Test getting inner HTML of an element inside an iframe."""
        file_url = self._simple_page_url()

        async with Chrome(options=ci_chrome_options) as browser:
            frame = await self._load_simple_iframe(browser, file_url)

            container = await frame.find(id='iframe-container')
            assert container is not None

            markup = await container.inner_html
            assert markup is not None
            for fragment in ('iframe-paragraph', 'iframe-form'):
                assert fragment in markup

    @pytest.mark.asyncio
    async def test_get_children_elements_in_iframe(self, ci_chrome_options):
        """Test getting children elements of an element inside an iframe."""
        file_url = self._simple_page_url()

        async with Chrome(options=ci_chrome_options) as browser:
            frame = await self._load_simple_iframe(browser, file_url)

            item_list = await frame.find(id='iframe-list')
            assert item_list is not None

            # Filter by tag so the test does not rely on class attributes.
            items = await item_list.get_children_elements(max_depth=2, tag_filter=['li'])
            assert len(items) == 3

    @pytest.mark.asyncio
    async def test_element_visibility_in_iframe(self, ci_chrome_options):
        """Test checking element visibility inside an iframe."""
        file_url = self._simple_page_url()

        async with Chrome(options=ci_chrome_options) as browser:
            frame = await self._load_simple_iframe(browser, file_url)

            # 'iframe-button1' is expected to be visible ...
            shown_button = await frame.find(id='iframe-button1')
            assert (await shown_button.is_visible()) is True

            # ... while 'iframe-button3' is expected to be hidden.
            hidden_button = await frame.find(id='iframe-button3')
            assert (await hidden_button.is_visible()) is False


class TestNestedIframeIntegration:
    """Integration tests for an iframe that is embedded inside another iframe."""

    @staticmethod
    def _page_url():
        """Return the file:// URL of the nested-iframe page in the local 'pages' directory."""
        page_path = Path(__file__).parent / 'pages' / 'test_iframe_nested.html'
        return f'file://{page_path.absolute()}'

    @pytest.mark.asyncio
    async def test_find_element_in_parent_iframe(self, ci_chrome_options):
        """A heading inside the outer iframe can be found and its text read."""
        page_url = self._page_url()

        async with Chrome(options=ci_chrome_options) as browser:
            tab = await browser.start()
            await tab.go_to(page_url)
            await asyncio.sleep(1.5)

            outer_frame = await tab.find(id='parent-iframe')
            assert outer_frame is not None
            assert outer_frame.is_iframe

            # The lookup goes through the outer iframe element, not the tab.
            outer_heading = await outer_frame.find(id='parent-iframe-heading')
            assert outer_heading is not None

            heading_text = await outer_heading.text
            assert 'Parent Iframe Content' in heading_text

    @pytest.mark.asyncio
    async def test_find_nested_iframe_element(self, ci_chrome_options):
        """The inner iframe element is reachable through the outer iframe."""
        page_url = self._page_url()

        async with Chrome(options=ci_chrome_options) as browser:
            tab = await browser.start()
            await tab.go_to(page_url)
            await asyncio.sleep(1.5)

            outer_frame = await tab.find(id='parent-iframe')

            # The inner frame is searched for from the outer frame element.
            inner_frame = await outer_frame.find(id='nested-iframe')
            assert inner_frame is not None
            assert inner_frame.is_iframe

    @pytest.mark.asyncio
    async def test_find_element_in_nested_iframe(self, ci_chrome_options):
        """An element two iframe levels deep can be found and its text read."""
        page_url = self._page_url()

        async with Chrome(options=ci_chrome_options) as browser:
            tab = await browser.start()
            await tab.go_to(page_url)
            await asyncio.sleep(2)

            # Walk down: tab -> outer frame -> inner frame.
            outer_frame = await tab.find(id='parent-iframe')
            inner_frame = await outer_frame.find(id='nested-iframe')
            assert inner_frame is not None

            inner_heading = await inner_frame.find(id='nested-iframe-heading')
            assert inner_heading is not None

            heading_text = await inner_heading.text
            assert 'Nested Iframe Content' in heading_text

    @pytest.mark.asyncio
    async def test_insert_text_in_nested_iframe(self, ci_chrome_options):
        """Text inserted into an input of the inner iframe shows up in its value."""
        page_url = self._page_url()

        async with Chrome(options=ci_chrome_options) as browser:
            tab = await browser.start()
            await tab.go_to(page_url)
            await asyncio.sleep(2)

            outer_frame = await tab.find(id='parent-iframe')
            inner_frame = await outer_frame.find(id='nested-iframe')

            text_field = await inner_frame.find(id='nested-input')
            assert text_field is not None

            typed = 'Nested Input Test'
            await text_field.insert_text(typed)

            # Check the 'value' attribute exposed by the element.
            current_value = text_field.get_attribute('value')
            assert typed in current_value

    @pytest.mark.asyncio
    async def test_find_multiple_elements_in_nested_iframe(self, ci_chrome_options):
        """query(..., find_all=True) returns both anchors of the inner iframe."""
        page_url = self._page_url()

        async with Chrome(options=ci_chrome_options) as browser:
            tab = await browser.start()
            await tab.go_to(page_url)
            await asyncio.sleep(2)

            outer_frame = await tab.find(id='parent-iframe')
            inner_frame = await outer_frame.find(id='nested-iframe')

            anchors = await inner_frame.query('a', find_all=True)
            assert len(anchors) == 2

            # Both expected ids must be among the anchors that were returned.
            anchor_ids = [anchor.get_attribute('id') for anchor in anchors]
            for expected_id in ('nested-link1', 'nested-link2'):
                assert expected_id in anchor_ids

    @pytest.mark.asyncio
    async def test_submit_form_in_nested_iframe(self, ci_chrome_options):
        """Form fields in the inner iframe can be filled and the submit button clicked."""
        page_url = self._page_url()

        async with Chrome(options=ci_chrome_options) as browser:
            tab = await browser.start()
            await tab.go_to(page_url)
            await asyncio.sleep(2)

            outer_frame = await tab.find(id='parent-iframe')
            inner_frame = await outer_frame.find(id='nested-iframe')

            # Fill the two fields in the same order a user would.
            user_field = await inner_frame.find(id='nested-form-input')
            await user_field.insert_text('testuser')

            secret_field = await inner_frame.find(id='nested-form-password')
            await secret_field.insert_text('password123')

            assert 'testuser' in user_field.get_attribute('value')
            assert 'password123' in secret_field.get_attribute('value')

            # The click itself is the last step; nothing is asserted afterwards.
            submit = await inner_frame.find(id='nested-form-submit')
            await submit.click()
            await asyncio.sleep(0.5)


class TestIframeElementInteraction:
    """Integration tests exercising assorted element operations inside an iframe."""

    @staticmethod
    def _page_url():
        """Return the file:// URL of the simple-iframe page in the local 'pages' directory."""
        page_path = Path(__file__).parent / 'pages' / 'test_iframe_simple.html'
        return f'file://{page_path.absolute()}'

    @pytest.mark.asyncio
    async def test_select_option_in_iframe(self, ci_chrome_options):
        """Clicking <option> elements changes the value of a <select> inside the iframe."""
        page_url = self._page_url()

        async with Chrome(options=ci_chrome_options) as browser:
            tab = await browser.start()
            await tab.go_to(page_url)
            await asyncio.sleep(1)

            frame = await tab.find(id='simple-iframe')

            dropdown = await frame.find(id='iframe-select')
            assert dropdown is not None

            # Each entry: (xpath of the option to click, value expected afterwards).
            selections = (
                ('.//option[@value="option2"]', 'option2'),
                ('.//option[@value="option3"]', 'option3'),
            )
            for option_xpath, expected_value in selections:
                option = await dropdown.find(xpath=option_xpath)
                await option.click()
                await asyncio.sleep(0.2)
                # Read the live property through a script run on the element.
                response = await dropdown.execute_script(
                    'return this.value', return_by_value=True
                )
                selected_value = response['result']['result']['value']
                assert selected_value == expected_value

    @pytest.mark.asyncio
    async def test_get_attributes_from_iframe_elements(self, ci_chrome_options):
        """Attributes of a link and an input inside the iframe are readable."""
        page_url = self._page_url()

        async with Chrome(options=ci_chrome_options) as browser:
            tab = await browser.start()
            await tab.go_to(page_url)
            await asyncio.sleep(1)

            frame = await tab.find(id='simple-iframe')

            # Anchor: href and class.
            anchor = await frame.find(id='iframe-link1')
            target = anchor.get_attribute('href')
            assert target is not None
            assert '#link1' in target

            css_classes = anchor.get_attribute('class')
            assert 'iframe-link' in css_classes

            # Input: type and placeholder.
            text_field = await frame.find(id='iframe-input')
            field_type = text_field.get_attribute('type')
            assert field_type == 'text'

            hint = text_field.get_attribute('placeholder')
            assert 'name' in hint.lower()

    @pytest.mark.asyncio
    async def test_deep_nested_element_search_in_iframe(self, ci_chrome_options):
        """The 'deep-span' element can be found by id from the iframe element."""
        page_url = self._page_url()

        async with Chrome(options=ci_chrome_options) as browser:
            tab = await browser.start()
            await tab.go_to(page_url)
            await asyncio.sleep(1)

            frame = await tab.find(id='simple-iframe')

            span = await frame.find(id='deep-span')
            assert span is not None

            span_text = await span.text
            assert 'Deep nested element' in span_text

    @pytest.mark.asyncio
    async def test_wait_for_element_in_iframe(self, ci_chrome_options):
        """find() with a timeout returns an element that is already present in the iframe."""
        page_url = self._page_url()

        async with Chrome(options=ci_chrome_options) as browser:
            tab = await browser.start()
            await tab.go_to(page_url)
            await asyncio.sleep(1)

            frame = await tab.find(id='simple-iframe')

            # The paragraph should already exist, so the call is expected to succeed.
            paragraph = await frame.find(id='iframe-paragraph', timeout=5)
            assert paragraph is not None

            paragraph_text = await paragraph.text
            assert 'content inside the iframe' in paragraph_text

    @pytest.mark.asyncio
    async def test_element_not_found_in_iframe(self, ci_chrome_options):
        """Searching the iframe for an unknown id raises ElementNotFound."""
        page_url = self._page_url()

        async with Chrome(options=ci_chrome_options) as browser:
            tab = await browser.start()
            await tab.go_to(page_url)
            await asyncio.sleep(1)

            frame = await tab.find(id='simple-iframe')

            with pytest.raises(ElementNotFound):
                await frame.find(id='non-existent-element')

    @pytest.mark.asyncio
    async def test_clear_input_in_iframe(self, ci_chrome_options):
        """After inserting text and then an empty string, the value is '' or None."""
        page_url = self._page_url()

        async with Chrome(options=ci_chrome_options) as browser:
            tab = await browser.start()
            await tab.go_to(page_url)
            await asyncio.sleep(1)

            frame = await tab.find(id='simple-iframe')

            text_field = await frame.find(id='iframe-input')
            # Two insertions in sequence: some text first, then an empty string.
            for payload in ('Test text to clear', ''):
                await text_field.insert_text(payload)
                await asyncio.sleep(0.3)

            remaining = text_field.get_attribute('value')
            assert remaining in ('', None)

    @pytest.mark.asyncio
    async def test_multiple_iframes_on_same_page(self, ci_chrome_options):
        """Main-document content and iframe content are resolved independently."""
        # Uses the simple iframe page: one heading in the main document and
        # one heading looked up through the iframe element.
        page_url = self._page_url()

        async with Chrome(options=ci_chrome_options) as browser:
            tab = await browser.start()
            await tab.go_to(page_url)
            await asyncio.sleep(1)

            # Heading looked up directly on the tab (outside the iframe).
            page_heading = await tab.find(id='main-heading')
            assert page_heading is not None
            page_heading_text = await page_heading.text
            assert 'Main Page' in page_heading_text

            # Heading looked up through the iframe element.
            frame = await tab.find(id='simple-iframe')
            frame_heading = await frame.find(id='iframe-heading')
            frame_heading_text = await frame_heading.text
            assert 'Iframe Content' in frame_heading_text

            # The two lookups must not have produced the same text.
            assert page_heading_text != frame_heading_text

    @pytest.mark.asyncio
    async def test_iframe_context_persistence(self, ci_chrome_options):
        """iframe_context yields the same frame and execution context ids across operations."""
        page_url = self._page_url()

        async with Chrome(options=ci_chrome_options) as browser:
            tab = await browser.start()
            await tab.go_to(page_url)
            await asyncio.sleep(1)

            frame = await tab.find(id='simple-iframe')

            first_context = await frame.iframe_context
            assert first_context is not None

            # Do some unrelated work inside the frame between the two reads.
            heading = await frame.find(id='iframe-heading')
            await heading.text

            second_context = await frame.iframe_context
            assert second_context is not None

            assert first_context.frame_id == second_context.frame_id
            assert (
                first_context.execution_context_id
                == second_context.execution_context_id
            )

    @pytest.mark.asyncio
    async def test_get_text_from_multiple_elements_in_iframe(self, ci_chrome_options):
        """Text of every '.list-item' element inside the iframe can be read in order."""
        page_url = self._page_url()

        async with Chrome(options=ci_chrome_options) as browser:
            tab = await browser.start()
            await tab.go_to(page_url)
            await asyncio.sleep(1)

            frame = await tab.find(id='simple-iframe')

            entries = await frame.query('.list-item', find_all=True)
            assert len(entries) == 3

            # Texts are awaited one after another, in result order.
            entry_texts = [await entry.text for entry in entries]

            for position, expected in enumerate(('Item 1', 'Item 2', 'Item 3')):
                assert expected in entry_texts[position]


class TestMultipleIframesSelection:
    """Integration tests for picking the right iframe on a page that has several."""

    @staticmethod
    def _page_url():
        """Return the file:// URL of the multiple-iframes page in the local 'pages' directory."""
        page_path = Path(__file__).parent / 'pages' / 'test_multiple_iframes.html'
        return f'file://{page_path.absolute()}'

    @pytest.mark.asyncio
    async def test_find_specific_iframe_by_id_among_multiple(self, ci_chrome_options):
        """One iframe can be selected by id while three are present on the page."""
        page_url = self._page_url()

        async with Chrome(options=ci_chrome_options) as browser:
            tab = await browser.start()
            await tab.go_to(page_url)
            await asyncio.sleep(1)

            every_frame = await tab.find(tag_name='iframe', find_all=True)
            assert len(every_frame) == 3, "Should have 3 iframes on the page"

            login_frame = await tab.find(id='login-iframe')
            assert login_frame is not None
            assert login_frame.is_iframe
            assert login_frame.get_attribute('id') == 'login-iframe'

            # A resolved context with a frame id shows the frame is usable.
            login_context = await login_frame.iframe_context
            assert login_context is not None
            assert login_context.frame_id is not None

    @pytest.mark.asyncio
    async def test_find_elements_in_correct_iframe_among_multiple(self, ci_chrome_options):
        """Lookups through the login iframe return that iframe's elements."""
        page_url = self._page_url()

        async with Chrome(options=ci_chrome_options) as browser:
            tab = await browser.start()
            await tab.go_to(page_url)
            await asyncio.sleep(1)

            login_frame = await tab.find(id='login-iframe')

            title = await login_frame.find(id='iframe-heading', timeout=5)
            assert title is not None

            title_text = await title.text
            assert 'Iframe Content' in title_text

            # find_all through the same frame should yield at least two buttons.
            action_buttons = await login_frame.find(
                class_name='action-btn', find_all=True
            )
            assert len(action_buttons) >= 2

    @pytest.mark.asyncio
    async def test_different_iframes_have_different_contexts(self, ci_chrome_options):
        """Two iframes resolve to different frame ids and different element objects."""
        page_url = self._page_url()

        async with Chrome(options=ci_chrome_options) as browser:
            tab = await browser.start()
            await tab.go_to(page_url)
            await asyncio.sleep(1)

            cookie_frame = await tab.find(id='cookie-iframe')
            login_frame = await tab.find(id='login-iframe')

            assert cookie_frame.is_iframe
            assert login_frame.is_iframe

            cookie_context = await cookie_frame.iframe_context
            login_context = await login_frame.iframe_context

            # Separate iframes must not share a frame id.
            assert cookie_context.frame_id != login_context.frame_id

            # The same id is looked up once through each frame.
            heading_in_cookie = await cookie_frame.find(id='iframe-heading')
            heading_in_login = await login_frame.find(id='iframe-heading')

            assert heading_in_cookie is not None
            assert heading_in_login is not None

            # Distinct object ids mean the two results are not the same node.
            assert heading_in_cookie._object_id != heading_in_login._object_id

    @pytest.mark.asyncio
    async def test_iframe_selection_by_data_attribute(self, ci_chrome_options):
        """An iframe can be selected with an XPath on its data-purpose attribute."""
        page_url = self._page_url()

        async with Chrome(options=ci_chrome_options) as browser:
            tab = await browser.start()
            await tab.go_to(page_url)
            await asyncio.sleep(1)

            login_frame = await tab.find(xpath='//iframe[@data-purpose="login"]')
            assert login_frame is not None
            assert login_frame.get_attribute('id') == 'login-iframe'

            # Finding the form through the frame shows the frame is usable.
            login_form = await login_frame.find(id='iframe-form')
            assert login_form is not None

    @pytest.mark.asyncio
    async def test_iterate_over_multiple_iframes(self, ci_chrome_options):
        """Every iframe on the page resolves a context; headings are checked when present."""
        page_url = self._page_url()

        async with Chrome(options=ci_chrome_options) as browser:
            tab = await browser.start()
            await tab.go_to(page_url)
            await asyncio.sleep(1)

            every_frame = await tab.find(tag_name='iframe', find_all=True)
            assert len(every_frame) == 3

            for frame in every_frame:
                assert frame.is_iframe

                frame_context = await frame.iframe_context
                assert frame_context is not None
                assert frame_context.frame_id is not None

                # raise_exc=False: a missing heading is tolerated and skipped.
                title = await frame.find(id='iframe-heading', raise_exc=False)
                if not title:
                    continue
                title_text = await title.text
                assert len(title_text) > 0

    @pytest.mark.asyncio
    async def test_find_in_iframe_after_finding_in_another(self, ci_chrome_options):
        """Searching one iframe still works after another iframe was searched."""
        page_url = self._page_url()

        async with Chrome(options=ci_chrome_options) as browser:
            tab = await browser.start()
            await tab.go_to(page_url)
            await asyncio.sleep(1)

            # Cookie iframe first ...
            cookie_frame = await tab.find(id='cookie-iframe')
            cookie_title = await cookie_frame.find(id='iframe-heading')
            cookie_title_text = await cookie_title.text

            # ... then the login iframe.
            login_frame = await tab.find(id='login-iframe')
            login_title = await login_frame.find(id='iframe-heading')
            login_title_text = await login_title.text

            assert 'Iframe Content' in cookie_title_text
            assert 'Iframe Content' in login_title_text

            # Finally the analytics iframe, after both earlier lookups.
            analytics_frame = await tab.find(id='analytics-iframe')
            analytics_title = await analytics_frame.find(id='iframe-heading')
            analytics_title_text = await analytics_title.text

            assert 'Iframe Content' in analytics_title_text


class TestIframeEdgeCases:
    """Integration tests for less common iframe situations."""

    @staticmethod
    def _page_url():
        """Return the file:// URL of the simple-iframe page in the local 'pages' directory."""
        page_path = Path(__file__).parent / 'pages' / 'test_iframe_simple.html'
        return f'file://{page_path.absolute()}'

    @pytest.mark.asyncio
    async def test_dynamic_content_in_iframe(self, ci_chrome_options):
        """An element appended by script in the iframe's context can be found afterwards."""
        page_url = self._page_url()

        async with Chrome(options=ci_chrome_options) as browser:
            tab = await browser.start()
            await tab.go_to(page_url)
            await asyncio.sleep(1)

            frame = await tab.find(id='simple-iframe')

            # The script is run with the iframe's execution context id.
            frame_context = await frame.iframe_context
            append_div_script = """
                const div = document.createElement('div');
                div.id = 'dynamic-element';
                div.textContent = 'Dynamic Content';
                document.body.appendChild(div);
                """
            await tab.execute_script(
                append_div_script,
                context_id=frame_context.execution_context_id,
            )
            await asyncio.sleep(0.5)

            # The new node is looked up through the iframe element.
            injected = await frame.find(id='dynamic-element')
            assert injected is not None

            injected_text = await injected.text
            assert 'Dynamic Content' in injected_text

    @pytest.mark.asyncio
    async def test_iframe_reload_handling(self, ci_chrome_options):
        """After a page refresh, a freshly found iframe still gives access to its content."""
        page_url = self._page_url()

        async with Chrome(options=ci_chrome_options) as browser:
            tab = await browser.start()
            await tab.go_to(page_url)
            await asyncio.sleep(1)

            # Lookup before the reload.
            frame_before = await tab.find(id='simple-iframe')
            heading_before = await frame_before.find(id='iframe-heading')
            assert heading_before is not None

            await tab.refresh()
            await asyncio.sleep(1)

            # The iframe element is looked up again instead of being reused.
            frame_after = await tab.find(id='simple-iframe')
            heading_after = await frame_after.find(id='iframe-heading')
            assert heading_after is not None

            heading_text = await heading_after.text
            assert 'Iframe Content' in heading_text


class TestIframeTypeText:
    """Integration tests for calling type_text on inputs inside an iframe."""

    @staticmethod
    def _page_url():
        """Return the file:// URL of the simple-iframe page in the local 'pages' directory."""
        page_path = Path(__file__).parent / 'pages' / 'test_iframe_simple.html'
        return f'file://{page_path.absolute()}'

    @staticmethod
    async def _input_value(element):
        """Read the element's live `value` property via a script run on the element."""
        response = await element.execute_script(
            'return this.value', return_by_value=True
        )
        return response['result']['result']['value']

    @pytest.mark.asyncio
    async def test_type_text_in_iframe_input(self, ci_chrome_options):
        """Plain type_text fills an input that lives inside an iframe."""
        page_url = self._page_url()

        async with Chrome(options=ci_chrome_options) as browser:
            tab = await browser.start()
            await tab.go_to(page_url)
            await asyncio.sleep(1)

            frame = await tab.find(id='simple-iframe')
            text_field = await frame.find(id='iframe-input')

            await text_field.type_text('hello')
            await asyncio.sleep(0.3)

            assert await self._input_value(text_field) == 'hello'

    @pytest.mark.asyncio
    async def test_type_text_humanized_in_iframe_input(self, ci_chrome_options):
        """type_text(humanize=True) leaves text in an input inside an iframe."""
        page_url = self._page_url()

        async with Chrome(options=ci_chrome_options) as browser:
            tab = await browser.start()
            await tab.go_to(page_url)
            await asyncio.sleep(1)

            frame = await tab.find(id='simple-iframe')
            text_field = await frame.find(id='iframe-input')

            await text_field.type_text('Test', humanize=True)
            await asyncio.sleep(0.3)

            typed_value = await self._input_value(text_field)
            # Humanized typing may add and then correct typos, so only a
            # minimum length is required rather than an exact match.
            assert len(typed_value) >= 2

    @pytest.mark.asyncio
    async def test_type_text_email_in_iframe_input(self, ci_chrome_options):
        """type_text copes with symbols such as '@' and '.' inside an iframe."""
        page_url = self._page_url()

        async with Chrome(options=ci_chrome_options) as browser:
            tab = await browser.start()
            await tab.go_to(page_url)
            await asyncio.sleep(1)

            frame = await tab.find(id='simple-iframe')
            email_field = await frame.find(id='iframe-email')

            address = 'user@test.com'
            await email_field.type_text(address)
            await asyncio.sleep(0.3)

            assert await self._input_value(email_field) == address


class TestFrameElementIntegration:
    """Integration tests for <frame> elements on a frameset page."""

    @staticmethod
    def _page_url():
        """Return the file:// URL of the frameset page in the local 'pages' directory."""
        page_path = Path(__file__).parent / 'pages' / 'test_frameset.html'
        return f'file://{page_path.absolute()}'

    @pytest.mark.asyncio
    async def test_frame_element_is_iframe(self, ci_chrome_options):
        """A <frame> element reports tag 'frame' and is flagged by is_iframe."""
        page_url = self._page_url()

        async with Chrome(options=ci_chrome_options) as browser:
            tab = await browser.start()
            await tab.go_to(page_url)
            await asyncio.sleep(1)

            left = await tab.find(id='left-frame', timeout=5)
            assert left is not None
            assert left.tag_name == 'frame'
            assert left.is_iframe

    @pytest.mark.asyncio
    async def test_find_element_inside_frame(self, ci_chrome_options):
        """An element inside a <frame> can be found and its text read."""
        page_url = self._page_url()

        async with Chrome(options=ci_chrome_options) as browser:
            tab = await browser.start()
            await tab.go_to(page_url)
            await asyncio.sleep(1)

            left = await tab.find(id='left-frame', timeout=5)
            title = await left.find(id='frame-heading', timeout=5)
            assert title is not None

            title_text = await title.text
            assert 'Frame Content' in title_text

    @pytest.mark.asyncio
    async def test_frame_context_is_resolved(self, ci_chrome_options):
        """iframe_context of a <frame> carries a frame id and an execution context id."""
        page_url = self._page_url()

        async with Chrome(options=ci_chrome_options) as browser:
            tab = await browser.start()
            await tab.go_to(page_url)
            await asyncio.sleep(1)

            left = await tab.find(id='left-frame', timeout=5)
            frame_context = await left.iframe_context
            assert frame_context is not None
            assert frame_context.frame_id is not None
            assert frame_context.execution_context_id is not None

    @pytest.mark.asyncio
    async def test_inner_html_of_frame(self, ci_chrome_options):
        """inner_html of a <frame> contains markup from the framed document."""
        page_url = self._page_url()

        async with Chrome(options=ci_chrome_options) as browser:
            tab = await browser.start()
            await tab.go_to(page_url)
            await asyncio.sleep(1)

            left = await tab.find(id='left-frame', timeout=5)
            markup = await left.inner_html
            assert 'frame-heading' in markup

    @pytest.mark.asyncio
    async def test_multiple_frames_in_frameset(self, ci_chrome_options):
        """Both frames of the frameset can be searched independently."""
        page_url = self._page_url()

        async with Chrome(options=ci_chrome_options) as browser:
            tab = await browser.start()
            await tab.go_to(page_url)
            await asyncio.sleep(1)

            left = await tab.find(id='left-frame', timeout=5)
            right = await tab.find(id='right-frame', timeout=5)

            assert left.is_iframe
            assert right.is_iframe

            # The left frame is expected to hold the frame-specific heading.
            left_title = await left.find(id='frame-heading', timeout=5)
            left_title_text = await left_title.text
            assert 'Frame Content' in left_title_text

            # The right frame is expected to hold the iframe-style heading.
            right_title = await right.find(id='iframe-heading', timeout=5)
            right_title_text = await right_title.text
            assert 'Iframe Content' in right_title_text

    @pytest.mark.asyncio
    async def test_type_text_in_frame_input(self, ci_chrome_options):
        """type_text fills an input that lives inside a <frame>."""
        page_url = self._page_url()

        async with Chrome(options=ci_chrome_options) as browser:
            tab = await browser.start()
            await tab.go_to(page_url)
            await asyncio.sleep(1)

            left = await tab.find(id='left-frame', timeout=5)
            text_field = await left.find(id='frame-input', timeout=5)

            typed = 'hello frame'
            await text_field.type_text(typed)
            await asyncio.sleep(0.3)

            # Read the live property through a script run on the element.
            response = await text_field.execute_script(
                'return this.value', return_by_value=True
            )
            assert response['result']['result']['value'] == typed


================================================
FILE: tests/test_interactions/__init__.py
================================================


================================================
FILE: tests/test_interactions/test_iframe.py
================================================
"""Unit tests for IFrameContextResolver and IFrameContext."""

import pytest
import pytest_asyncio
from unittest.mock import AsyncMock, MagicMock, patch

from pydoll.interactions.iframe import IFrameContext, IFrameContextResolver
from pydoll.exceptions import InvalidIFrame


@pytest_asyncio.fixture
async def mock_element():
    """Provide a ``MagicMock`` standing in for a WebElement.

    The mock carries an object id, a connection handler whose
    ``execute_command`` is an ``AsyncMock`` (port attribute set to 9222), and
    an awaitable ``_describe_node``.
    """
    connection_handler = MagicMock()
    connection_handler.execute_command = AsyncMock()
    connection_handler._connection_port = 9222

    fake_element = MagicMock()
    fake_element._object_id = 'mock-object-id'
    fake_element._connection_handler = connection_handler
    fake_element._describe_node = AsyncMock()
    return fake_element


@pytest_asyncio.fixture
async def resolver(mock_element):
    """Provide an ``IFrameContextResolver`` built around ``mock_element``."""
    context_resolver = IFrameContextResolver(mock_element)
    return context_resolver


class TestIFrameContext:
    """Field-level tests for the ``IFrameContext`` dataclass."""

    def test_default_values(self):
        """Supplying only ``frame_id`` leaves every other field as ``None``."""
        ctx = IFrameContext(frame_id='test-frame-id')

        assert ctx.frame_id == 'test-frame-id'
        for optional_field in (
            'document_url',
            'execution_context_id',
            'document_object_id',
            'session_handler',
            'session_id',
        ):
            assert getattr(ctx, optional_field) is None

    def test_all_values(self):
        """Every field passed to the constructor is readable back unchanged."""
        handler = MagicMock()

        ctx = IFrameContext(
            frame_id='frame-123',
            document_url='https://example.com',
            execution_context_id=42,
            document_object_id='doc-obj-456',
            session_handler=handler,
            session_id='session-789',
        )

        # The handler must be the very same object, not merely an equal one.
        assert ctx.session_handler is handler
        assert ctx.frame_id == 'frame-123'
        assert ctx.document_url == 'https://example.com'
        assert ctx.execution_context_id == 42
        assert ctx.document_object_id == 'doc-obj-456'
        assert ctx.session_id == 'session-789'


class TestIFrameContextResolverInit:
    """Construction behaviour of ``IFrameContextResolver``."""

    def test_initialization(self, mock_element):
        """The element given to the constructor is kept on ``_element``."""
        built = IFrameContextResolver(mock_element)

        assert built._element is mock_element


class TestGetBaseSession:
    """Tests for ``IFrameContextResolver._get_base_session``."""

    def test_get_base_session_default(self, mock_element):
        """With no routing session, the element's own handler is returned."""
        # A MagicMock auto-creates any attribute on access, so the routing
        # fields are set to None explicitly to model "no routing session".
        mock_element._routing_session_id = None
        mock_element._routing_session_handler = None

        base_handler, base_session_id = IFrameContextResolver(
            mock_element
        )._get_base_session()

        assert base_session_id is None
        assert base_handler is mock_element._connection_handler

    def test_get_base_session_with_routing_session(self, mock_element):
        """A routing session set on the element takes precedence."""
        routing_handler = MagicMock()
        mock_element._routing_session_id = 'routing-session-123'
        mock_element._routing_session_handler = routing_handler

        base_handler, base_session_id = IFrameContextResolver(
            mock_element
        )._get_base_session()

        assert base_session_id == 'routing-session-123'
        assert base_handler is routing_handler


class TestExtractFrameMetadata:
    """Tests for the ``IFrameContextResolver._extract_frame_metadata`` static method.

    Each test passes a node-info dict to the method and checks the returned
    four-element tuple, unpacked here as
    ``(frame_id, doc_url, parent_id, backend_id)``.
    """

    def test_extract_with_content_document(self):
        """Test extracting metadata when contentDocument is present."""
        node_info = {
            'contentDocument': {
                'frameId': 'content-frame-id',
                'documentURL': 'https://iframe.example.com',
            },
            'frameId': 'parent-frame-id',
            'backendNodeId': 123,
        }

        frame_id, doc_url, parent_id, backend_id = (
            IFrameContextResolver._extract_frame_metadata(node_info)
        )

        # frame id and URL come from contentDocument; the node's own frameId
        # is reported as the parent.
        assert frame_id == 'content-frame-id'
        assert doc_url == 'https://iframe.example.com'
        assert parent_id == 'parent-frame-id'
        assert backend_id == 123

    def test_extract_without_content_document(self):
        """Test extracting metadata when contentDocument is missing."""
        node_info = {
            'frameId': 'parent-frame-id',
            'backendNodeId': 456,
            'documentURL': 'https://fallback.example.com',
        }

        frame_id, doc_url, parent_id, backend_id = (
            IFrameContextResolver._extract_frame_metadata(node_info)
        )

        assert frame_id is None  # No contentDocument.frameId
        assert doc_url == 'https://fallback.example.com'
        assert parent_id == 'parent-frame-id'
        assert backend_id == 456

    def test_extract_with_base_url_fallback(self):
        """Test documentURL fallback to baseURL."""
        node_info = {
            'contentDocument': {
                'baseURL': 'https://base.example.com',
            },
            'backendNodeId': 789,
        }

        frame_id, doc_url, parent_id, backend_id = (
            IFrameContextResolver._extract_frame_metadata(node_info)
        )

        assert doc_url == 'https://base.example.com'
        # Verify the rest of the tuple as well, so a regression in the other
        # fields cannot hide behind the URL check: neither contentDocument nor
        # the node supplies a frameId here, and backendNodeId is 789.
        assert frame_id is None
        assert parent_id is None
        assert backend_id == 789

    def test_extract_empty_node_info(self):
        """Test extracting from empty node info."""
        node_info = {}

        frame_id, doc_url, parent_id, backend_id = (
            IFrameContextResolver._extract_frame_metadata(node_info)
        )

        assert frame_id is None
        assert doc_url is None
        assert parent_id is None
        assert backend_id is None


class TestWalkFrames:
    """Tests for the ``IFrameContextResolver._walk_frames`` static method."""

    def test_walk_frames_single_frame(self):
        """A tree with an empty ``childFrames`` list yields only its own frame."""
        tree = {
            'frame': {'id': 'frame-1', 'url': 'https://example.com'},
            'childFrames': [],
        }

        walked = list(IFrameContextResolver._walk_frames(tree))

        assert len(walked) == 1
        assert walked[0]['id'] == 'frame-1'

    def test_walk_frames_with_children(self):
        """The parent and both of its direct children are yielded."""
        first_child = {
            'frame': {'id': 'child-frame-1', 'url': 'https://child1.com'},
            'childFrames': [],
        }
        second_child = {
            'frame': {'id': 'child-frame-2', 'url': 'https://child2.com'},
            'childFrames': [],
        }
        tree = {
            'frame': {'id': 'parent-frame', 'url': 'https://parent.com'},
            'childFrames': [first_child, second_child],
        }

        walked = list(IFrameContextResolver._walk_frames(tree))

        assert len(walked) == 3
        walked_ids = [frame['id'] for frame in walked]
        for expected_id in ('parent-frame', 'child-frame-1', 'child-frame-2'):
            assert expected_id in walked_ids

    def test_walk_frames_nested_children(self):
        """Frames nested two levels below the root are reached too."""
        grandchild = {'frame': {'id': 'level-2'}, 'childFrames': []}
        child = {'frame': {'id': 'level-1'}, 'childFrames': [grandchild]}
        tree = {'frame': {'id': 'level-0'}, 'childFrames': [child]}

        walked = list(IFrameContextResolver._walk_frames(tree))

        assert len(walked) == 3
        walked_ids = [frame['id'] for frame in walked]
        for expected_id in ('level-0', 'level-1', 'level-2'):
            assert expected_id in walked_ids

    def test_walk_frames_empty_tree(self):
        """Passing ``None`` as the tree yields nothing."""
        walked = list(IFrameContextResolver._walk_frames(None))

        assert walked == []

    def test_walk_frames_no_child_frames_key(self):
        """A tree dict lacking the ``childFrames`` key still yields its frame."""
        tree = {'frame': {'id': 'single-frame'}}

        walked = list(IFrameContextResolver._walk_frames(tree))

        assert len(walked) == 1
        assert walked[0]['id'] == 'single-frame'


class TestFindChildByParent:
    """Tests for the ``IFrameContextResolver._find_child_by_parent`` static method."""

    def test_find_direct_child(self):
        """A first-level child whose ``parentId`` matches is returned by id."""
        matching_child = {
            'frame': {'id': 'child-1', 'parentId': 'target-parent'},
            'childFrames': [],
        }
        tree = {'frame': {'id': 'root'}, 'childFrames': [matching_child]}

        found = IFrameContextResolver._find_child_by_parent(tree, 'target-parent')

        assert found == 'child-1'

    def test_find_nested_child(self):
        """A matching frame two levels below the root is still found."""
        matching_grandchild = {
            'frame': {'id': 'level-2', 'parentId': 'target-parent'},
            'childFrames': [],
        }
        intermediate = {
            'frame': {'id': 'level-1', 'parentId': 'root'},
            'childFrames': [matching_grandchild],
        }
        tree = {'frame': {'id': 'root'}, 'childFrames': [intermediate]}

        found = IFrameContextResolver._find_child_by_parent(tree, 'target-parent')

        assert found == 'level-2'

    def test_find_child_not_found(self):
        """``None`` is returned when no frame has the requested ``parentId``."""
        unrelated_child = {
            'frame': {'id': 'child', 'parentId': 'other-parent'},
            'childFrames': [],
        }
        tree = {'frame': {'id': 'root'}, 'childFrames': [unrelated_child]}

        found = IFrameContextResolver._find_child_by_parent(tree, 'non-existent')

        assert found is None

    def test_find_child_empty_tree(self):
        """Passing ``None`` as the tree returns ``None``."""
        found = IFrameContextResolver._find_child_by_parent(None, 'any-parent')

        assert found is None

    def test_find_child_no_child_frames(self):
        """A root with an empty ``childFrames`` list returns ``None``."""
        tree = {'frame': {'id': 'root'}, 'childFrames': []}

        found = IFrameContextResolver._find_child_by_parent(tree, 'any-parent')

        assert found is None


class TestGetFrameTreeFor:
    """Tests for the ``IFrameContextResolver._get_frame_tree_for`` static method."""

    @staticmethod
    def _handler_with_tree(root_frame_id):
        """Build a mock handler whose command response wraps a one-frame tree."""
        handler = MagicMock()
        handler.execute_command = AsyncMock(
            return_value={
                'result': {
                    'frameTree': {
                        'frame': {'id': root_frame_id},
                        'childFrames': [],
                    }
                }
            }
        )
        return handler

    @pytest.mark.asyncio
    async def test_get_frame_tree_without_session(self):
        """With no session id, the sent command carries no ``sessionId`` key."""
        handler = self._handler_with_tree('main-frame')

        tree = await IFrameContextResolver._get_frame_tree_for(handler, None)

        assert tree['frame']['id'] == 'main-frame'
        # Exactly one command must have been issued to obtain the tree.
        handler.execute_command.assert_called_once()
        sent_command = handler.execute_command.call_args.args[0]
        assert 'sessionId' not in sent_command

    @pytest.mark.asyncio
    async def test_get_frame_tree_with_session(self):
        """A given session id is attached to the sent command."""
        handler = self._handler_with_tree('session-frame')

        tree = await IFrameContextResolver._get_frame_tree_for(
            handler, 'session-123'
        )

        assert tree['frame']['id'] == 'session-frame'
        sent_command = handler.execute_command.call_args.args[0]
        assert sent_command['sessionId'] == 'session-123'


class TestOwnerBackendFor:
    """Tests for the ``IFrameContextResolver._owner_backend_for`` static method."""

    @staticmethod
    def _handler_returning(response):
        """Build a mock handler whose ``execute_command`` resolves to ``response``."""
        handler = MagicMock()
        handler.execute_command = AsyncMock(return_value=response)
        return handler

    @pytest.mark.asyncio
    async def test_owner_backend_without_session(self):
        """The backend node id is returned; no ``sessionId`` is sent."""
        handler = self._handler_returning({'result': {'backendNodeId': 456}})

        backend_id = await IFrameContextResolver._owner_backend_for(
            handler, None, 'frame-id-123'
        )

        assert backend_id == 456
        sent_command = handler.execute_command.call_args.args[0]
        assert 'sessionId' not in sent_command

    @pytest.mark.asyncio
    async def test_owner_backend_with_session(self):
        """A given session id is attached to the sent command."""
        handler = self._handler_returning({'result': {'backendNodeId': 789}})

        backend_id = await IFrameContextResolver._owner_backend_for(
            handler, 'session-xyz', 'frame-id-456'
        )

        assert backend_id == 789
        sent_command = handler.execute_command.call_args.args[0]
        assert sent_command['sessionId'] == 'session-xyz'

    @pytest.mark.asyncio
    async def test_owner_backend_missing_result(self):
        """An empty response dict leads to ``None`` instead of an error."""
        handler = self._handler_returning({})

        backend_id = await IFrameContextResolver._owner_backend_for(
            handler, None, 'frame-id'
        )

        assert backend_id is None


class TestCreateIsolatedWorldForFrame:
    """Tests for ``IFrameContextResolver._create_isolated_world_for_frame``."""

    @staticmethod
    def _handler_returning(response):
        """Build a mock handler whose ``execute_command`` resolves to ``response``."""
        handler = MagicMock()
        handler.execute_command = AsyncMock(return_value=response)
        return handler

    @pytest.mark.asyncio
    async def test_create_isolated_world_success(self):
        """The execution context id from the response is returned."""
        handler = self._handler_returning({'result': {'executionContextId': 42}})

        context_id = await IFrameContextResolver._create_isolated_world_for_frame(
            'frame-id-123', handler, None
        )

        assert context_id == 42
        sent_command = handler.execute_command.call_args.args[0]
        assert 'sessionId' not in sent_command
        # The world name sent in the command embeds the frame id.
        assert 'pydoll::iframe::frame-id-123' in sent_command['params']['worldName']

    @pytest.mark.asyncio
    async def test_create_isolated_world_with_session(self):
        """A given session id is attached to the sent command."""
        handler = self._handler_returning({'result': {'executionContextId': 99}})

        context_id = await IFrameContextResolver._create_isolated_world_for_frame(
            'frame-id', handler, 'session-abc'
        )

        assert context_id == 99
        sent_command = handler.execute_command.call_args.args[0]
        assert sent_command['sessionId'] == 'session-abc'

    @pytest.mark.asyncio
    async def test_create_isolated_world_failure(self):
        """A response without an execution context id raises ``InvalidIFrame``."""
        handler = self._handler_returning({'result': {}})

        with pytest.raises(InvalidIFrame, match='Unable to create isolated world'):
            await IFrameContextResolver._create_isolated_world_for_frame(
                'frame-id', handler, None
            )


class TestGetDocumentObjectId:
    """Tests for ``IFrameContextResolver._get_document_object_id``."""

    @pytest.mark.asyncio
    async def test_get_document_object_id_success(self, resolver, mock_element):
        """The object id found in the command response is returned."""
        execute = mock_element._connection_handler.execute_command
        execute.return_value = {'result': {'result': {'objectId': 'doc-object-123'}}}
        frame_context = IFrameContext(frame_id='test-frame')

        object_id = await resolver._get_document_object_id(42, frame_context)

        assert object_id == 'doc-object-123'

    @pytest.mark.asyncio
    async def test_get_document_object_id_with_session(self, resolver, mock_element):
        """A context carrying its own session handler has that handler used."""
        session_handler = MagicMock()
        session_handler.execute_command = AsyncMock(
            return_value={'result': {'result': {'objectId': 'session-doc-obj'}}}
        )
        frame_context = IFrameContext(
            frame_id='test-frame',
            session_handler=session_handler,
            session_id='session-123',
        )

        object_id = await resolver._get_document_object_id(99, frame_context)

        assert object_id == 'session-doc-obj'
        session_handler.execute_command.assert_called_once()

    @pytest.mark.asyncio
    async def test_get_document_object_id_failure(self, resolver, mock_element):
        """A response without an object id raises ``InvalidIFrame``."""
        execute = mock_element._connection_handler.execute_command
        execute.return_value = {'result': {'result': {}}}
        frame_context = IFrameContext(frame_id='test-frame')

        with pytest.raises(InvalidIFrame, match='Unable to obtain document reference'):
            await resolver._get_document_object_id(42, frame_context)


class TestResolveOopifIfNeeded:
    """Tests for the early-return paths of ``_resolve_oopif_if_needed``."""

    @pytest.mark.asyncio
    async def test_returns_early_when_no_parent_frame(self, resolver):
        """With ``content_frame_id=None`` the inputs pass through unchanged."""
        handler, session_id, frame_id, url = await resolver._resolve_oopif_if_needed(
            current_frame_id='frame-123',
            content_frame_id=None,
            backend_node_id=456,
            current_document_url='https://example.com',
        )

        # No session is opened, and the frame id / URL are the ones passed in.
        assert handler is None
        assert session_id is None
        assert frame_id == 'frame-123'
        assert url == 'https://example.com'

    @pytest.mark.asyncio
    async def test_returns_early_when_frame_resolved_without_backend(self, resolver):
        """A known frame id with ``backend_node_id=None`` also passes through."""
        handler, session_id, frame_id, url = await resolver._resolve_oopif_if_needed(
            current_frame_id='resolved-frame',
            content_frame_id='parent-123',
            backend_node_id=None,
            current_document_url='https://resolved.com',
        )

        assert handler is None
        assert session_id is None
        assert frame_id == 'resolved-frame'
        assert url == 'https://resolved.com'


class TestResolveFrameByOwner:
    """Tests for ``_resolve_frame_by_owner`` with ``_find_frame_by_owner`` stubbed."""

    @pytest.mark.asyncio
    async def test_resolve_returns_current_url_on_failure(self, resolver):
        """When the lookup finds nothing, the caller's URL is handed back."""
        # Stub the lookup so it reports "no matching frame".
        resolver._find_frame_by_owner = AsyncMock(return_value=(None, None))
        handler = MagicMock()

        frame_id, url = await resolver._resolve_frame_by_owner(
            handler, None, 123, 'https://current.com'
        )

        assert frame_id is None
        assert url == 'https://current.com'

    @pytest.mark.asyncio
    async def test_resolve_returns_found_frame(self, resolver):
        """A successful lookup's frame id and URL are both returned."""
        resolver._find_frame_by_owner = AsyncMock(
            return_value=('found-frame-id', 'https://found.com')
        )
        handler = MagicMock()

        frame_id, url = await resolver._resolve_frame_by_owner(
            handler, None, 456, 'https://fallback.com'
        )

        assert frame_id == 'found-frame-id'
        assert url == 'https://found.com'

    @pytest.mark.asyncio
    async def test_resolve_uses_fallback_url(self, resolver):
        """A found frame without a URL keeps the caller's URL."""
        resolver._find_frame_by_owner = AsyncMock(return_value=('frame-id', None))
        handler = MagicMock()

        frame_id, url = await resolver._resolve_frame_by_owner(
            handler, None, 789, 'https://fallback.com'
        )

        assert frame_id == 'frame-id'
        assert url == 'https://fallback.com'


================================================
FILE: tests/test_interactions/test_keyboard.py
================================================
import pytest
import pytest_asyncio
from unittest.mock import AsyncMock, MagicMock

from pydoll.interactions.keyboard import Keyboard, KeyboardAPI
from pydoll.constants import Key
from pydoll.protocol.input.types import KeyEventType


@pytest_asyncio.fixture
async def mock_tab():
    """Provide a ``MagicMock`` tab with awaitable ``_execute_command`` and ``focus``."""
    fake_tab = MagicMock()
    fake_tab.focus = AsyncMock()
    fake_tab._execute_command = AsyncMock()
    return fake_tab


@pytest_asyncio.fixture
async def keyboard_api(mock_tab):
    """Provide a ``KeyboardAPI`` that sends its commands through ``mock_tab``."""
    api = KeyboardAPI(mock_tab)
    return api


class TestKeyboardAPIInitialization:
    """Construction behaviour of ``KeyboardAPI``."""

    def test_initialization(self, mock_tab):
        """The object passed to the constructor is exposed as ``_executor``."""
        api = KeyboardAPI(mock_tab)

        assert api._executor == mock_tab


class TestKeyboardAPIDown:
    """Tests for ``KeyboardAPI.down``."""

    @pytest.mark.asyncio
    async def test_key_down_without_modifiers(self, keyboard_api, mock_tab):
        """A plain key-down dispatches one fully populated key event."""
        await keyboard_api.down(Key.A)

        execute = mock_tab._execute_command
        assert execute.called

        # The command dict is the first positional argument of the call.
        command = execute.call_args.args[0]
        assert command['method'] == 'Input.dispatchKeyEvent'

        params = command['params']
        assert params['type'] == KeyEventType.KEY_DOWN
        assert params['key'] == 'A'
        assert params['windowsVirtualKeyCode'] == 65
        assert params['nativeVirtualKeyCode'] == 65

    @pytest.mark.asyncio
    async def test_key_down_with_modifiers(self, keyboard_api, mock_tab):
        """The ``modifiers`` argument is forwarded in the event params."""
        await keyboard_api.down(Key.C, modifiers=2)  # 2 is the Ctrl modifier

        params = mock_tab._execute_command.call_args.args[0]['params']

        assert params['type'] == KeyEventType.KEY_DOWN
        assert params['key'] == 'C'
        assert params['modifiers'] == 2

    @pytest.mark.asyncio
    async def test_key_down_enter(self, keyboard_api, mock_tab):
        """Enter is sent with key ``'Enter'`` and virtual key code 13."""
        await keyboard_api.down(Key.ENTER)

        params = mock_tab._execute_command.call_args.args[0]['params']

        assert params['key'] == 'Enter'
        assert params['windowsVirtualKeyCode'] == 13


class TestKeyboardAPIUp:
    """Tests for ``KeyboardAPI.up``."""

    @pytest.mark.asyncio
    async def test_key_up(self, keyboard_api, mock_tab):
        """Releasing a key dispatches a ``KEY_UP`` event for that key."""
        await keyboard_api.up(Key.A)

        command = mock_tab._execute_command.call_args.args[0]
        assert command['method'] == 'Input.dispatchKeyEvent'

        params = command['params']
        assert params['type'] == KeyEventType.KEY_UP
        assert params['key'] == 'A'
        assert params['windowsVirtualKeyCode'] == 65

    @pytest.mark.asyncio
    async def test_key_up_shift(self, keyboard_api, mock_tab):
        """Shift is released with key ``'Shift'`` and virtual key code 16."""
        await keyboard_api.up(Key.SHIFT)

        params = mock_tab._execute_command.call_args.args[0]['params']

        assert params['key'] == 'Shift'
        assert params['windowsVirtualKeyCode'] == 16


class TestKeyboardAPIPress:
    """Tests for ``KeyboardAPI.press``."""

    @pytest.mark.asyncio
    async def test_press_key(self, keyboard_api, mock_tab):
        """A press issues exactly two commands: key-down, then key-up."""
        await keyboard_api.press(Key.ENTER)

        execute = mock_tab._execute_command
        assert execute.call_count == 2

        down_call, up_call = execute.call_args_list[0], execute.call_args_list[1]
        assert down_call.args[0]['params']['type'] == KeyEventType.KEY_DOWN
        assert up_call.args[0]['params']['type'] == KeyEventType.KEY_UP

    @pytest.mark.asyncio
    async def test_press_with_modifiers(self, keyboard_api, mock_tab):
        """The modifier mask is present on the key-down event."""
        await keyboard_api.press(Key.S, modifiers=2)  # Ctrl+S

        down_call = mock_tab._execute_command.call_args_list[0]
        assert down_call.args[0]['params']['modifiers'] == 2

    @pytest.mark.asyncio
    async def test_press_with_custom_interval(self, keyboard_api, mock_tab):
        """A custom ``interval`` still results in two commands."""
        # Only completion and the number of commands are checked here.
        await keyboard_api.press(Key.TAB, interval=0.2)

        assert mock_tab._execute_command.call_count == 2


class TestKeyboardAPIHotkey:
    """Tests for ``KeyboardAPI.hotkey``."""

    @pytest.mark.asyncio
    async def test_hotkey_ctrl_c(self, keyboard_api, mock_tab):
        """Ctrl+C sends C down/up with the Ctrl mask on the key-down."""
        await keyboard_api.hotkey(Key.CONTROL, Key.C)

        execute = mock_tab._execute_command
        # Only the non-modifier key produces commands: C down + C up.
        assert execute.call_count == 2

        down_params = execute.call_args_list[0].args[0]['params']
        assert down_params['type'] == KeyEventType.KEY_DOWN
        assert down_params['key'] == 'C'
        assert down_params['modifiers'] == 2  # Ctrl = 2

        up_params = execute.call_args_list[1].args[0]['params']
        assert up_params['type'] == KeyEventType.KEY_UP
        assert up_params['key'] == 'C'

    @pytest.mark.asyncio
    async def test_hotkey_ctrl_shift_t(self, keyboard_api, mock_tab):
        """Ctrl+Shift+T combines both modifier values on the T key-down."""
        await keyboard_api.hotkey(Key.CONTROL, Key.SHIFT, Key.T)

        execute = mock_tab._execute_command
        # Only the non-modifier key produces commands: T down + T up.
        assert execute.call_count == 2

        down_params = execute.call_args_list[0].args[0]['params']
        assert down_params['key'] == 'T'
        assert down_params['modifiers'] == 10  # Ctrl(2) + Shift(8) = 10

        up_params = execute.call_args_list[1].args[0]['params']
        assert up_params['type'] == KeyEventType.KEY_UP

    @pytest.mark.asyncio
    async def test_hotkey_alt_f4(self, keyboard_api, mock_tab):
        """Alt+F4 sends F4 with the Alt mask."""
        await keyboard_api.hotkey(Key.ALT, Key.F4)

        down_params = mock_tab._execute_command.call_args_list[0].args[0]['params']
        assert down_params['key'] == 'F4'
        assert down_params['modifiers'] == 1  # Alt = 1

    @pytest.mark.asyncio
    async def test_hotkey_shift_a(self, keyboard_api, mock_tab):
        """Shift+A sends A with the Shift mask."""
        await keyboard_api.hotkey(Key.SHIFT, Key.A)

        down_params = mock_tab._execute_command.call_args_list[0].args[0]['params']
        assert down_params['key'] == 'A'
        assert down_params['modifiers'] == 8  # Shift = 8


class TestKeyboardAPISplitModifiers:
    """Tests for the ``KeyboardAPI._split_modifiers_and_keys`` static method."""

    def test_split_single_modifier_and_key(self):
        """Ctrl+C splits into one modifier and one regular key."""
        mods, regular = KeyboardAPI._split_modifiers_and_keys([Key.CONTROL, Key.C])

        assert mods == [Key.CONTROL]
        assert regular == [Key.C]

    def test_split_multiple_modifiers_and_key(self):
        """Ctrl+Shift+T splits into two modifiers and one regular key."""
        mods, regular = KeyboardAPI._split_modifiers_and_keys(
            [Key.CONTROL, Key.SHIFT, Key.T]
        )

        # Modifier order is not part of this check, hence the set comparison.
        assert set(mods) == {Key.CONTROL, Key.SHIFT}
        assert regular == [Key.T]

    def test_split_no_modifiers(self):
        """Input without modifiers yields an empty modifier list."""
        mods, regular = KeyboardAPI._split_modifiers_and_keys([Key.A, Key.B])

        assert mods == []
        assert set(regular) == {Key.A, Key.B}

    def test_split_only_modifiers(self):
        """Input consisting solely of modifiers yields no regular keys."""
        mods, regular = KeyboardAPI._split_modifiers_and_keys(
            [Key.CONTROL, Key.SHIFT]
        )

        assert set(mods) == {Key.CONTROL, Key.SHIFT}
        assert regular == []


class TestKeyboardAPICalculateModifier:
    """Tests for the ``KeyboardAPI._calculate_modifier_value`` static method."""

    def test_calculate_single_modifier_ctrl(self):
        """Ctrl alone evaluates to 2."""
        mask = KeyboardAPI._calculate_modifier_value([Key.CONTROL])

        assert mask == 2

    def test_calculate_single_modifier_shift(self):
        """Shift alone evaluates to 8."""
        mask = KeyboardAPI._calculate_modifier_value([Key.SHIFT])

        assert mask == 8

    def test_calculate_single_modifier_alt(self):
        """Alt alone evaluates to 1."""
        mask = KeyboardAPI._calculate_modifier_value([Key.ALT])

        assert mask == 1

    def test_calculate_single_modifier_meta(self):
        """Meta alone evaluates to 4."""
        mask = KeyboardAPI._calculate_modifier_value([Key.META])

        assert mask == 4

    def test_calculate_ctrl_shift(self):
        """Ctrl and Shift together evaluate to 10."""
        mask = KeyboardAPI._calculate_modifier_value([Key.CONTROL, Key.SHIFT])

        assert mask == 10  # 2 + 8

    def test_calculate_ctrl_alt(self):
        """Ctrl and Alt together evaluate to 3."""
        mask = KeyboardAPI._calculate_modifier_value([Key.CONTROL, Key.ALT])

        assert mask == 3  # 2 + 1

    def test_calculate_all_modifiers(self):
        """All four modifiers together evaluate to 15."""
        mask = KeyboardAPI._calculate_modifier_value(
            [Key.CONTROL, Key.SHIFT, Key.ALT, Key.META]
        )

        assert mask == 15  # 2 + 8 + 1 + 4

    def test_calculate_no_modifiers(self):
        """An empty modifier list evaluates to ``None``."""
        mask = KeyboardAPI._calculate_modifier_value([])

        assert mask is None


class TestKeyboardAPIIntegrationWithTab:
    """Tests for how ``KeyboardAPI`` interacts with the tab it is given."""

    @pytest.mark.asyncio
    async def test_keyboard_api_uses_tab_execute_command(self, mock_tab):
        """A key-down goes through the tab's ``_execute_command``."""
        api = KeyboardAPI(mock_tab)

        await api.down(Key.A)

        assert mock_tab._execute_command.called

    def test_keyboard_api_stores_executor_reference(self, mock_tab):
        """``_executor`` is the same object that was passed in, not a copy."""
        api = KeyboardAPI(mock_tab)

        assert api._executor is mock_tab


class TestKeyboardAPIEdgeCases:
    """Covers less common keys and multi-key sequences."""

    @pytest.mark.asyncio
    async def test_press_numpad_key(self, keyboard_api, mock_tab):
        """Pressing NUMPAD5 sends key 'Numpad5' with virtual key code 101."""
        await keyboard_api.press(Key.NUMPAD5)

        params = mock_tab._execute_command.call_args_list[0].args[0]['params']
        assert params['key'] == 'Numpad5'
        assert params['windowsVirtualKeyCode'] == 101

    @pytest.mark.asyncio
    async def test_press_function_key(self, keyboard_api, mock_tab):
        """Pressing F12 sends key 'F12' with virtual key code 123."""
        await keyboard_api.press(Key.F12)

        params = mock_tab._execute_command.call_args_list[0].args[0]['params']
        assert params['key'] == 'F12'
        assert params['windowsVirtualKeyCode'] == 123

    @pytest.mark.asyncio
    async def test_hotkey_with_digit(self, keyboard_api, mock_tab):
        """Ctrl+1 as a hotkey: the first command carries key '1' and modifiers 2."""
        await keyboard_api.hotkey(Key.CONTROL, Key.DIGIT1)

        params = mock_tab._execute_command.call_args_list[0].args[0]['params']
        assert params['key'] == '1'
        assert params['modifiers'] == 2

    @pytest.mark.asyncio
    async def test_sequential_key_presses(self, keyboard_api, mock_tab):
        """Three presses in a row produce six ordered key events."""
        for key in (Key.A, Key.B, Key.C):
            await keyboard_api.press(key)

        execute = mock_tab._execute_command
        # 3 keys x 2 events (down + up) each.
        assert execute.call_count == 6

        # Expected order: A down, A up, B down, B up, C down, C up.
        sent = [call.args[0]['params'] for call in execute.call_args_list]
        assert sent[0]['key'] == 'A'
        assert sent[0]['type'] == KeyEventType.KEY_DOWN
        assert sent[1]['key'] == 'A'
        assert sent[1]['type'] == KeyEventType.KEY_UP
        assert sent[2]['key'] == 'B'
        assert sent[4]['key'] == 'C'


class TestTimingConfig:
    """Exercises the TimingConfig dataclass."""

    def test_default_values(self):
        """A TimingConfig built without arguments exposes the expected defaults."""
        from pydoll.interactions.keyboard import TimingConfig

        expected_defaults = {
            'keystroke_min': 0.03,
            'keystroke_max': 0.12,
            'punctuation_min': 0.08,
            'punctuation_max': 0.18,
            'thinking_probability': 0.02,
            'thinking_min': 0.3,
            'thinking_max': 0.7,
            'distraction_probability': 0.005,
            'distraction_min': 0.5,
            'distraction_max': 1.2,
            'mistake_realize_min': 0.1,
            'mistake_realize_max': 0.25,
            'after_correction_min': 0.03,
            'after_correction_max': 0.08,
            'double_press_min': 0.02,
            'double_press_max': 0.05,
            'hesitation_min': 0.15,
            'hesitation_max': 0.3,
        }
        config = TimingConfig()

        for field_name, expected in expected_defaults.items():
            assert getattr(config, field_name) == expected, field_name

    def test_custom_values(self):
        """Keyword overrides passed to the constructor are stored as given."""
        from pydoll.interactions.keyboard import TimingConfig

        overrides = {
            'keystroke_min': 0.05,
            'keystroke_max': 0.15,
            'thinking_probability': 0.1,
        }
        config = TimingConfig(**overrides)

        assert config.keystroke_min == 0.05
        assert config.keystroke_max == 0.15
        assert config.thinking_probability == 0.1

    def test_frozen_dataclass(self):
        """Assigning to a field after construction raises AttributeError."""
        from pydoll.interactions.keyboard import TimingConfig

        frozen = TimingConfig()

        with pytest.raises(AttributeError):
            frozen.keystroke_min = 1.0


class TestTypoConfig:
    """Exercises the TypoConfig dataclass."""

    def test_default_values(self):
        """A TypoConfig built without arguments exposes the expected weights."""
        from pydoll.interactions.keyboard import TypoConfig

        expected_defaults = {
            'adjacent_weight': 0.55,
            'transpose_weight': 0.20,
            'double_weight': 0.12,
            'skip_weight': 0.08,
            'missed_space_weight': 0.05,
        }
        config = TypoConfig()

        for field_name, expected in expected_defaults.items():
            assert getattr(config, field_name) == expected, field_name

    def test_custom_values(self):
        """Keyword overrides passed to the constructor are stored as given."""
        from pydoll.interactions.keyboard import TypoConfig

        overrides = {'adjacent_weight': 0.7, 'transpose_weight': 0.1}
        config = TypoConfig(**overrides)

        assert config.adjacent_weight == 0.7
        assert config.transpose_weight == 0.1

    def test_frozen_dataclass(self):
        """Assigning to a field after construction raises AttributeError."""
        from pydoll.interactions.keyboard import TypoConfig

        frozen = TypoConfig()

        with pytest.raises(AttributeError):
            frozen.adjacent_weight = 1.0


class TestTypoResult:
    """Exercises the TypoResult dataclass."""

    def test_typo_result_creation(self):
        """Both fields given to the constructor are readable afterwards."""
        from pydoll.interactions.keyboard import TypoResult
        from pydoll.constants import TypoType

        adjacent = TypoResult(typo_type=TypoType.ADJACENT, wrong_char='e')

        assert adjacent.typo_type == TypoType.ADJACENT
        assert adjacent.wrong_char == 'e'

    def test_typo_result_default_wrong_char(self):
        """Omitting wrong_char leaves it as the empty string."""
        from pydoll.interactions.keyboard import TypoResult
        from pydoll.constants import TypoType

        skipped = TypoResult(typo_type=TypoType.SKIP)

        assert skipped.typo_type == TypoType.SKIP
        assert skipped.wrong_char == ''


class TestKeyboardTypeText:
    """Covers keyboard.type_text() and the per-character helpers behind it."""

    @pytest.mark.asyncio
    async def test_type_text_basic(self, keyboard_api, mock_tab):
        """Non-humanized typing emits a KEY_DOWN/KEY_UP pair per character."""
        await keyboard_api.type_text("ab", humanize=False)

        execute = mock_tab._execute_command
        # Two characters, two events each.
        assert execute.call_count == 4

        # Only the first three events are inspected: 'a' down, 'a' up, 'b' down.
        a_down, a_up, b_down = (
            call.args[0]['params'] for call in execute.call_args_list[:3]
        )
        assert a_down['text'] == 'a'
        assert a_down['type'] == KeyEventType.KEY_DOWN

        assert a_up['type'] == KeyEventType.KEY_UP

        assert b_down['text'] == 'b'
        assert b_down['type'] == KeyEventType.KEY_DOWN

    @pytest.mark.asyncio
    async def test_type_text_with_humanize_calls_humanized_method(self, mock_tab):
        """With humanize=True the text is handed to _type_text_humanized."""
        from pydoll.interactions.keyboard import Keyboard

        humanized = AsyncMock()
        keyboard = Keyboard(mock_tab)
        keyboard._type_text_humanized = humanized

        await keyboard.type_text("test", humanize=True)

        humanized.assert_called_once_with("test")

    @pytest.mark.asyncio
    async def test_type_text_interval_deprecated_warning(self, keyboard_api):
        """Passing interval emits exactly one DeprecationWarning naming it."""
        import warnings

        with warnings.catch_warnings(record=True) as caught:
            # Make sure the warning is not suppressed by an earlier filter.
            warnings.simplefilter("always")
            await keyboard_api.type_text("a", interval=0.1)

            assert len(caught) == 1
            only_warning = caught[0]
            assert issubclass(only_warning.category, DeprecationWarning)
            assert "interval" in str(only_warning.message)

    @pytest.mark.asyncio
    async def test_type_char_calls_focus(self, keyboard_api, mock_tab):
        """Typing a character calls the tab's focus() exactly once."""
        await keyboard_api._type_char("x")

        mock_tab.focus.assert_called_once()

    @pytest.mark.asyncio
    async def test_type_backspace_calls_focus(self, keyboard_api, mock_tab):
        """Typing a backspace calls the tab's focus() exactly once."""
        await keyboard_api._type_backspace()

        mock_tab.focus.assert_called_once()

    @pytest.mark.asyncio
    async def test_ensure_focus_skipped_without_focus_method(self):
        """An executor lacking focus() gives _has_focus False and still types."""
        # spec restricts the mock to _execute_command, so it has no focus attribute.
        bare_executor = MagicMock(spec=['_execute_command'])
        bare_executor._execute_command = AsyncMock()
        keyboard = Keyboard(bare_executor)

        assert keyboard._has_focus is False
        # Must complete without raising.
        await keyboard._type_char("a")

    @pytest.mark.asyncio
    async def test_type_char(self, keyboard_api, mock_tab):
        """_type_char sends a KEY_DOWN then a KEY_UP, both carrying key details."""
        await keyboard_api._type_char("x")

        execute = mock_tab._execute_command
        assert execute.call_count == 2

        down_cmd, up_cmd = (call.args[0] for call in execute.call_args_list)

        # KEY_DOWN: text plus key, code and both virtual key codes.
        assert down_cmd['method'] == 'Input.dispatchKeyEvent'
        down_params = down_cmd['params']
        assert down_params['type'] == KeyEventType.KEY_DOWN
        assert down_params['text'] == 'x'
        assert down_params['key'] == 'x'
        assert down_params['code'] == 'KeyX'
        assert down_params['windowsVirtualKeyCode'] == 88
        assert down_params['nativeVirtualKeyCode'] == 88

        # KEY_UP: key, code and the Windows virtual key code.
        assert up_cmd['method'] == 'Input.dispatchKeyEvent'
        up_params = up_cmd['params']
        assert up_params['type'] == KeyEventType.KEY_UP
        assert up_params['key'] == 'x'
        assert up_params['code'] == 'KeyX'
        assert up_params['windowsVirtualKeyCode'] == 88

    @pytest.mark.asyncio
    async def test_type_char_uppercase(self, keyboard_api, mock_tab):
        """An uppercase letter keeps its case in text/key and maps to KeyA/65."""
        await keyboard_api._type_char("A")

        params = mock_tab._execute_command.call_args_list[0].args[0]['params']
        assert params['text'] == 'A'
        assert params['key'] == 'A'
        assert params['code'] == 'KeyA'
        assert params['windowsVirtualKeyCode'] == 65

    @pytest.mark.asyncio
    async def test_type_char_digit(self, keyboard_api, mock_tab):
        """The digit '5' maps to code Digit5 and key code 53."""
        await keyboard_api._type_char("5")

        params = mock_tab._execute_command.call_args_list[0].args[0]['params']
        assert params['text'] == '5'
        assert params['key'] == '5'
        assert params['code'] == 'Digit5'
        assert params['windowsVirtualKeyCode'] == 53

    @pytest.mark.asyncio
    async def test_type_char_symbol(self, keyboard_api, mock_tab):
        """The symbol '@' maps to code Digit2 and key code 50."""
        await keyboard_api._type_char("@")

        params = mock_tab._execute_command.call_args_list[0].args[0]['params']
        assert params['text'] == '@'
        assert params['key'] == '@'
        assert params['code'] == 'Digit2'
        assert params['windowsVirtualKeyCode'] == 50

    @pytest.mark.asyncio
    async def test_type_char_unmapped(self, keyboard_api, mock_tab):
        """An accented character is sent as-is with a key code of 0."""
        accented_e = "\u00e9"
        await keyboard_api._type_char(accented_e)

        params = mock_tab._execute_command.call_args_list[0].args[0]['params']
        assert params['text'] == '\u00e9'
        assert params['key'] == '\u00e9'
        assert params['windowsVirtualKeyCode'] == 0

    @pytest.mark.asyncio
    @pytest.mark.parametrize(
        'char',
        list('abcdefghijklmnopqrstuvwxyz'
             'ABCDEFGHIJKLMNOPQRSTUVWXYZ'
             '0123456789'
             ' -=[]\\;\',./`'
             '!@#$%^&*()_+{}|:"<>?~'
             '\n\t'),
    )
    async def test_type_char_all_mapped_characters(self, mock_tab, char):
        """Each listed character is sent with its CHAR_TO_KEY_INFO entry."""
        from pydoll.constants import CHAR_TO_KEY_INFO

        await Keyboard(mock_tab)._type_char(char)

        params = mock_tab._execute_command.call_args_list[0].args[0]['params']
        expected_key, expected_code, expected_keycode = CHAR_TO_KEY_INFO[char]

        assert params['text'] == char
        assert params['key'] == expected_key
        assert params['code'] == expected_code
        assert params['windowsVirtualKeyCode'] == expected_keycode
        # A zero key code is what unmapped characters get, so it must not appear here.
        assert expected_keycode > 0, f'keycode for {char!r} should not be 0'

    @pytest.mark.asyncio
    async def test_type_backspace(self, keyboard_api, mock_tab):
        """_type_backspace sends a Backspace KEY_DOWN followed by a KEY_UP."""
        await keyboard_api._type_backspace()

        execute = mock_tab._execute_command
        assert execute.call_count == 2

        down_params = execute.call_args_list[0].args[0]['params']
        assert down_params['key'] == 'Backspace'
        assert down_params['type'] == KeyEventType.KEY_DOWN

        up_params = execute.call_args_list[1].args[0]['params']
        assert up_params['type'] == KeyEventType.KEY_UP


class TestKeyboardTypoGeneration:
    """Covers the helpers that decide on and build typos."""

    def test_should_make_typo_returns_boolean(self):
        """_should_make_typo, called on the class, returns a bool."""
        from pydoll.interactions.keyboard import Keyboard

        assert isinstance(Keyboard._should_make_typo(), bool)

    def test_select_typo_type_returns_valid_type(self, keyboard_api):
        """_select_typo_type only ever returns one of the five known types."""
        from pydoll.constants import TypoType

        allowed = {
            TypoType.ADJACENT,
            TypoType.TRANSPOSE,
            TypoType.DOUBLE,
            TypoType.SKIP,
            TypoType.MISSED_SPACE,
        }

        # Sample the selector ten times.
        for _attempt in range(10):
            assert keyboard_api._select_typo_type() in allowed

    def test_create_adjacent_typo_returns_adjacent_type(self):
        """For 'a' the adjacent typo is ADJACENT with a non-empty wrong char."""
        from pydoll.interactions.keyboard import Keyboard
        from pydoll.constants import TypoType

        typo = Keyboard._create_adjacent_typo('a')

        assert typo.typo_type == TypoType.ADJACENT
        assert typo.wrong_char != ''

    def test_create_adjacent_typo_fallback_for_unknown_char(self):
        """For '@' the adjacent typo degrades to DOUBLE of the same char."""
        from pydoll.interactions.keyboard import Keyboard
        from pydoll.constants import TypoType

        # '@' is expected to have no entry in the QWERTY neighbor table.
        typo = Keyboard._create_adjacent_typo('@')

        assert typo.typo_type == TypoType.DOUBLE
        assert typo.wrong_char == '@'

    def test_create_adjacent_typo_preserves_case(self):
        """The wrong char, when present, has the same case as the input."""
        from pydoll.interactions.keyboard import Keyboard

        # Uppercase input first, then lowercase; each checked right after its call.
        for source_char, has_expected_case in (('A', str.isupper), ('a', str.islower)):
            wrong_char = Keyboard._create_adjacent_typo(source_char).wrong_char
            if wrong_char:
                assert has_expected_case(wrong_char)

    def test_create_transpose_typo(self, keyboard_api):
        """With a next char available the typo is TRANSPOSE of that char."""
        from pydoll.constants import TypoType

        typo = keyboard_api._create_transpose_typo('a', 'b')

        assert typo.typo_type == TypoType.TRANSPOSE
        assert typo.wrong_char == 'b'

    def test_create_transpose_typo_fallback_no_next_char(self, keyboard_api):
        """Without a next char the transpose typo degrades to ADJACENT."""
        from pydoll.constants import TypoType

        typo = keyboard_api._create_transpose_typo('a', None)

        assert typo.typo_type == TypoType.ADJACENT

    def test_create_missed_space_typo(self, keyboard_api):
        """For a space the result is a MISSED_SPACE typo."""
        from pydoll.constants import TypoType

        typo = keyboard_api._create_missed_space_typo(' ')

        assert typo.typo_type == TypoType.MISSED_SPACE

    def test_create_missed_space_typo_fallback_non_space(self, keyboard_api):
        """For a non-space char the missed-space typo degrades to ADJACENT."""
        from pydoll.constants import TypoType

        typo = keyboard_api._create_missed_space_typo('a')

        assert typo.typo_type == TypoType.ADJACENT

    def test_generate_typo_returns_typo_result(self, keyboard_api):
        """_generate_typo returns a TypoResult instance."""
        from pydoll.interactions.keyboard import TypoResult

        assert isinstance(keyboard_api._generate_typo('a', 'b'), TypoResult)

    def test_create_typo_with_all_types(self, keyboard_api):
        """_create_typo returns a TypoResult for every TypoType member."""
        from pydoll.constants import TypoType
        from pydoll.interactions.keyboard import TypoResult

        for member in TypoType:
            created = keyboard_api._create_typo(member, 'a', 'b')
            assert isinstance(created, TypoResult)


class TestKeyboardTypoHandling:
    """Covers the helpers that act out a typo and its correction."""

    @pytest.mark.asyncio
    async def test_do_adjacent_typo(self, keyboard_api, mock_tab):
        """An adjacent typo sends at least three commands."""
        await keyboard_api._do_adjacent_typo('a', 's')

        # Intended sequence: wrong 's', backspace, correct 'a'.
        # Only a lower bound on the number of commands is enforced.
        assert mock_tab._execute_command.call_count >= 3

    @pytest.mark.asyncio
    async def test_do_transpose_typo(self, keyboard_api, mock_tab):
        """A transpose typo sends at least four commands."""
        await keyboard_api._do_transpose_typo('a', 'b')

        # Intended sequence: 'b', 'a', two backspaces, then 'a', 'b'.
        assert mock_tab._execute_command.call_count >= 4

    @pytest.mark.asyncio
    async def test_do_double_typo(self, keyboard_api, mock_tab):
        """A double typo sends at least three commands."""
        await keyboard_api._do_double_typo('a')

        # Intended sequence: 'a', 'a', backspace.
        assert mock_tab._execute_command.call_count >= 3

    @pytest.mark.asyncio
    async def test_do_skip_typo(self, keyboard_api, mock_tab):
        """A skip typo ends up typing the character once (down + up)."""
        await keyboard_api._do_skip_typo('a')

        execute = mock_tab._execute_command
        assert execute.call_count == 2

        down_params = execute.call_args_list[0].args[0]['params']
        assert down_params['text'] == 'a'
        assert down_params['type'] == KeyEventType.KEY_DOWN

    @pytest.mark.asyncio
    async def test_do_missed_space_typo(self, keyboard_api, mock_tab):
        """A missed-space typo sends at least four commands."""
        await keyboard_api._do_missed_space_typo(' ', 'w')

        # Intended sequence: 'w', backspace, ' ', 'w'.
        assert mock_tab._execute_command.call_count >= 4

    @pytest.mark.asyncio
    async def test_handle_typo_adjacent(self, keyboard_api, mock_tab):
        """ADJACENT typos send commands and do not consume the next char."""
        from pydoll.interactions.keyboard import TypoResult
        from pydoll.constants import TypoType

        adjacent = TypoResult(typo_type=TypoType.ADJACENT, wrong_char='s')
        skip_next = await keyboard_api._handle_typo('a', 'b', adjacent)

        assert skip_next is False
        assert mock_tab._execute_command.call_count >= 1

    @pytest.mark.asyncio
    async def test_handle_typo_transpose_skips_next(self, keyboard_api, mock_tab):
        """TRANSPOSE typos report that the next char was consumed."""
        from pydoll.interactions.keyboard import TypoResult
        from pydoll.constants import TypoType

        transposed = TypoResult(typo_type=TypoType.TRANSPOSE, wrong_char='b')
        skip_next = await keyboard_api._handle_typo('a', 'b', transposed)

        assert skip_next is True

    @pytest.mark.asyncio
    async def test_handle_typo_double(self, keyboard_api, mock_tab):
        """DOUBLE typos do not consume the next char."""
        from pydoll.interactions.keyboard import TypoResult
        from pydoll.constants import TypoType

        doubled = TypoResult(typo_type=TypoType.DOUBLE, wrong_char='a')
        skip_next = await keyboard_api._handle_typo('a', 'b', doubled)

        assert skip_next is False

    @pytest.mark.asyncio
    async def test_handle_typo_skip(self, keyboard_api, mock_tab):
        """SKIP typos do not consume the next char."""
        from pydoll.interactions.keyboard import TypoResult
        from pydoll.constants import TypoType

        skipped = TypoResult(typo_type=TypoType.SKIP)
        skip_next = await keyboard_api._handle_typo('a', 'b', skipped)

        assert skip_next is False

    @pytest.mark.asyncio
    async def test_handle_typo_missed_space_skips_next(self, keyboard_api, mock_tab):
        """MISSED_SPACE typos report that the next char was consumed."""
        from pydoll.interactions.keyboard import TypoResult
        from pydoll.constants import TypoType

        missed = TypoResult(typo_type=TypoType.MISSED_SPACE)
        skip_next = await keyboard_api._handle_typo(' ', 'w', missed)

        assert skip_next is True


class TestKeyboardRealisticDelay:
    """Smoke tests for the realistic-delay helper and its pause characters."""

    @pytest.mark.asyncio
    async def test_apply_realistic_delay_basic(self, keyboard_api):
        """_apply_realistic_delay completes for an ordinary letter."""
        # No assertion: the test passes as long as nothing raises.
        await keyboard_api._apply_realistic_delay('a')

    @pytest.mark.asyncio
    async def test_apply_realistic_delay_with_punctuation(self, keyboard_api):
        """_apply_realistic_delay completes for each punctuation/pause char."""
        # No assertion: the test passes as long as nothing raises.
        for pause_char in ' .,!?;:\n':
            await keyboard_api._apply_realistic_delay(pause_char)

    def test_pause_chars_constant(self):
        """Keyboard.PAUSE_CHARS contains every expected pause character."""
        from pydoll.interactions.keyboard import Keyboard

        for expected_char in (' ', '.', ',', '!', '?', ';', ':', '\n'):
            assert expected_char in Keyboard.PAUSE_CHARS


class TestKeyboardWithCustomConfig:
    """Checks that Keyboard stores the configuration objects it is given."""

    def test_keyboard_with_custom_timing(self, mock_tab):
        """A TimingConfig passed as ``timing`` ends up in ``_timing``."""
        from pydoll.interactions.keyboard import Keyboard, TimingConfig

        slow_timing = TimingConfig(keystroke_min=0.1, keystroke_max=0.2)

        keyboard = Keyboard(mock_tab, timing=slow_timing)

        assert keyboard._timing == slow_timing
        assert keyboard._timing.keystroke_min == 0.1

    def test_keyboard_with_custom_typo_config(self, mock_tab):
        """A TypoConfig passed as ``typo_config`` ends up in ``_typo_config``."""
        from pydoll.interactions.keyboard import Keyboard, TypoConfig

        skewed_typos = TypoConfig(adjacent_weight=0.9, transpose_weight=0.1)

        keyboard = Keyboard(mock_tab, typo_config=skewed_typos)

        assert keyboard._typo_config == skewed_typos
        assert keyboard._typo_config.adjacent_weight == 0.9

    def test_keyboard_uses_default_configs(self, mock_tab):
        """Without explicit configs the default timing and typo values apply."""
        from pydoll.interactions.keyboard import Keyboard

        plain = Keyboard(mock_tab)

        assert plain._timing.keystroke_min == 0.03
        assert plain._typo_config.adjacent_weight == 0.55


class TestKeyboardProcessCharWithTypo:
    """Covers _process_char_with_typo with the typo decision forced."""

    @pytest.mark.asyncio
    async def test_process_char_no_typo(self, mock_tab):
        """With typos forced off, the char is typed once and nothing is skipped."""
        from pydoll.interactions.keyboard import Keyboard
        from unittest.mock import patch

        keyboard = Keyboard(mock_tab)

        # Force the "no typo" branch.
        no_typo = patch.object(keyboard, '_should_make_typo', return_value=False)
        with no_typo:
            skip_next = await keyboard._process_char_with_typo('a', 'b')

        assert skip_next is False
        assert mock_tab._execute_command.call_count == 2

    @pytest.mark.asyncio
    async def test_process_char_with_typo(self, mock_tab):
        """With a forced SKIP typo, the next char is not reported as consumed."""
        from pydoll.interactions.keyboard import Keyboard, TypoResult
        from pydoll.constants import TypoType
        from unittest.mock import patch

        keyboard = Keyboard(mock_tab)

        # Force the typo branch and pin the generated typo to SKIP, the simplest case.
        force_typo = patch.object(keyboard, '_should_make_typo', return_value=True)
        force_skip = patch.object(
            keyboard,
            '_generate_typo',
            return_value=TypoResult(typo_type=TypoType.SKIP),
        )
        with force_typo, force_skip:
            skip_next = await keyboard._process_char_with_typo('a', 'b')

        assert skip_next is False


class TestKeyboardAPIBackwardCompatibility:
    """Guards the legacy KeyboardAPI name."""

    def test_keyboard_api_alias(self):
        """KeyboardAPI must be the very same object as Keyboard."""
        from pydoll.interactions.keyboard import Keyboard as current_class
        from pydoll.interactions.keyboard import KeyboardAPI as legacy_name

        assert legacy_name is current_class


================================================
FILE: tests/test_interactions/test_mouse.py
================================================
import math

import pytest
import pytest_asyncio
from unittest.mock import AsyncMock, MagicMock, patch

from pydoll.interactions.mouse import Mouse, MouseAPI, MouseTimingConfig
from pydoll.interactions.utils import (
    bezier_2d,
    fitts_duration,
    minimum_jerk,
    random_control_points,
)
from pydoll.protocol.input.types import MouseButton, MouseEventType


@pytest_asyncio.fixture
async def mock_tab():
    """Provide a MagicMock tab whose ``_execute_command`` is an AsyncMock."""
    fake_tab = MagicMock()
    # Replaced explicitly so the tests can await it and inspect its calls.
    fake_tab._execute_command = AsyncMock()
    return fake_tab


@pytest_asyncio.fixture
async def mouse(mock_tab):
    """Provide a Mouse built on top of the mocked tab."""
    mouse_under_test = Mouse(mock_tab)
    return mouse_under_test


# ── MouseTimingConfig ──────────────────────────────────────────────────


class TestMouseTimingConfig:
    """Exercises the MouseTimingConfig dataclass."""

    def test_default_values(self):
        """A config built without arguments exposes the expected defaults."""
        expected_defaults = {
            'fitts_a': 0.070,
            'fitts_b': 0.150,
            'frame_interval': 0.012,
            'frame_interval_variance': 0.004,
            'curvature_min': 0.10,
            'curvature_max': 0.30,
            'curvature_asymmetry': 0.6,
            'short_distance_threshold': 50.0,
            'tremor_amplitude': 1.0,
            'overshoot_probability': 0.70,
            'overshoot_distance_min': 0.03,
            'overshoot_distance_max': 0.12,
            'overshoot_speed_threshold': 200.0,
            'pre_click_pause_min': 0.05,
            'pre_click_pause_max': 0.20,
            'click_hold_min': 0.05,
            'click_hold_max': 0.15,
            'double_click_interval_min': 0.05,
            'double_click_interval_max': 0.10,
            'drag_start_pause_min': 0.08,
            'drag_start_pause_max': 0.20,
            'drag_end_pause_min': 0.05,
            'drag_end_pause_max': 0.15,
            'micro_pause_probability': 0.03,
            'micro_pause_min': 0.015,
            'micro_pause_max': 0.04,
            'min_duration': 0.08,
            'max_duration': 2.5,
        }
        config = MouseTimingConfig()

        for field_name, expected in expected_defaults.items():
            assert getattr(config, field_name) == expected, field_name

    def test_custom_values(self):
        """Keyword overrides passed to the constructor are stored as given."""
        overrides = {'fitts_a': 0.1, 'fitts_b': 0.2, 'tremor_amplitude': 2.0}
        config = MouseTimingConfig(**overrides)

        assert config.fitts_a == 0.1
        assert config.fitts_b == 0.2
        assert config.tremor_amplitude == 2.0

    def test_frozen_dataclass(self):
        """Assigning to a field after construction raises AttributeError."""
        frozen = MouseTimingConfig()
        with pytest.raises(AttributeError):
            frozen.fitts_a = 1.0


# ── Mouse Initialization ──────────────────────────────────────────────


class TestMouseInitialization:
    """Checks the state of a freshly constructed Mouse."""

    def test_initialization(self, mock_tab):
        """A new Mouse keeps its tab, a default timing config and position (0, 0)."""
        created = Mouse(mock_tab)

        assert created._tab == mock_tab
        assert isinstance(created._timing, MouseTimingConfig)
        assert created._position == (0.0, 0.0)

    def test_initialization_with_custom_timing(self, mock_tab):
        """A timing config passed to the constructor is the one in use."""
        created = Mouse(mock_tab, timing=MouseTimingConfig(fitts_a=0.1))
        assert created._timing.fitts_a == 0.1

    def test_timing_property_getter(self, mock_tab):
        """The ``timing`` property returns the exact object given at construction."""
        supplied = MouseTimingConfig(fitts_a=0.2)
        created = Mouse(mock_tab, timing=supplied)

        assert created.timing is supplied
        assert created.timing.fitts_a == 0.2

    def test_timing_property_setter(self, mock_tab):
        """Assigning to ``timing`` replaces the default config object."""
        created = Mouse(mock_tab)
        original_timing = created.timing
        replacement = MouseTimingConfig(fitts_a=0.5, tremor_amplitude=2.0)

        created.timing = replacement

        assert created.timing is replacement
        assert created.timing is not original_timing
        assert created.timing.fitts_a == 0.5
        assert created.timing.tremor_amplitude == 2.0

    def test_initial_position_is_origin(self, mock_tab):
        """The tracked position starts at (0.0, 0.0)."""
        assert Mouse(mock_tab)._position == (0.0, 0.0)


# ── Mouse.move() ──────────────────────────────────────────────────────


class TestMouseMove:
    """Behaviour of Mouse.move() with and without humanization."""

    @pytest.mark.asyncio
    async def test_move_dispatches_mouse_moved(self, mouse, mock_tab):
        """A plain move issues an Input.dispatchMouseEvent MOUSE_MOVED command at the target."""
        await mouse.move(100, 200, humanize=False)

        executor = mock_tab._execute_command
        assert executor.called
        sent = executor.call_args.args[0]
        assert sent['method'] == 'Input.dispatchMouseEvent'
        assert sent['params']['type'] == MouseEventType.MOUSE_MOVED
        assert sent['params']['x'] == 100
        assert sent['params']['y'] == 200

    @pytest.mark.asyncio
    async def test_move_updates_position(self, mouse):
        """The tracked position equals the move target afterwards."""
        target = (150, 250)
        await mouse.move(*target, humanize=False)
        assert mouse._position == target

    @pytest.mark.asyncio
    async def test_move_rounds_float_coordinates(self, mouse, mock_tab):
        """Fractional targets reach the command as rounded integers."""
        await mouse.move(99.7, 200.3, humanize=False)

        params = mock_tab._execute_command.call_args.args[0]['params']
        assert params['x'] == 100
        assert params['y'] == 200

    @pytest.mark.asyncio
    async def test_move_single_event_when_not_humanized(self, mouse, mock_tab):
        """Without humanization exactly one command is executed."""
        await mouse.move(100, 200, humanize=False)
        dispatched = mock_tab._execute_command.call_count
        assert dispatched == 1

    @pytest.mark.asyncio
    async def test_move_humanize_delegates_to_humanized(self, mouse):
        """``humanize=True`` forwards the coordinates to ``_move_humanized``."""
        with patch.object(mouse, '_move_humanized', new_callable=AsyncMock) as spy:
            await mouse.move(100, 200, humanize=True)
            spy.assert_called_once_with(100, 200)


# ── Mouse.click() ─────────────────────────────────────────────────────


class TestMouseClick:
    """Behaviour of Mouse.click() with and without humanization."""

    @staticmethod
    def _commands(tab):
        """Return, in order, the first positional argument of every executed command."""
        return [entry.args[0] for entry in tab._execute_command.call_args_list]

    @pytest.mark.asyncio
    async def test_click_dispatches_move_press_release(self, mouse, mock_tab):
        """A plain click is exactly three commands: move, press, release."""
        await mouse.click(300, 400, humanize=False)

        assert mock_tab._execute_command.call_count == 3

        moved, pressed, released = self._commands(mock_tab)[:3]
        assert moved['params']['type'] == MouseEventType.MOUSE_MOVED
        assert pressed['params']['type'] == MouseEventType.MOUSE_PRESSED
        assert released['params']['type'] == MouseEventType.MOUSE_RELEASED

    @pytest.mark.asyncio
    async def test_click_left_button_default(self, mouse, mock_tab):
        """With no ``button`` argument both press and release use the left button."""
        await mouse.click(300, 400, humanize=False)

        sent = self._commands(mock_tab)
        for position in (1, 2):
            assert sent[position]['params']['button'] == MouseButton.LEFT

    @pytest.mark.asyncio
    async def test_click_right_button(self, mouse, mock_tab):
        """An explicit right button shows up on the press command."""
        await mouse.click(300, 400, button=MouseButton.RIGHT, humanize=False)

        press = self._commands(mock_tab)[1]
        assert press['params']['button'] == MouseButton.RIGHT

    @pytest.mark.asyncio
    async def test_click_with_click_count(self, mouse, mock_tab):
        """``click_count`` is copied to both press and release when not humanized."""
        await mouse.click(300, 400, click_count=2, humanize=False)

        sent = self._commands(mock_tab)
        for position in (1, 2):
            assert sent[position]['params']['clickCount'] == 2

    @pytest.mark.asyncio
    async def test_click_updates_position(self, mouse):
        """The tracked position equals the click target afterwards."""
        await mouse.click(300, 400, humanize=False)
        assert mouse._position == (300, 400)

    @pytest.mark.asyncio
    async def test_click_position_in_press_release(self, mouse, mock_tab):
        """Press and release both carry the click coordinates."""
        await mouse.click(300, 400, humanize=False)

        sent = self._commands(mock_tab)
        for position in (1, 2):
            params = sent[position]['params']
            assert params['x'] == 300
            assert params['y'] == 400

    @pytest.mark.asyncio
    async def test_click_humanize_delegates(self, mouse):
        """``humanize=True`` forwards target, button and count to ``_click_humanized``."""
        with patch.object(mouse, '_click_humanized', new_callable=AsyncMock) as spy:
            await mouse.click(300, 400, humanize=True)
            spy.assert_called_once_with(300, 400, MouseButton.LEFT, 1)


# ── Mouse.double_click() ──────────────────────────────────────────────


class TestMouseDoubleClick:
    """Mouse.double_click() is expected to forward to click() with click_count=2."""

    @pytest.mark.asyncio
    async def test_double_click_delegates_to_click(self, mouse):
        """Defaults are forwarded as left button, count 2, not humanized."""
        with patch.object(mouse, 'click', new_callable=AsyncMock) as click_spy:
            await mouse.double_click(500, 600)
            expected_kwargs = {'button': MouseButton.LEFT, 'click_count': 2, 'humanize': False}
            click_spy.assert_called_once_with(500, 600, **expected_kwargs)

    @pytest.mark.asyncio
    async def test_double_click_right_button(self, mouse):
        """An explicit button is passed through unchanged."""
        with patch.object(mouse, 'click', new_callable=AsyncMock) as click_spy:
            await mouse.double_click(500, 600, button=MouseButton.RIGHT)
            expected_kwargs = {'button': MouseButton.RIGHT, 'click_count': 2, 'humanize': False}
            click_spy.assert_called_once_with(500, 600, **expected_kwargs)

    @pytest.mark.asyncio
    async def test_double_click_humanized(self, mouse):
        """``humanize=True`` is passed through unchanged."""
        with patch.object(mouse, 'click', new_callable=AsyncMock) as click_spy:
            await mouse.double_click(500, 600, humanize=True)
            expected_kwargs = {'button': MouseButton.LEFT, 'click_count': 2, 'humanize': True}
            click_spy.assert_called_once_with(500, 600, **expected_kwargs)


# ── Mouse.down() ──────────────────────────────────────────────────────


class TestMouseDown:
    """Behaviour of Mouse.down()."""

    @pytest.mark.asyncio
    async def test_down_dispatches_mouse_pressed(self, mouse, mock_tab):
        """With no arguments a left-button MOUSE_PRESSED command is sent."""
        await mouse.down()

        params = mock_tab._execute_command.call_args.args[0]['params']
        assert params['type'] == MouseEventType.MOUSE_PRESSED
        assert params['button'] == MouseButton.LEFT

    @pytest.mark.asyncio
    async def test_down_at_current_position(self, mouse, mock_tab):
        """The press is sent at the currently tracked position."""
        mouse._position = (100.0, 200.0)
        await mouse.down()

        params = mock_tab._execute_command.call_args.args[0]['params']
        assert params['x'] == 100
        assert params['y'] == 200

    @pytest.mark.asyncio
    async def test_down_with_right_button(self, mouse, mock_tab):
        """An explicit button is used for the press."""
        await mouse.down(button=MouseButton.RIGHT)

        last_command = mock_tab._execute_command.call_args.args[0]
        assert last_command['params']['button'] == MouseButton.RIGHT


# ── Mouse.up() ────────────────────────────────────────────────────────


class TestMouseUp:
    """Behaviour of Mouse.up()."""

    @pytest.mark.asyncio
    async def test_up_dispatches_mouse_released(self, mouse, mock_tab):
        """With no arguments a left-button MOUSE_RELEASED command is sent."""
        await mouse.up()

        params = mock_tab._execute_command.call_args.args[0]['params']
        assert params['type'] == MouseEventType.MOUSE_RELEASED
        assert params['button'] == MouseButton.LEFT

    @pytest.mark.asyncio
    async def test_up_at_current_position(self, mouse, mock_tab):
        """The release is sent at the currently tracked position."""
        mouse._position = (100.0, 200.0)
        await mouse.up()

        params = mock_tab._execute_command.call_args.args[0]['params']
        assert params['x'] == 100
        assert params['y'] == 200

    @pytest.mark.asyncio
    async def test_up_with_right_button(self, mouse, mock_tab):
        """An explicit button is used for the release."""
        await mouse.up(button=MouseButton.RIGHT)

        last_command = mock_tab._execute_command.call_args.args[0]
        assert last_command['params']['button'] == MouseButton.RIGHT


# ── Mouse.drag() ──────────────────────────────────────────────────────


class TestMouseDrag:
    """Behaviour of Mouse.drag() with and without humanization."""

    @pytest.mark.asyncio
    async def test_drag_dispatches_correct_sequence(self, mouse, mock_tab):
        """A plain drag is four commands: move to start, press, move to end, release."""
        await mouse.drag(100, 200, 500, 600, humanize=False)

        executor = mock_tab._execute_command
        assert executor.call_count == 4
        to_start, press, to_end, release = (
            entry.args[0]['params'] for entry in executor.call_args_list
        )

        assert to_start['type'] == MouseEventType.MOUSE_MOVED
        assert to_start['x'] == 100
        assert to_start['y'] == 200
        assert press['type'] == MouseEventType.MOUSE_PRESSED
        assert to_end['type'] == MouseEventType.MOUSE_MOVED
        assert to_end['x'] == 500
        assert to_end['y'] == 600
        assert release['type'] == MouseEventType.MOUSE_RELEASED

    @pytest.mark.asyncio
    async def test_drag_updates_position_to_end(self, mouse):
        """The tracked position equals the drag end point afterwards."""
        await mouse.drag(100, 200, 500, 600, humanize=False)
        assert mouse._position == (500, 600)

    @pytest.mark.asyncio
    async def test_drag_uses_left_button(self, mouse, mock_tab):
        """Press (2nd command) and release (4th command) use the left button."""
        await mouse.drag(100, 200, 500, 600, humanize=False)

        sent = [entry.args[0] for entry in mock_tab._execute_command.call_args_list]
        for position in (1, 3):
            assert sent[position]['params']['button'] == MouseButton.LEFT

    @pytest.mark.asyncio
    async def test_drag_humanize_delegates(self, mouse):
        """``humanize=True`` forwards all four coordinates to ``_drag_humanized``."""
        with patch.object(mouse, '_drag_humanized', new_callable=AsyncMock) as spy:
            await mouse.drag(100, 200, 500, 600, humanize=True)
            spy.assert_called_once_with(100, 200, 500, 600)


# ── Helper Functions ──────────────────────────────────────────────────


class TestMinimumJerk:
    """Checks on the minimum_jerk easing helper over the interval [0, 1]."""

    def test_at_zero(self):
        """The curve starts at 0."""
        assert minimum_jerk(0.0) == pytest.approx(0.0)

    def test_at_one(self):
        """The curve ends at 1."""
        assert minimum_jerk(1.0) == pytest.approx(1.0)

    def test_at_half(self):
        """The midpoint maps to roughly 0.5."""
        midpoint = minimum_jerk(0.5)
        assert midpoint == pytest.approx(0.5, abs=0.01)

    def test_monotonic(self):
        """Sampled at 1% steps, the output never decreases."""
        samples = [minimum_jerk(step / 100.0) for step in range(101)]
        for earlier, later in zip(samples, samples[1:]):
            assert later >= earlier

    def test_stays_in_range(self):
        """Sampled at 5% steps, the output stays within [0, 1]."""
        for step in range(21):
            eased = minimum_jerk(step / 20.0)
            assert 0.0 <= eased <= 1.0


class TestBezier2D:
    """Checks on the bezier_2d helper with four control points."""

    def test_at_t_zero_returns_p0(self):
        """t=0 evaluates to the first control point."""
        diagonal = ((0, 0), (1, 1), (2, 2), (3, 3))
        point = bezier_2d(0.0, *diagonal)
        assert point == pytest.approx((0, 0))

    def test_at_t_one_returns_p3(self):
        """t=1 evaluates to the last control point."""
        diagonal = ((0, 0), (1, 1), (2, 2), (3, 3))
        point = bezier_2d(1.0, *diagonal)
        assert point == pytest.approx((3, 3))

    def test_straight_line_midpoint(self):
        """Evenly spaced collinear points give the segment midpoint at t=0.5."""
        x_mid, y_mid = bezier_2d(0.5, (0, 0), (1, 0), (2, 0), (3, 0))[:2]
        assert x_mid == pytest.approx(1.5, abs=0.01)
        assert y_mid == pytest.approx(0.0, abs=0.01)

    def test_curved_path(self):
        """Control points pulled upwards lift the midpoint off the baseline."""
        point = bezier_2d(0.5, (0, 0), (0, 10), (10, 10), (10, 0))
        assert 0 < point[0] < 10
        assert point[1] > 0


class TestFittsDuration:
    """Checks on fitts_duration(distance, width, a, b)."""

    def test_zero_distance(self):
        """Zero distance yields exactly the intercept ``a``."""
        assert fitts_duration(0, 20, 0.07, 0.15) == 0.07

    def test_negative_distance(self):
        """Negative distance also yields exactly the intercept ``a``."""
        assert fitts_duration(-10, 20, 0.07, 0.15) == 0.07

    def test_increases_with_distance(self):
        """A farther target takes longer than a nearer one of equal width."""
        near = fitts_duration(100, 20, 0.07, 0.15)
        far = fitts_duration(500, 20, 0.07, 0.15)
        assert far > near

    def test_decreases_with_target_width(self):
        """A narrower target takes longer than a wider one at equal distance."""
        narrow = fitts_duration(200, 10, 0.07, 0.15)
        wide = fitts_duration(200, 50, 0.07, 0.15)
        assert narrow > wide

    def test_known_value(self):
        """D=400, W=20 matches a + b * log2(D / W + 1), i.e. log2(21) ≈ 4.39."""
        intercept, slope = 0.07, 0.15
        reference = intercept + slope * math.log2(21)
        assert fitts_duration(400, 20, intercept, slope) == pytest.approx(reference)


class TestRandomControlPoints:
    """Checks on random_control_points, driven by MouseTimingConfig curvature fields."""

    def _call(self, start, end, config=None):
        """Invoke random_control_points with curvature settings taken from ``config``.

        A default MouseTimingConfig is used when ``config`` is omitted.
        """
        if not config:
            config = MouseTimingConfig()
        curvature_args = (
            config.curvature_min,
            config.curvature_max,
            config.curvature_asymmetry,
            config.short_distance_threshold,
        )
        return random_control_points(start, end, *curvature_args)

    def test_returns_two_points(self):
        """The result unpacks into two 2-element points."""
        first, second = self._call((0, 0), (100, 0))
        assert len(first) == 2
        assert len(second) == 2

    def test_short_distance_returns_start_end(self):
        """For a 0.5px move the endpoints themselves come back as control points."""
        origin, nearby = (0, 0), (0.5, 0)
        assert self._call(origin, nearby) == ((0, 0), (0.5, 0))

    def test_control_points_not_on_line(self):
        """Across 20 draws at least one control point leaves the straight line."""
        draws = [self._call((0, 0), (500, 0)) for _ in range(20)]
        off_line = [abs(first[1]) > 0 or abs(second[1]) > 0 for first, second in draws]
        assert any(off_line)

    def test_short_distance_reduced_curvature(self):
        """Averaged over 50 draws, a 20px move bends less than a 500px move."""
        # Each tuple is built left to right, so short and long draws stay interleaved.
        paired = [
            (self._call((0, 0), (20, 0)), self._call((0, 0), (500, 0)))
            for _ in range(50)
        ]
        short_offsets = []
        long_offsets = []
        for (near_cp1, _), (far_cp1, _) in paired:
            short_offsets.append(abs(near_cp1[1]))
            long_offsets.append(abs(far_cp1[1]))
        mean_short = sum(short_offsets) / len(short_offsets)
        mean_long = sum(long_offsets) / len(long_offsets)
        assert mean_short < mean_long


# ── Tremor Computation ────────────────────────────────────────────────


class TestComputeTremorSigma:
    """Checks on the Mouse._compute_tremor_sigma static method."""

    def test_zero_dt_returns_full_amplitude(self):
        """When both samples share a timestamp the configured amplitude is returned."""
        previous = (5, 10, 1.0)
        timing = MouseTimingConfig(tremor_amplitude=2.0)
        assert Mouse._compute_tremor_sigma(10, 20, 1.0, previous, timing) == 2.0

    def test_high_velocity_reduces_tremor(self):
        """100px in 0.01s (velocity 10000) drops sigma to the 0.2 floor."""
        previous = (0, 0, 1.0)
        timing = MouseTimingConfig(tremor_amplitude=1.0)
        sigma = Mouse._compute_tremor_sigma(100, 0, 1.01, previous, timing)
        assert sigma == pytest.approx(0.2)  # min speed_factor

    def test_low_velocity_high_tremor(self):
        """1px in 0.1s (velocity 10) keeps sigma above 0.9."""
        previous = (0, 0, 1.0)
        timing = MouseTimingConfig(tremor_amplitude=1.0)
        sigma = Mouse._compute_tremor_sigma(1, 0, 1.1, previous, timing)
        assert sigma > 0.9


# ── Humanized Move ────────────────────────────────────────────────────


class TestMouseHumanizedMove:
    """Exercise Mouse._move_humanized with shortened timings."""

    # Short durations keep the tests fast; overshoot and micro-pauses are switched off.
    _QUICK = {
        'min_duration': 0.02,
        'max_duration': 0.05,
        'frame_interval': 0.005,
        'overshoot_probability': 0.0,
        'micro_pause_probability': 0.0,
    }

    @pytest.mark.asyncio
    async def test_short_distance_single_dispatch(self, mouse, mock_tab):
        """A sub-pixel move results in a single executed command."""
        mouse._position = (100, 100)
        await mouse._move_humanized(100.5, 100.5)
        assert mock_tab._execute_command.call_count == 1

    @pytest.mark.asyncio
    async def test_dispatches_multiple_events(self, mouse, mock_tab):
        """A long move is split into more than two commands."""
        mouse._timing = MouseTimingConfig(**self._QUICK)
        mouse._position = (0, 0)
        await mouse._move_humanized(500, 500)
        dispatched = mock_tab._execute_command.call_count
        assert dispatched > 2

    @pytest.mark.asyncio
    async def test_final_position_is_target(self, mouse, mock_tab):
        """The tracked position equals the target once the move completes."""
        mouse._timing = MouseTimingConfig(**self._QUICK)
        await mouse._move_humanized(300, 400)
        assert mouse._position == (300, 400)

    @pytest.mark.asyncio
    async def test_all_events_are_mouse_moved(self, mouse, mock_tab):
        """Every command executed during the move is of type MOUSE_MOVED."""
        mouse._timing = MouseTimingConfig(**self._QUICK)
        await mouse._move_humanized(200, 200)
        for entry in mock_tab._execute_command.call_args_list:
            sent = entry.args[0]
            assert sent['params']['type'] == MouseEventType.MOUSE_MOVED

    @pytest.mark.asyncio
    async def test_longer_distance_more_events(self, mouse, mock_tab):
        """Moving to (800, 800) executes more commands than moving to (50, 50)."""
        mouse._timing = MouseTimingConfig(**{**self._QUICK, 'max_duration': 0.5})
        executor = mock_tab._execute_command

        await mouse._move_humanized(50, 50)
        short_count = executor.call_count

        # Start the second run from a clean counter and from the origin.
        executor.reset_mock()
        mouse._position = (0, 0)
        await mouse._move_humanized(800, 800)
        long_count = executor.call_count

        assert long_count > short_count

    @pytest.mark.asyncio
    async def test_overshoot_moves_past_target(self, mouse, mock_tab):
        """With overshoot forced on, some dispatched x coordinate exceeds the target x."""
        mouse._timing = MouseTimingConfig(
            min_duration=0.05,
            max_duration=0.10,
            frame_interval=0.005,
            overshoot_probability=1.0,
            overshoot_speed_threshold=0,
            overshoot_distance_min=0.10,
            overshoot_distance_max=0.15,
            micro_pause_probability=0.0,
        )
        await mouse._move_humanized(500, 0)

        dispatched_x = [
            entry.args[0]['params']['x']
            for entry in mock_tab._execute_command.call_args_list
        ]
        assert max(dispatched_x) > 500


# ── Humanized Click ───────────────────────────────────────────────────


class TestMouseHumanizedClick:
    """Exercise Mouse._click_humanized with shortened timings."""

    @staticmethod
    def _quick_timing(**extra):
        """Build a fast config: no overshoot or micro-pauses, 1ms click pauses.

        ``extra`` adds further MouseTimingConfig keyword arguments.
        """
        return MouseTimingConfig(
            min_duration=0.01,
            max_duration=0.02,
            frame_interval=0.005,
            overshoot_probability=0.0,
            micro_pause_probability=0.0,
            pre_click_pause_min=0.001,
            pre_click_pause_max=0.001,
            click_hold_min=0.001,
            click_hold_max=0.001,
            **extra,
        )

    @pytest.mark.asyncio
    async def test_includes_move_press_release(self, mouse, mock_tab):
        """A humanized click emits a press, a release and at least one move."""
        mouse._timing = self._quick_timing()
        await mouse._click_humanized(300, 400, MouseButton.LEFT, 1)

        kinds = [
            entry.args[0]['params']['type']
            for entry in mock_tab._execute_command.call_args_list
        ]
        # Only the presence of each event type is checked here, not the order.
        assert MouseEventType.MOUSE_PRESSED in kinds
        assert MouseEventType.MOUSE_RELEASED in kinds
        assert kinds.count(MouseEventType.MOUSE_MOVED) >= 1

    @pytest.mark.asyncio
    async def test_double_click_has_two_press_release_pairs(self, mouse, mock_tab):
        """click_count=2 yields exactly two presses and two releases."""
        mouse._timing = self._quick_timing(
            double_click_interval_min=0.001,
            double_click_interval_max=0.001,
        )
        await mouse._click_humanized(300, 400, MouseButton.LEFT, 2)

        kinds = [
            entry.args[0]['params']['type']
            for entry in mock_tab._execute_command.call_args_list
        ]
        assert kinds.count(MouseEventType.MOUSE_PRESSED) == 2
        assert kinds.count(MouseEventType.MOUSE_RELEASED) == 2

    @pytest.mark.asyncio
    async def test_click_count_in_commands(self, mouse, mock_tab):
        """The first press reports clickCount 1 and the second reports 2."""
        mouse._timing = self._quick_timing(
            double_click_interval_min=0.001,
            double_click_interval_max=0.001,
        )
        await mouse._click_humanized(300, 400, MouseButton.LEFT, 2)

        presses = []
        for entry in mock_tab._execute_command.call_args_list:
            sent = entry.args[0]
            if sent['params']['type'] == MouseEventType.MOUSE_PRESSED:
                presses.append(sent)
        assert presses[0]['params']['clickCount'] == 1
        assert presses[1]['params']['clickCount'] == 2

    @pytest.mark.asyncio
    async def test_click_lands_at_exact_position(self, mouse, mock_tab):
        """The press is dispatched at exactly the requested coordinates."""
        mouse._timing = self._quick_timing()
        await mouse._click_humanized(300, 400, MouseButton.LEFT, 1)

        presses = []
        for entry in mock_tab._execute_command.call_args_list:
            sent = entry.args[0]
            if sent['params']['type'] == MouseEventType.MOUSE_PRESSED:
                presses.append(sent)
        first_press = presses[0]['params']
        assert first_press['x'] == 300
        assert first_press['y'] == 400


# ── Humanized Drag ────────────────────────────────────────────────────


class TestMouseHumanizedDrag:
    """Exercise Mouse._drag_humanized with shortened timings."""

    @staticmethod
    def _quick_timing():
        """Build a fast config: no overshoot or micro-pauses, 1ms drag pauses."""
        return MouseTimingConfig(
            min_duration=0.01,
            max_duration=0.02,
            frame_interval=0.005,
            overshoot_probability=0.0,
            micro_pause_probability=0.0,
            drag_start_pause_min=0.001,
            drag_start_pause_max=0.001,
            drag_end_pause_min=0.001,
            drag_end_pause_max=0.001,
        )

    @staticmethod
    def _event_types(tab):
        """Return the ``type`` of every command the tab stub executed, in order."""
        return [
            entry.args[0]['params']['type']
            for entry in tab._execute_command.call_args_list
        ]

    @pytest.mark.asyncio
    async def test_drag_includes_press_and_release(self, mouse, mock_tab):
        """A humanized drag emits a press, a release and at least two moves."""
        mouse._timing = self._quick_timing()
        await mouse._drag_humanized(100, 200, 500, 600)

        kinds = self._event_types(mock_tab)
        assert MouseEventType.MOUSE_PRESSED in kinds
        assert MouseEventType.MOUSE_RELEASED in kinds
        assert kinds.count(MouseEventType.MOUSE_MOVED) >= 2

    @pytest.mark.asyncio
    async def test_drag_ends_at_target(self, mouse, mock_tab):
        """The tracked position equals the drag end point afterwards."""
        mouse._timing = self._quick_timing()
        await mouse._drag_humanized(100, 200, 500, 600)
        assert mouse._position == (500, 600)

    @pytest.mark.asyncio
    async def test_drag_press_before_release(self, mouse, mock_tab):
        """The first press comes before the last release."""
        mouse._timing = self._quick_timing()
        await mouse._drag_humanized(100, 200, 500, 600)

        kinds = self._event_types(mock_tab)
        first_press = kinds.index(MouseEventType.MOUSE_PRESSED)
        # Searching the reversed list locates the final release.
        offset_from_end = kinds[::-1].index(MouseEventType.MOUSE_RELEASED)
        last_release = len(kinds) - 1 - offset_from_end
        assert first_press < last_release


# ── Dispatch Helpers ──────────────────────────────────────────────────


class TestDispatchMove:
    """Checks on the Mouse._dispatch_move helper."""

    @pytest.mark.asyncio
    async def test_dispatches_correct_command(self, mouse, mock_tab):
        """The command is a MOUSE_MOVED dispatch with coordinates rounded to integers."""
        await mouse._dispatch_move(150.7, 250.3)

        sent = mock_tab._execute_command.call_args.args[0]
        params = sent['params']
        assert sent['method'] == 'Input.dispatchMouseEvent'
        assert params['type'] == MouseEventType.MOUSE_MOVED
        assert params['x'] == 151
        assert params['y'] == 250

    @pytest.mark.asyncio
    async def test_updates_position_with_float(self, mouse):
        """The tracked position keeps the unrounded float coordinates."""
        target = (150.7, 250.3)
        await mouse._dispatch_move(*target)
        assert mouse._position == target


class TestDispatchButton:
    """Checks on the Mouse._dispatch_button helper."""

    @pytest.mark.asyncio
    async def test_dispatches_pressed(self, mouse, mock_tab):
        """A press carries the type, button, click count and tracked position."""
        mouse._position = (100.0, 200.0)
        await mouse._dispatch_button(MouseEventType.MOUSE_PRESSED, MouseButton.LEFT, 1)

        params = mock_tab._execute_command.call_args.args[0]['params']
        assert params['type'] == MouseEventType.MOUSE_PRESSED
        assert params['button'] == MouseButton.LEFT
        assert params['clickCount'] == 1
        assert params['x'] == 100
        assert params['y'] == 200

    @pytest.mark.asyncio
    async def test_dispatches_released(self, mouse, mock_tab):
        """A release sent without an explicit click count has type MOUSE_RELEASED."""
        mouse._position = (100.0, 200.0)
        await mouse._dispatch_button(MouseEventType.MOUSE_RELEASED, MouseButton.LEFT)

        sent = mock_tab._execute_command.call_args.args[0]
        assert sent['params']['type'] == MouseEventType.MOUSE_RELEASED


# ── Backward Compatibility ────────────────────────────────────────────


class TestMouseAPIAlias:
    """The MouseAPI name is kept as an alias for backward compatibility."""

    def test_mouse_api_is_mouse(self):
        """``MouseAPI`` and ``Mouse`` refer to the same class object."""
        alias, target = MouseAPI, Mouse
        assert alias is target


# ── Tab Integration ───────────────────────────────────────────────────


class TestTabMouseProperty:
    """Test tab.mouse lazy property."""

    def test_tab_mouse_property_exists(self):
        """The Tab class exposes a ``mouse`` attribute."""
        from pydoll.browser.tab import Tab
        assert hasattr(Tab, 'mouse')

    def test_tab_mouse_returns_mouse_api(self):
        """Running the real ``Tab.mouse`` getter on a stub tab yields a MouseAPI.

        The previous version built ``MouseAPI(tab)`` by hand and asserted its
        own type, so the property getter was never executed.
        """
        from pydoll.browser.tab import Tab
        from pydoll.interactions import MouseAPI

        tab = MagicMock()
        tab._execute_command = AsyncMock()
        # Unset backing slot; a bare MagicMock would auto-create a truthy
        # attribute here instead.
        # NOTE(review): assumes Tab.mouse caches into ``_mouse`` - confirm.
        tab._mouse = None

        # ``Tab.mouse`` looked up on the class is the descriptor itself;
        # binding it with __get__ runs the getter against the stub without
        # constructing a real Tab.
        mouse_obj = Tab.mouse.__get__(tab, Tab)

        assert isinstance(mouse_obj, MouseAPI)
        assert mouse_obj._tab is tab
        # The property is lazy: a second access must return the same object.
        assert Tab.mouse.__get__(tab, Tab) is mouse_obj


================================================
FILE: tests/test_interactions/test_scroll.py
================================================
import pytest
import pytest_asyncio
from unittest.mock import AsyncMock, MagicMock, patch, call

from pydoll.interactions.scroll import ScrollAPI
from pydoll.constants import ScrollPosition, Scripts
from pydoll.commands import RuntimeCommands


@pytest_asyncio.fixture
async def mock_tab():
    """Provide a MagicMock tab whose ``_execute_command`` is an AsyncMock."""
    stub = MagicMock()
    stub._execute_command = AsyncMock()
    return stub


@pytest_asyncio.fixture
async def scroll_api(mock_tab):
    """Provide a ScrollAPI bound to the ``mock_tab`` fixture."""
    api = ScrollAPI(mock_tab)
    return api


class TestScrollAPIInitialization:
    """Construction of ScrollAPI."""

    def test_initialization(self, mock_tab):
        """The tab passed to the constructor is stored on ``_tab``."""
        created = ScrollAPI(mock_tab)
        assert created._tab == mock_tab


class TestScrollAPIBy:
    """Behaviour of scroll.by() with humanization disabled."""

    @staticmethod
    def _last_command(tab):
        """Return the first positional argument of the most recent executed command."""
        return tab._execute_command.call_args.args[0]

    @pytest.mark.asyncio
    async def test_scroll_down_smooth(self, scroll_api, mock_tab):
        """Smooth DOWN scroll evaluates an awaited script with a positive top offset."""
        await scroll_api.by(ScrollPosition.DOWN, 500, smooth=True, humanize=False)

        # The tab stub must have been asked to execute something.
        assert mock_tab._execute_command.called

        # The command is a Runtime.evaluate call that awaits the returned promise.
        sent = self._last_command(mock_tab)
        assert sent['method'] == 'Runtime.evaluate'
        assert sent['params']['awaitPromise'] is True

        # The generated script embeds the offset and the scroll behaviour.
        expression = sent['params']['expression']
        assert 'top: 500' in expression
        assert "behavior: 'smooth'" in expression

    @pytest.mark.asyncio
    async def test_scroll_up_smooth(self, scroll_api, mock_tab):
        """Smooth UP scroll uses a negative top offset."""
        await scroll_api.by(ScrollPosition.UP, 300, smooth=True, humanize=False)

        expression = self._last_command(mock_tab)['params']['expression']
        assert 'top: -300' in expression
        assert "behavior: 'smooth'" in expression

    @pytest.mark.asyncio
    async def test_scroll_right_smooth(self, scroll_api, mock_tab):
        """Smooth RIGHT scroll uses a positive left offset."""
        await scroll_api.by(ScrollPosition.RIGHT, 200, smooth=True, humanize=False)

        expression = self._last_command(mock_tab)['params']['expression']
        assert 'left: 200' in expression
        assert "behavior: 'smooth'" in expression

    @pytest.mark.asyncio
    async def test_scroll_left_smooth(self, scroll_api, mock_tab):
        """Smooth LEFT scroll uses a negative left offset."""
        await scroll_api.by(ScrollPosition.LEFT, 150, smooth=True, humanize=False)

        expression = self._last_command(mock_tab)['params']['expression']
        assert 'left: -150' in expression
        assert "behavior: 'smooth'" in expression

    @pytest.mark.asyncio
    async def test_scroll_down_instant(self, scroll_api, mock_tab):
        """``smooth=False`` switches the script to the 'auto' behaviour."""
        await scroll_api.by(ScrollPosition.DOWN, 1000, smooth=False, humanize=False)

        expression = self._last_command(mock_tab)['params']['expression']
        assert 'top: 1000' in expression
        assert "behavior: 'auto'" in expression

    @pytest.mark.asyncio
    async def test_scroll_with_float_distance(self, scroll_api, mock_tab):
        """A fractional distance appears in the script unchanged."""
        await scroll_api.by(ScrollPosition.DOWN, 250.5, smooth=True, humanize=False)

        expression = self._last_command(mock_tab)['params']['expression']
        assert 'top: 250.5' in expression


class TestScrollAPIToTop:
    """Behaviour of scroll.to_top() with humanization disabled."""

    @pytest.mark.asyncio
    async def test_scroll_to_top_smooth(self, scroll_api, mock_tab):
        """Smooth scroll-to-top evaluates an awaited script targeting top 0."""
        await scroll_api.to_top(smooth=True, humanize=False)

        executor = mock_tab._execute_command
        assert executor.called
        sent = executor.call_args.args[0]

        assert sent['method'] == 'Runtime.evaluate'
        assert sent['params']['awaitPromise'] is True

        expression = sent['params']['expression']
        assert 'top: 0' in expression
        assert "behavior: 'smooth'" in expression

    @pytest.mark.asyncio
    async def test_scroll_to_top_instant(self, scroll_api, mock_tab):
        """``smooth=False`` switches the script to the 'auto' behaviour."""
        await scroll_api.to_top(smooth=False, humanize=False)

        sent = mock_tab._execute_command.call_args.args[0]
        expression = sent['params']['expression']

        assert 'top: 0' in expression
        assert "behavior: 'auto'" in expression


class TestScrollAPIToBottom:
    """Checks for the command emitted by ``scroll.to_bottom()`` with humanization off."""

    @pytest.mark.asyncio
    async def test_scroll_to_bottom_smooth(self, scroll_api, mock_tab):
        """A smooth scroll to bottom is sent as an awaited ``Runtime.evaluate`` command."""
        await scroll_api.to_bottom(humanize=False, smooth=True)

        execute = mock_tab._execute_command
        assert execute.called

        # The command dict is the first positional argument of the last call.
        sent_command = execute.call_args[0][0]
        assert sent_command['method'] == 'Runtime.evaluate'
        assert sent_command['params']['awaitPromise'] is True

        expression = sent_command['params']['expression']
        assert 'top: document.body.scrollHeight' in expression
        assert "behavior: 'smooth'" in expression

    @pytest.mark.asyncio
    async def test_scroll_to_bottom_instant(self, scroll_api, mock_tab):
        """With ``smooth=False`` the script targets scrollHeight using 'auto' behavior."""
        await scroll_api.to_bottom(humanize=False, smooth=False)

        sent_command = mock_tab._execute_command.call_args[0][0]
        expression = sent_command['params']['expression']

        for fragment in ('top: document.body.scrollHeight', "behavior: 'auto'"):
            assert fragment in expression


class TestScrollAPIHelperMethods:
    """Checks for the private helpers ``_get_axis_and_distance`` and ``_get_behavior``."""

    def test_get_axis_and_distance_down(self, scroll_api):
        """DOWN maps to the 'top' axis with the distance unchanged."""
        resolved = scroll_api._get_axis_and_distance(ScrollPosition.DOWN, 100)
        assert tuple(resolved) == ('top', 100)

    def test_get_axis_and_distance_up(self, scroll_api):
        """UP maps to the 'top' axis with the distance negated."""
        resolved = scroll_api._get_axis_and_distance(ScrollPosition.UP, 100)
        assert tuple(resolved) == ('top', -100)

    def test_get_axis_and_distance_right(self, scroll_api):
        """RIGHT maps to the 'left' axis with the distance unchanged."""
        resolved = scroll_api._get_axis_and_distance(ScrollPosition.RIGHT, 50)
        assert tuple(resolved) == ('left', 50)

    def test_get_axis_and_distance_left(self, scroll_api):
        """LEFT maps to the 'left' axis with the distance negated."""
        resolved = scroll_api._get_axis_and_distance(ScrollPosition.LEFT, 50)
        assert tuple(resolved) == ('left', -50)

    def test_get_behavior_smooth(self, scroll_api):
        """``smooth=True`` translates to the 'smooth' behavior keyword."""
        assert scroll_api._get_behavior(True) == 'smooth'

    def test_get_behavior_instant(self, scroll_api):
        """``smooth=False`` translates to the 'auto' behavior keyword."""
        assert scroll_api._get_behavior(False) == 'auto'


class TestScrollAPIIntegrationWithTab:
    """Checks how the ``scroll`` property is exposed on ``Tab``."""

    @pytest.mark.asyncio
    async def test_tab_has_scroll_property(self):
        """``Tab.scroll`` yields a ScrollAPI bound to the tab it was read from."""
        with patch('pydoll.connection.ConnectionHandler', autospec=True):
            from pydoll.browser.tab import Tab

            tab = Tab(MagicMock(), target_id='test-id')
            scroll_api = tab.scroll

            assert isinstance(scroll_api, ScrollAPI)
            assert scroll_api._tab == tab

    @pytest.mark.asyncio
    async def test_tab_scroll_property_is_lazy(self):
        """The scroll helper is built on first access and reused afterwards."""
        with patch('pydoll.connection.ConnectionHandler', autospec=True):
            from pydoll.browser.tab import Tab

            tab = Tab(MagicMock(), target_id='test-id')

            # Nothing is stored until the property is first read.
            assert tab._scroll is None

            first_access = tab.scroll
            assert tab._scroll is not None

            # Reading the property again must hand back the very same object.
            second_access = tab.scroll
            assert first_access is second_access

    @pytest.mark.asyncio
    async def test_scroll_execute_command_integration(self):
        """Scrolling through ``tab.scroll`` goes out via ``tab._execute_command``."""
        with patch('pydoll.connection.ConnectionHandler', autospec=True):
            from pydoll.browser.tab import Tab

            tab = Tab(MagicMock(), target_id='test-id')
            # Replace the transport so the emitted command can be inspected.
            tab._execute_command = AsyncMock()

            await tab.scroll.by(ScrollPosition.DOWN, 500, humanize=False, smooth=True)

            execute = tab._execute_command
            assert execute.called

            # The command dict is the first positional argument of the last call.
            sent_command = execute.call_args[0][0]
            assert sent_command['method'] == 'Runtime.evaluate'
            assert sent_command['params']['awaitPromise'] is True


class TestScrollAPIScriptGeneration:
    """Test that correct JavaScript scripts are generated."""

    @pytest.mark.asyncio
    async def test_scroll_by_script_structure(self, scroll_api, mock_tab):
        """Test that scroll.by generates a Promise-based scroll script."""
        await scroll_api.by(ScrollPosition.DOWN, 500, smooth=True, humanize=False)

        command = mock_tab._execute_command.call_args[0][0]
        script = command['params']['expression']

        # 'Promise' alone is the effective check: any script containing
        # 'new Promise' also contains 'Promise', so the extra clause was redundant.
        assert 'Promise' in script
        # Either the completion event or the scroll call itself must be present.
        assert 'scrollend' in script or 'scrollBy' in script
        assert 'resolve' in script

    @pytest.mark.asyncio
    async def test_to_top_script_structure(self, scroll_api, mock_tab):
        """Test that scroll.to_top generates a Promise-based scrollTo(top: 0) script."""
        await scroll_api.to_top(smooth=True, humanize=False)

        command = mock_tab._execute_command.call_args[0][0]
        script = command['params']['expression']

        # See test_scroll_by_script_structure: 'Promise' subsumes 'new Promise'.
        assert 'Promise' in script
        assert 'scrollTo' in script
        assert 'top: 0' in script

    @pytest.mark.asyncio
    async def test_to_bottom_script_structure(self, scroll_api, mock_tab):
        """Test that scroll.to_bottom generates a Promise-based scrollTo(scrollHeight) script."""
        await scroll_api.to_bottom(smooth=True, humanize=False)

        command = mock_tab._execute_command.call_args[0][0]
        script = command['params']['expression']

        # See test_scroll_by_script_structure: 'Promise' subsumes 'new Promise'.
        assert 'Promise' in script
        assert 'scrollTo' in script
        assert 'scrollHeight' in script


class TestScrollAPIAwaitPromise:
    """Checks that every non-humanized scroll command sets ``awaitPromise`` to True."""

    @pytest.mark.asyncio
    async def test_scroll_by_uses_await_promise(self, scroll_api, mock_tab):
        """``scroll.by`` must send its command with ``awaitPromise`` enabled."""
        await scroll_api.by(ScrollPosition.DOWN, 100, humanize=False, smooth=True)

        # The command dict is the first positional argument of the last call.
        sent_params = mock_tab._execute_command.call_args[0][0]['params']
        assert sent_params['awaitPromise'] is True

    @pytest.mark.asyncio
    async def test_to_top_uses_await_promise(self, scroll_api, mock_tab):
        """``scroll.to_top`` must send its command with ``awaitPromise`` enabled."""
        await scroll_api.to_top(humanize=False, smooth=True)

        sent_params = mock_tab._execute_command.call_args[0][0]['params']
        assert sent_params['awaitPromise'] is True

    @pytest.mark.asyncio
    async def test_to_bottom_uses_await_promise(self, scroll_api, mock_tab):
        """``scroll.to_bottom`` must send its command with ``awaitPromise`` enabled."""
        await scroll_api.to_bottom(humanize=False, smooth=True)

        sent_params = mock_tab._execute_command.call_args[0][0]['params']
        assert sent_params['awaitPromise'] is True


class TestScrollTimingConfig:
    """Checks for the ``ScrollTimingConfig`` configuration object."""

    def test_default_values(self):
        """A config built with no arguments exposes the expected defaults."""
        from pydoll.interactions.scroll import ScrollTimingConfig

        expected_defaults = {
            'min_duration': 0.5,
            'max_duration': 1.5,
            'bezier_points': (0.645, 0.045, 0.355, 1.0),
            'frame_interval': 0.012,
            'delta_jitter': 3,
            'micro_pause_probability': 0.05,
            'micro_pause_min': 0.02,
            'micro_pause_max': 0.05,
            'overshoot_probability': 0.15,
            'overshoot_factor_min': 1.02,
            'overshoot_factor_max': 1.08,
        }

        defaults = ScrollTimingConfig()

        for field_name, expected in expected_defaults.items():
            assert getattr(defaults, field_name) == expected

    def test_custom_values(self):
        """Values passed to the constructor are stored on the instance as given."""
        from pydoll.interactions.scroll import ScrollTimingConfig

        overrides = {
            'min_duration': 0.3,
            'max_duration': 2.0,
            'bezier_points': (0.5, 0.0, 0.5, 1.0),
            'frame_interval': 0.016,
            'delta_jitter': 5,
            'micro_pause_probability': 0.1,
            'overshoot_probability': 0.2,
        }

        customized = ScrollTimingConfig(**overrides)

        for field_name, expected in overrides.items():
            assert getattr(customized, field_name) == expected

    def test_frozen_dataclass(self):
        """Assigning to a field after construction raises ``AttributeError``."""
        from pydoll.interactions.scroll import ScrollTimingConfig

        immutable = ScrollTimingConfig()

        with pytest.raises(AttributeError):
            setattr(immutable, 'min_duration', 1.0)


class TestCubicBezier:
    """Checks for the ``CubicBezier`` easing-curve solver."""

    def test_initialization(self):
        """Constructing a curve exposes all six polynomial coefficient attributes."""
        from pydoll.interactions.scroll import CubicBezier

        curve = CubicBezier(0.25, 0.1, 0.25, 1.0)

        for axis in ('x', 'y'):
            for term in ('a', 'b', 'c'):
                assert hasattr(curve, f'coefficient_{term}_{axis}')

    def test_sample_curve_x_at_zero(self):
        """The x polynomial evaluates to exactly 0 at t=0."""
        from pydoll.interactions.scroll import CubicBezier

        curve = CubicBezier(0.25, 0.1, 0.25, 1.0)
        sampled = curve.sample_curve_x(0.0)

        assert sampled == 0.0

    def test_sample_curve_x_at_one(self):
        """The x polynomial evaluates to 1 (within 1e-10) at t=1."""
        from pydoll.interactions.scroll import CubicBezier

        curve = CubicBezier(0.25, 0.1, 0.25, 1.0)
        error = abs(curve.sample_curve_x(1.0) - 1.0)

        assert error < 1e-10

    def test_sample_curve_y_at_zero(self):
        """The y polynomial evaluates to exactly 0 at t=0."""
        from pydoll.interactions.scroll import CubicBezier

        curve = CubicBezier(0.25, 0.1, 0.25, 1.0)
        sampled = curve.sample_curve_y(0.0)

        assert sampled == 0.0

    def test_sample_curve_y_at_one(self):
        """The y polynomial evaluates to 1 (within 1e-10) at t=1."""
        from pydoll.interactions.scroll import CubicBezier

        curve = CubicBezier(0.25, 0.1, 0.25, 1.0)
        error = abs(curve.sample_curve_y(1.0) - 1.0)

        assert error < 1e-10

    def test_sample_curve_derivative_x(self):
        """At t=0 the x derivative equals the linear coefficient ``coefficient_c_x``."""
        from pydoll.interactions.scroll import CubicBezier

        curve = CubicBezier(0.25, 0.1, 0.25, 1.0)
        slope_at_start = curve.sample_curve_derivative_x(0.0)

        assert slope_at_start == curve.coefficient_c_x

    def test_solve_curve_x_finds_t_for_x(self):
        """``solve_curve_x`` maps the endpoints x=0 and x=1 to t=0 and t=1."""
        from pydoll.interactions.scroll import CubicBezier

        curve = CubicBezier(0.25, 0.1, 0.25, 1.0)

        t_at_start = curve.solve_curve_x(0.0)
        assert abs(t_at_start) < 1e-6

        t_at_end = curve.solve_curve_x(1.0)
        assert abs(t_at_end - 1.0) < 1e-6

    def test_solve_returns_y_for_given_x(self):
        """``solve`` maps the endpoints x=0 and x=1 to y=0 and y=1."""
        from pydoll.interactions.scroll import CubicBezier

        curve = CubicBezier(0.25, 0.1, 0.25, 1.0)

        y_at_start = curve.solve(0.0)
        assert abs(y_at_start) < 1e-6

        y_at_end = curve.solve(1.0)
        assert abs(y_at_end - 1.0) < 1e-6

    def test_solve_returns_values_between_0_and_1(self):
        """For interior x samples, ``solve`` stays inside the closed interval [0, 1]."""
        from pydoll.interactions.scroll import CubicBezier

        curve = CubicBezier(0.645, 0.045, 0.355, 1.0)

        for x in (0.1, 0.25, 0.5, 0.75, 0.9):
            y = curve.solve(x)
            assert 0.0 <= y <= 1.0, f"y={y} out of range for x={x}"

    def test_solve_curve_x_with_out_of_range_values(self):
        """Inputs outside [0, 1] still produce a float instead of raising."""
        from pydoll.interactions.scroll import CubicBezier

        curve = CubicBezier(0.25, 0.1, 0.25, 1.0)

        # Only the return type is checked here; the numeric value is unspecified.
        below_range = curve.solve_curve_x(-0.5)
        assert isinstance(below_range, float)

        above_range = curve.solve_curve_x(1.5)
        assert isinstance(above_range, float)

    def test_ease_in_out_bezier(self):
        """The CSS ease-in-out control points give y in [0.4, 0.6] at x=0.5."""
        from pydoll.interactions.scroll import CubicBezier

        # Control points of the standard CSS ease-in-out timing function.
        curve = CubicBezier(0.42, 0.0, 0.58, 1.0)

        midpoint_progress = curve.solve(0.5)

        assert 0.4 <= midpoint_progress <= 0.6

    def test_linear_bezier(self):
        """Control points on the diagonal give y within 0.1 of x at each sample."""
        from pydoll.interactions.scroll import CubicBezier

        # Both control points lie on the y = x diagonal.
        curve = CubicBezier(0.0, 0.0, 1.0, 1.0)

        for x in (0.1, 0.3, 0.5, 0.7, 0.9):
            y = curve.solve(x)
            assert abs(y - x) < 0.1, f"Expected y≈{x}, got {y}"


class TestScrollHumanizedMethods:
    """Test humanized scroll entry points and their private helpers.

    Tests that never await anything are plain synchronous functions; only
    tests that actually drive coroutines carry the asyncio marker.
    """

    @pytest.mark.asyncio
    async def test_scroll_by_with_humanize_true(self, mock_tab):
        """Test scroll.by with humanize=True calls _scroll_humanized."""
        from pydoll.interactions.scroll import Scroll

        scroll = Scroll(mock_tab)

        # Stub the humanized path so only the dispatch decision is exercised.
        scroll._scroll_humanized = AsyncMock()

        await scroll.by(ScrollPosition.DOWN, 500, humanize=True)

        scroll._scroll_humanized.assert_called_once_with(ScrollPosition.DOWN, 500)

    @pytest.mark.asyncio
    async def test_scroll_to_top_with_humanize_true(self, mock_tab):
        """Test scroll.to_top with humanize=True calls _scroll_to_end_humanized."""
        from pydoll.interactions.scroll import Scroll

        scroll = Scroll(mock_tab)

        # Stub the humanized path so only the dispatch decision is exercised.
        scroll._scroll_to_end_humanized = AsyncMock()

        await scroll.to_top(humanize=True)

        scroll._scroll_to_end_humanized.assert_called_once_with(ScrollPosition.UP)

    @pytest.mark.asyncio
    async def test_scroll_to_bottom_with_humanize_true(self, mock_tab):
        """Test scroll.to_bottom with humanize=True calls _scroll_to_end_humanized."""
        from pydoll.interactions.scroll import Scroll

        scroll = Scroll(mock_tab)

        # Stub the humanized path so only the dispatch decision is exercised.
        scroll._scroll_to_end_humanized = AsyncMock()

        await scroll.to_bottom(humanize=True)

        scroll._scroll_to_end_humanized.assert_called_once_with(ScrollPosition.DOWN)

    def test_calculate_effective_distance_without_overshoot(self, mock_tab):
        """Test _calculate_effective_distance without overshoot."""
        from pydoll.interactions.scroll import Scroll, ScrollTimingConfig

        # Config with 0% overshoot probability
        config = ScrollTimingConfig(overshoot_probability=0.0)
        scroll = Scroll(mock_tab, timing=config)

        distance = scroll._calculate_effective_distance(100.0)

        assert distance == 100.0

    def test_calculate_effective_distance_with_overshoot(self, mock_tab):
        """Test _calculate_effective_distance with overshoot."""
        from pydoll.interactions.scroll import Scroll, ScrollTimingConfig

        # Config with 100% overshoot probability
        config = ScrollTimingConfig(
            overshoot_probability=1.0,
            overshoot_factor_min=1.1,
            overshoot_factor_max=1.2,
        )
        scroll = Scroll(mock_tab, timing=config)

        distance = scroll._calculate_effective_distance(100.0)

        # Should be between 110 and 120
        assert 110.0 <= distance <= 120.0

    def test_calculate_duration(self, mock_tab):
        """Test _calculate_duration returns value in expected range."""
        from pydoll.interactions.scroll import Scroll, ScrollTimingConfig

        config = ScrollTimingConfig(min_duration=0.5, max_duration=1.5)
        scroll = Scroll(mock_tab, timing=config)

        duration = scroll._calculate_duration(500.0)

        # Should be between min_duration and capped max (3.0)
        assert 0.5 <= duration <= 3.0

    def test_calculate_duration_increases_with_distance(self, mock_tab):
        """Test that longer distances result in longer durations."""
        from pydoll.interactions.scroll import Scroll, ScrollTimingConfig

        config = ScrollTimingConfig(min_duration=0.5, max_duration=1.5)
        scroll = Scroll(mock_tab, timing=config)

        # Patch random.uniform to return a constant base duration
        # This ensures we are testing only the distance scaling logic
        with patch('random.uniform', return_value=1.0):
            short_duration = scroll._calculate_duration(100.0)
            long_duration = scroll._calculate_duration(5000.0)

        # With constant base duration, the formula ensures longer distance -> longer duration
        # Formula: base_duration * (1 + 0.2 * (distance / 1000))
        assert long_duration > short_duration

    @pytest.mark.asyncio
    async def test_get_viewport_center(self, mock_tab):
        """Test _get_viewport_center returns coordinates."""
        from pydoll.interactions.scroll import Scroll

        # The mocked response carries the coordinates as a string value.
        mock_tab._execute_command.return_value = {
            'result': {'result': {'value': '[800, 600]'}}
        }

        scroll = Scroll(mock_tab)
        result = await scroll._get_viewport_center()

        assert result == (800, 600)

    @pytest.mark.asyncio
    async def test_get_viewport_center_fallback(self, mock_tab):
        """Test _get_viewport_center returns fallback on error."""
        from pydoll.interactions.scroll import Scroll

        mock_tab._execute_command.return_value = {
            'result': {'result': {'value': 'invalid'}}
        }

        scroll = Scroll(mock_tab)
        result = await scroll._get_viewport_center()

        # Should return fallback values
        assert result == (400, 300)

    @pytest.mark.asyncio
    async def test_get_viewport_center_empty_response(self, mock_tab):
        """Test _get_viewport_center handles empty response."""
        from pydoll.interactions.scroll import Scroll

        mock_tab._execute_command.return_value = {}

        scroll = Scroll(mock_tab)
        result = await scroll._get_viewport_center()

        assert result == (400, 300)

    @pytest.mark.asyncio
    async def test_get_current_scroll_y(self, mock_tab):
        """Test _get_current_scroll_y returns scroll position."""
        from pydoll.interactions.scroll import Scroll

        mock_tab._execute_command.return_value = {
            'result': {'result': {'value': 250}}
        }

        scroll = Scroll(mock_tab)
        result = await scroll._get_current_scroll_y()

        assert result == 250.0

    @pytest.mark.asyncio
    async def test_get_current_scroll_y_default(self, mock_tab):
        """Test _get_current_scroll_y returns 0 on missing value."""
        from pydoll.interactions.scroll import Scroll

        mock_tab._execute_command.return_value = {}

        scroll = Scroll(mock_tab)
        result = await scroll._get_current_scroll_y()

        assert result == 0.0

    @pytest.mark.asyncio
    async def test_get_remaining_scroll_to_bottom(self, mock_tab):
        """Test _get_remaining_scroll_to_bottom returns remaining distance."""
        from pydoll.interactions.scroll import Scroll

        mock_tab._execute_command.return_value = {
            'result': {'result': {'value': 1500}}
        }

        scroll = Scroll(mock_tab)
        result = await scroll._get_remaining_scroll_to_bottom()

        assert result == 1500.0

    @pytest.mark.asyncio
    async def test_dispatch_scroll_event(self, mock_tab):
        """Test _dispatch_scroll_event sends mouse wheel event."""
        from pydoll.interactions.scroll import Scroll
        from pydoll.protocol.input.types import MouseEventType

        mock_tab._execute_command.return_value = {
            'result': {'result': {'value': '[400, 300]'}}
        }

        scroll = Scroll(mock_tab)
        await scroll._dispatch_scroll_event(delta_x=0, delta_y=100)

        # Should have called execute_command twice:
        # 1. _get_viewport_center
        # 2. dispatch_mouse_event
        assert mock_tab._execute_command.call_count == 2

        # Check the second call (dispatch_mouse_event)
        second_call = mock_tab._execute_command.call_args_list[1]
        command = second_call[0][0]
        assert command['method'] == 'Input.dispatchMouseEvent'
        assert command['params']['type'] == MouseEventType.MOUSE_WHEEL
        assert command['params']['deltaY'] == 100


class TestScrollWithCustomTiming:
    """Test Scroll with custom timing configuration."""

    def test_scroll_with_custom_timing(self, mock_tab):
        """Test Scroll stores the timing configuration passed to its constructor."""
        from pydoll.interactions.scroll import Scroll, ScrollTimingConfig

        custom_timing = ScrollTimingConfig(
            min_duration=1.0,
            max_duration=2.0,
        )

        scroll = Scroll(mock_tab, timing=custom_timing)

        assert scroll._timing == custom_timing
        assert scroll._timing.min_duration == 1.0
        assert scroll._timing.max_duration == 2.0

    def test_scroll_uses_default_timing(self, mock_tab):
        """Test Scroll uses default timing if none provided."""
        # Only Scroll is needed here; the config class is never referenced.
        from pydoll.interactions.scroll import Scroll

        scroll = Scroll(mock_tab)

        # Should use default values
        assert scroll._timing.min_duration == 0.5
        assert scroll._timing.max_duration == 1.5


class TestCubicBezierBisectionFallback:
    """Robustness checks for the ``CubicBezier`` solver on awkward inputs.

    NOTE(review): these tests assert only on results; they do not verify which
    internal solving strategy (Newton or a bisection fallback) produced them.
    """

    def test_bisection_fallback_triggered_by_out_of_range_derivative(self):
        """With diagonal control points, ``solve_curve_x`` stays within 0.1 of x."""
        from pydoll.interactions.scroll import CubicBezier

        # Both control points sit on the y = x diagonal.
        curve = CubicBezier(0.0, 0.0, 1.0, 1.0)

        for x in (0.0, 0.25, 0.5, 0.75, 1.0):
            solved_t = curve.solve_curve_x(x)
            assert isinstance(solved_t, float)
            # The solved parameter is expected to track x loosely for this curve.
            assert abs(solved_t - x) < 0.1

    def test_bisection_converges_for_edge_cases(self):
        """Inputs very close to 0 and to 1 still yield a float result."""
        from pydoll.interactions.scroll import CubicBezier

        curve = CubicBezier(0.25, 0.1, 0.25, 1.0)

        # One sample just above 0 and one just below 1.
        for near_boundary in (0.001, 0.999):
            solved_t = curve.solve_curve_x(near_boundary)
            assert isinstance(solved_t, float)

    def test_solve_with_zero_derivative_fallback(self):
        """A curve whose first control point has x=0 still solves into [0, 1]."""
        from pydoll.interactions.scroll import CubicBezier

        # presumably this shape can give a zero x-derivative at the start — TODO confirm
        curve = CubicBezier(0.0, 0.5, 1.0, 0.5)

        for x in (0.1, 0.5, 0.9):
            progress = curve.solve(x)
            assert 0.0 <= progress <= 1.0


class TestScrollHumanized:
    """Test _scroll_humanized method.

    ``ScrollPosition``, ``patch`` and ``AsyncMock`` come from the module-level
    imports, so they are not re-imported inside each test.
    """

    @pytest.mark.asyncio
    async def test_scroll_humanized_calls_perform_scroll_loop(self, mock_tab):
        """Test _scroll_humanized delegates to _perform_scroll_loop."""
        from pydoll.interactions.scroll import Scroll, ScrollTimingConfig

        config = ScrollTimingConfig(overshoot_probability=0.0)  # No overshoot
        scroll = Scroll(mock_tab, timing=config)

        # Stub the scroll loop so no real events are dispatched.
        scroll._perform_scroll_loop = AsyncMock(return_value=100.0)

        # asyncio.sleep is replaced so any pause in the method returns immediately.
        with patch('asyncio.sleep', new_callable=AsyncMock):
            await scroll._scroll_humanized(ScrollPosition.DOWN, 100.0)

        scroll._perform_scroll_loop.assert_called_once()

    @pytest.mark.asyncio
    async def test_scroll_humanized_with_overshoot_triggers_correction(self, mock_tab):
        """Test _scroll_humanized calls correction when overshoot occurs."""
        from pydoll.interactions.scroll import Scroll, ScrollTimingConfig

        # Force overshoot
        config = ScrollTimingConfig(
            overshoot_probability=1.0,
            overshoot_factor_min=1.1,
            overshoot_factor_max=1.2,
        )
        scroll = Scroll(mock_tab, timing=config)

        # Mock scroll_loop to return more than target (simulating overshoot)
        scroll._perform_scroll_loop = AsyncMock(return_value=120.0)
        scroll._scroll_correction = AsyncMock()

        with patch('asyncio.sleep', new_callable=AsyncMock):
            await scroll._scroll_humanized(ScrollPosition.DOWN, 100.0)

        # Correction should be called because scrolled (120) > target (100)
        scroll._scroll_correction.assert_called_once()


class TestScrollToEndHumanized:
    """Test _scroll_to_end_humanized method.

    ``ScrollPosition``, ``patch`` and ``AsyncMock`` come from the module-level
    imports, so they are not re-imported inside each test.
    """

    @pytest.mark.asyncio
    async def test_scroll_to_end_down_calls_humanized_scroll(self, mock_tab):
        """Test scrolling to bottom uses _scroll_humanized in loop."""
        from pydoll.interactions.scroll import Scroll

        scroll = Scroll(mock_tab)

        # First call: lots remaining, every later call: none remaining
        calls_made = 0

        async def mock_remaining():
            nonlocal calls_made
            calls_made += 1
            return 500.0 if calls_made == 1 else 0.0

        scroll._get_remaining_scroll_to_bottom = mock_remaining
        scroll._scroll_humanized = AsyncMock()

        # asyncio.sleep is replaced so any pause in the method returns immediately.
        with patch('asyncio.sleep', new_callable=AsyncMock):
            await scroll._scroll_to_end_humanized(ScrollPosition.DOWN)

        # Should have called _scroll_humanized at least once
        assert scroll._scroll_humanized.call_count >= 1

    @pytest.mark.asyncio
    async def test_scroll_to_end_up_uses_current_scroll_y(self, mock_tab):
        """Test scrolling to top checks current scroll position."""
        from pydoll.interactions.scroll import Scroll

        scroll = Scroll(mock_tab)

        # First call: has scroll position, every later call: at top
        calls_made = 0

        async def mock_scroll_y():
            nonlocal calls_made
            calls_made += 1
            return 300.0 if calls_made == 1 else 0.0

        scroll._get_current_scroll_y = mock_scroll_y
        scroll._scroll_humanized = AsyncMock()

        with patch('asyncio.sleep', new_callable=AsyncMock):
            await scroll._scroll_to_end_humanized(ScrollPosition.UP)

        # Should have called _scroll_humanized
        assert scroll._scroll_humanized.call_count >= 1

    @pytest.mark.asyncio
    async def test_scroll_to_end_stops_when_threshold_reached(self, mock_tab):
        """Test loop stops when remaining distance is below threshold."""
        from pydoll.interactions.scroll import Scroll

        scroll = Scroll(mock_tab)

        # Return value below threshold (30)
        scroll._get_remaining_scroll_to_bottom = AsyncMock(return_value=10.0)
        scroll._scroll_humanized = AsyncMock()

        with patch('asyncio.sleep', new_callable=AsyncMock):
            await scroll._scroll_to_end_humanized(ScrollPosition.DOWN)

        # Should NOT have called _scroll_humanized (already at end)
        scroll._scroll_humanized.assert_not_called()

    @pytest.mark.asyncio
    async def test_scroll_to_end_stops_when_stuck(self, mock_tab):
        """Test loop stops when scroll progress is stuck."""
        from pydoll.interactions.scroll import Scroll

        scroll = Scroll(mock_tab)

        # Always return same remaining distance (stuck)
        scroll._get_remaining_scroll_to_bottom = AsyncMock(return_value=500.0)
        scroll._scroll_humanized = AsyncMock()

        with patch('asyncio.sleep', new_callable=AsyncMock):
            await scroll._scroll_to_end_humanized(ScrollPosition.DOWN)

        # Should have tried a few times then given up
        # We set max_stuck_attempts = 10, so it should be around 10 calls
        assert scroll._scroll_humanized.call_count >= 10
        assert scroll._scroll_humanized.call_count < 20  # Should not loop infinitely


class TestPerformScrollLoop:
    """Exercise Scroll._perform_scroll_loop with asyncio.sleep patched out."""

    @pytest.mark.asyncio
    async def test_perform_scroll_loop_dispatches_events(self, mock_tab):
        """The loop issues at least one tab command and returns a float."""
        from pydoll.interactions.scroll import Scroll, ScrollTimingConfig
        from unittest.mock import patch, AsyncMock, MagicMock

        mock_tab._execute_command.return_value = {
            'result': {'result': {'value': '[400, 300]'}}
        }

        timing = ScrollTimingConfig(
            min_duration=0.01,
            max_duration=0.02,
            frame_interval=0.001,
            micro_pause_probability=0.0,
        )
        scroller = Scroll(mock_tab, timing=timing)

        # Scripted clock: 0.0 at start, 0.005 (half of the 0.01 duration),
        # then 0.02 (past the end).
        fake_loop = MagicMock()
        fake_loop.time.side_effect = [0.0, 0.005, 0.02]

        with patch('asyncio.get_running_loop', return_value=fake_loop), patch(
            'asyncio.sleep', new_callable=AsyncMock
        ):
            total = await scroller._perform_scroll_loop(
                effective_distance=100.0,
                duration=0.01,
                is_vertical=True,
                direction=1,
            )

        # At least one command must have reached the tab.
        assert mock_tab._execute_command.call_count >= 1
        assert isinstance(total, float)

    @pytest.mark.asyncio
    async def test_perform_scroll_loop_horizontal(self, mock_tab):
        """A horizontal, negative-direction run also returns a float."""
        from pydoll.interactions.scroll import Scroll, ScrollTimingConfig
        from unittest.mock import patch, AsyncMock

        mock_tab._execute_command.return_value = {
            'result': {'result': {'value': '[400, 300]'}}
        }

        timing = ScrollTimingConfig(
            min_duration=0.01,
            max_duration=0.02,
            frame_interval=0.001,
            micro_pause_probability=0.0,
        )
        scroller = Scroll(mock_tab, timing=timing)

        with patch('asyncio.sleep', new_callable=AsyncMock):
            total = await scroller._perform_scroll_loop(
                effective_distance=50.0,
                duration=0.01,
                is_vertical=False,  # horizontal axis
                direction=-1,  # leftwards
            )

        assert isinstance(total, float)

    @pytest.mark.asyncio
    async def test_perform_scroll_loop_returns_scrolled_amount(self, mock_tab):
        """The value returned for a 100 px request is strictly positive."""
        from pydoll.interactions.scroll import Scroll, ScrollTimingConfig
        from unittest.mock import patch, AsyncMock

        mock_tab._execute_command.return_value = {
            'result': {'result': {'value': '[400, 300]'}}
        }

        timing = ScrollTimingConfig(
            min_duration=0.05,
            max_duration=0.05,
            frame_interval=0.001,
            micro_pause_probability=0.0,
            delta_jitter=0,  # jitter disabled to keep the run predictable
        )
        scroller = Scroll(mock_tab, timing=timing)

        with patch('asyncio.sleep', new_callable=AsyncMock):
            total = await scroller._perform_scroll_loop(
                effective_distance=100.0,
                duration=0.05,
                is_vertical=True,
                direction=1,
            )

        # Some distance must have been covered.
        assert total > 0


class TestScrollCorrection:
    """Test _scroll_correction method.

    Each test replaces ``Scroll._dispatch_scroll_event`` with a recording
    coroutine and runs ``_scroll_correction`` under a 2-second
    ``asyncio.wait_for`` guard so a misbehaving loop cannot hang the suite.
    A timeout is deliberately swallowed: the assertions only inspect what
    was dispatched before the guard fired.
    """

    @pytest.mark.asyncio
    async def test_scroll_correction_dispatches_scroll_events(self, mock_tab):
        """Test correction dispatches scroll events progressively."""
        from pydoll.interactions.scroll import Scroll, ScrollTimingConfig
        import asyncio

        config = ScrollTimingConfig(frame_interval=0.001)
        scroll = Scroll(mock_tab, timing=config)

        # Record every (delta_x, delta_y) pair handed to the dispatcher.
        dispatch_calls = []

        async def tracking_dispatch(delta_x, delta_y):
            dispatch_calls.append((delta_x, delta_y))

        scroll._dispatch_scroll_event = tracking_dispatch

        # Run with timeout to prevent hanging
        try:
            await asyncio.wait_for(
                scroll._scroll_correction(
                    is_vertical=True,
                    direction=-1,
                    distance=10.0,
                ),
                timeout=2.0,
            )
        except asyncio.TimeoutError:
            pass  # Intentional: the assertion below still checks the calls

        # Should have dispatched at least one event
        assert len(dispatch_calls) >= 1

    @pytest.mark.asyncio
    async def test_scroll_correction_horizontal(self, mock_tab):
        """Test correction works for horizontal scrolling."""
        from pydoll.interactions.scroll import Scroll, ScrollTimingConfig
        import asyncio

        # Use larger frame_interval so delta is >= 1
        config = ScrollTimingConfig(frame_interval=0.01)
        scroll = Scroll(mock_tab, timing=config)

        dispatch_calls = []

        async def tracking_dispatch(delta_x, delta_y):
            dispatch_calls.append((delta_x, delta_y))

        scroll._dispatch_scroll_event = tracking_dispatch

        try:
            await asyncio.wait_for(
                scroll._scroll_correction(
                    is_vertical=False,
                    direction=1,
                    distance=10.0,
                ),
                timeout=2.0,
            )
        except asyncio.TimeoutError:
            pass  # Intentional: the assertion below still checks the calls

        # Should have dispatched at least one event
        assert len(dispatch_calls) >= 1

    @pytest.mark.asyncio
    async def test_scroll_correction_velocity_decreases(self, mock_tab):
        """Test correction velocity decreases over time."""
        from pydoll.interactions.scroll import Scroll, ScrollTimingConfig
        import asyncio

        config = ScrollTimingConfig(frame_interval=0.001)
        scroll = Scroll(mock_tab, timing=config)

        # Only the magnitude of the vertical delta matters here.
        call_deltas = []

        async def tracking_dispatch(delta_x, delta_y):
            call_deltas.append(abs(delta_y))

        scroll._dispatch_scroll_event = tracking_dispatch

        try:
            await asyncio.wait_for(
                scroll._scroll_correction(
                    is_vertical=True,
                    direction=1,
                    distance=50.0,
                ),
                timeout=2.0,
            )
        except asyncio.TimeoutError:
            pass  # Intentional: the assertion below still checks the calls

        # Velocity should be decreasing (later deltas smaller). The check is
        # skipped when fewer than two events were dispatched, because a
        # single sample has nothing to compare against.
        if len(call_deltas) >= 2:
            assert call_deltas[0] >= call_deltas[-1]


class TestPublicMethodsWithHumanize:
    """Check that humanize=True sends public calls to the humanized helpers."""

    @pytest.mark.asyncio
    async def test_by_with_humanize_calls_scroll_humanized(self, mock_tab):
        """by(..., humanize=True) calls _scroll_humanized once with its arguments."""
        from pydoll.interactions.scroll import Scroll
        from pydoll.constants import ScrollPosition
        from unittest.mock import AsyncMock

        scroller = Scroll(mock_tab)
        humanized_mock = AsyncMock()
        scroller._scroll_humanized = humanized_mock

        await scroller.by(ScrollPosition.DOWN, 100, humanize=True)

        humanized_mock.assert_called_once_with(ScrollPosition.DOWN, 100)

    @pytest.mark.asyncio
    async def test_to_top_with_humanize_calls_scroll_to_end_humanized(self, mock_tab):
        """to_top(humanize=True) calls _scroll_to_end_humanized with UP."""
        from pydoll.interactions.scroll import Scroll
        from pydoll.constants import ScrollPosition
        from unittest.mock import AsyncMock

        scroller = Scroll(mock_tab)
        to_end_mock = AsyncMock()
        scroller._scroll_to_end_humanized = to_end_mock

        await scroller.to_top(humanize=True)

        to_end_mock.assert_called_once_with(ScrollPosition.UP)

    @pytest.mark.asyncio
    async def test_to_bottom_with_humanize_calls_scroll_to_end_humanized(self, mock_tab):
        """to_bottom(humanize=True) calls _scroll_to_end_humanized with DOWN."""
        from pydoll.interactions.scroll import Scroll
        from pydoll.constants import ScrollPosition
        from unittest.mock import AsyncMock

        scroller = Scroll(mock_tab)
        to_end_mock = AsyncMock()
        scroller._scroll_to_end_humanized = to_end_mock

        await scroller.to_bottom(humanize=True)

        to_end_mock.assert_called_once_with(ScrollPosition.DOWN)


class TestScrollAPIBackwardCompatibility:
    """Guard the legacy ScrollAPI name exported next to Scroll."""

    def test_scroll_api_alias(self):
        """ScrollAPI must be the very same object as Scroll, not a copy."""
        from pydoll.interactions.scroll import Scroll, ScrollAPI

        legacy_name, current_name = ScrollAPI, Scroll
        assert legacy_name is current_name


================================================
FILE: tests/test_managers/test_browser_managers.py
================================================
from unittest.mock import MagicMock, Mock, patch, ANY

import pytest

from pydoll.browser.managers import (
    ChromiumOptionsManager,
    BrowserProcessManager,
    ProxyManager,
    TempDirectoryManager,
)
from pydoll.browser.options import ChromiumOptions as Options
from pydoll.exceptions import InvalidOptionsObject


@pytest.fixture
def proxy_options():
    """Provide a fresh ChromiumOptions instance (imported here as Options)."""
    options = Options()
    return options


@pytest.fixture
def temp_manager():
    """Provide a TempDirectoryManager whose factory returns one mocked directory."""
    fake_dir = MagicMock()
    fake_dir.name = '/fake/temp/dir'

    def _factory():
        # Always hand back the same mock so tests can inspect its name.
        return fake_dir

    return TempDirectoryManager(temp_dir_factory=_factory)


@pytest.fixture
def process_manager():
    """Provide a BrowserProcessManager backed by a mocked process creator."""
    creator = Mock()
    creator.return_value = MagicMock()
    return BrowserProcessManager(process_creator=creator)


@pytest.fixture
def chromium_options_manager(proxy_options):
    """Provide a ChromiumOptionsManager wrapping the proxy_options fixture."""
    return ChromiumOptionsManager(proxy_options)


def test_proxy_manager_no_proxy(proxy_options):
    """With no proxy argument set, no credentials are reported."""
    outcome = ProxyManager(proxy_options).get_proxy_credentials()
    found, credentials = outcome[0], outcome[1]

    assert found is False
    assert credentials == (None, None)


def test_proxy_manager_with_credentials(proxy_options):
    """user:pass is extracted and removed from the stored proxy argument."""
    proxy_options.add_argument('--proxy-server=user:pass@example.com')
    proxy_manager = ProxyManager(proxy_options)

    outcome = proxy_manager.get_proxy_credentials()
    found, credentials = outcome[0], outcome[1]

    assert found is True
    assert credentials == ('user', 'pass')
    # The argument list must now carry the proxy without credentials.
    assert proxy_options.arguments == ['--proxy-server=example.com']


def test_proxy_manager_invalid_credentials_format(proxy_options):
    """A user-info part without ':' yields no credentials and is left as-is."""
    proxy_options.add_argument('--proxy-server=invalidformat@example.com')
    proxy_manager = ProxyManager(proxy_options)

    outcome = proxy_manager.get_proxy_credentials()
    found, credentials = outcome[0], outcome[1]

    assert found is False
    assert credentials == (None, None)
    # The original argument must be untouched.
    untouched = ['--proxy-server=invalidformat@example.com']
    assert proxy_options.arguments == untouched


def test_proxy_manager_with_scheme_http(proxy_options):
    """Credentials are stripped while the http:// scheme and port are kept."""
    proxy_options.add_argument('--proxy-server=http://user:pass@proxy.local:8080')
    proxy_manager = ProxyManager(proxy_options)

    outcome = proxy_manager.get_proxy_credentials()
    found, credentials = outcome[0], outcome[1]

    assert found is True
    assert credentials == ('user', 'pass')
    assert proxy_options.arguments == ['--proxy-server=http://proxy.local:8080']


def test_proxy_manager_with_scheme_socks(proxy_options):
    """Credentials are stripped while the socks5:// scheme and port are kept."""
    proxy_options.add_argument('--proxy-server=socks5://alice:pwd@1.2.3.4:1080')
    proxy_manager = ProxyManager(proxy_options)

    outcome = proxy_manager.get_proxy_credentials()
    found, credentials = outcome[0], outcome[1]

    assert found is True
    assert credentials == ('alice', 'pwd')
    assert proxy_options.arguments == ['--proxy-server=socks5://1.2.3.4:1080']


def test_proxy_manager_invalid_proxy_format(proxy_options):
    """A proxy value with no user-info part reports no credentials."""
    proxy_options.add_argument('--proxy-server=invalidformat')
    proxy_manager = ProxyManager(proxy_options)

    outcome = proxy_manager.get_proxy_credentials()
    found, credentials = outcome[0], outcome[1]

    assert found is False
    assert credentials == (None, None)


def test_start_browser_process(process_manager):
    """The creator receives binary, debugging-port flag, then the extra args."""
    binary, port = '/fake/path/browser', 9222
    args = ['--test-arg']

    process_manager.start_browser_process(binary, port, args)

    expected_command = [binary, f'--remote-debugging-port={port}'] + args
    process_manager._process_creator.assert_called_once_with(expected_command)
    # The created process must have been stored on the manager.
    assert process_manager._process is not None


def test_stop_process(process_manager):
    """stop_process() terminates the stored process exactly once."""
    running = MagicMock()
    process_manager._process = running

    process_manager.stop_process()

    running.terminate.assert_called_once()


def test_create_temp_dir(temp_manager):
    """create_temp_dir() tracks one directory and returns the factory's object."""
    created = temp_manager.create_temp_dir()

    tracked_count = len(temp_manager._temp_dirs)
    assert tracked_count == 1
    assert created.name == '/fake/temp/dir'


def test_cleanup_temp_dirs(temp_manager):
    """cleanup() calls shutil.rmtree once per tracked directory."""
    first_dir = MagicMock()
    second_dir = MagicMock()
    temp_manager._temp_dirs = [first_dir, second_dir]

    with patch('shutil.rmtree') as rmtree_mock:
        temp_manager.cleanup()

        assert rmtree_mock.call_count == 2
        # Any onerror handler is accepted; only the path is pinned.
        for tracked in (first_dir, second_dir):
            rmtree_mock.assert_any_call(tracked.name, onerror=ANY)


def test_retry_process_file(temp_manager):
    """Cover the three retry modes of retry_process_file.

    1. Success on the final permitted attempt.
    2. PermissionError re-raised once the retry budget is exhausted.
    3. retry_times=-1 keeps retrying until the call succeeds.
    """
    operation = Mock()
    path = "/test/path"

    # 1. Fail four times, succeed on the fifth (== retry_times).
    attempts_needed = 5
    operation.side_effect = [PermissionError] * (attempts_needed - 1) + [None]
    temp_manager.retry_process_file(operation, path, retry_times=attempts_needed)
    assert operation.call_count == attempts_needed

    # 2. Always failing: the error surfaces after exactly three calls.
    operation.reset_mock()
    operation.side_effect = PermissionError
    with pytest.raises(PermissionError):
        temp_manager.retry_process_file(operation, path, retry_times=3)
    assert operation.call_count == 3

    # 3. Unlimited retries: nine failures followed by one success.
    operation.reset_mock()
    operation.side_effect = [PermissionError] * 9 + [None]
    temp_manager.retry_process_file(operation, path, retry_times=-1)
    assert operation.call_count == 10


def test_handle_cleanup_error(temp_manager):
    """Walk through each branch of handle_cleanup_error.

    The third argument mimics the ``(type, value, traceback)`` triple that
    an rmtree ``onerror`` hook receives.
    """
    remover = Mock()
    crashpad_path = "/tmp/CrashpadMetrics-active.pma"

    # PermissionError on the Crashpad metrics file: a retry is attempted.
    temp_manager.retry_process_file = Mock()
    temp_manager.handle_cleanup_error(
        remover, crashpad_path, (PermissionError, PermissionError(), None)
    )
    temp_manager.retry_process_file.assert_called_once_with(remover, crashpad_path)

    # Same file, but the retry itself fails: nothing may propagate.
    temp_manager.retry_process_file = Mock(side_effect=PermissionError)
    temp_manager.handle_cleanup_error(
        remover, crashpad_path, (PermissionError, PermissionError(), None)
    )

    # PermissionError on any other file: the very same exception is raised.
    temp_manager.retry_process_file = Mock()
    denied = PermissionError("Access denied")
    with pytest.raises(PermissionError) as caught:
        temp_manager.handle_cleanup_error(
            remover, "/tmp/test.file", (PermissionError, denied, None)
        )
    assert caught.value is denied

    # A plain OSError is tolerated silently.
    temp_manager.handle_cleanup_error(remover, "/tmp/path", (OSError, OSError(), None))

    # Any other exception type is re-raised unchanged.
    unexpected = ValueError("Test")
    with pytest.raises(ValueError) as caught:
        temp_manager.handle_cleanup_error(
            remover, "/tmp/path", (ValueError, unexpected, None)
        )
    assert caught.value is unexpected


def test_initialize_options_with_none(chromium_options_manager):
    """initialize_options() returns Options holding exactly the two default flags."""
    initialized = chromium_options_manager.initialize_options()
    expected_arguments = ['--no-first-run', '--no-default-browser-check']

    assert isinstance(initialized, Options)
    assert initialized.arguments == expected_arguments


def test_initialize_options_with_valid_options():
    """A caller-supplied Options object is returned as the same instance."""
    supplied = Options()
    supplied.add_argument('--test')

    initialized = ChromiumOptionsManager(supplied).initialize_options()

    assert initialized is supplied
    assert '--test' in initialized.arguments


def test_initialize_options_with_invalid_type():
    """A non-Options argument makes initialize_options raise InvalidOptionsObject."""
    manager = ChromiumOptionsManager('invalid options object')

    with pytest.raises(InvalidOptionsObject):
        manager.initialize_options()


def test_add_default_arguments():
    """add_default_arguments() puts both default flags on the wrapped options."""
    options = Options()
    ChromiumOptionsManager(options).add_default_arguments()

    arguments = options.arguments
    assert '--no-first-run' in arguments
    assert '--no-default-browser-check' in arguments


def test_initialize_options_creates_new_instance():
    """Passing None yields an Options instance carrying both default flags."""
    initialized = ChromiumOptionsManager(None).initialize_options()

    assert isinstance(initialized, Options)
    arguments = initialized.arguments
    assert '--no-first-run' in arguments
    assert '--no-default-browser-check' in arguments


def test_initialize_options_preserves_custom_arguments():
    """Custom flags survive initialization alongside both default flags."""
    supplied = Options()
    supplied.add_argument('--custom-flag')

    initialized = ChromiumOptionsManager(supplied).initialize_options()

    arguments = initialized.arguments
    assert '--custom-flag' in arguments
    assert '--no-first-run' in arguments
    assert '--no-default-browser-check' in arguments


================================================
FILE: tests/test_managers/test_connection_managers.py
================================================
import pytest

from pydoll import exceptions
from pydoll.connection.managers import CommandsManager, EventsManager


@pytest.fixture
def commands_manager():
    """Return a fresh CommandsManager instance for the tests."""
    manager = CommandsManager()
    return manager


@pytest.fixture
def events_manager():
    """Return a fresh EventsManager instance for the tests."""
    manager = EventsManager()
    return manager


def test_create_command_future(commands_manager):
    """Commands receive incrementing IDs and their futures are tracked as pending."""
    pending = commands_manager._pending_commands

    first_command = {'method': 'TestMethod'}
    first_future = commands_manager.create_command_future(first_command)

    # The ID is written into the command dict itself.
    assert first_command['id'] == 1, 'The first command ID should be 1'
    # The future is stored in the pending-commands mapping.
    assert 1 in pending
    assert pending[1] is first_future

    # A second command must receive the next ID.
    next_command = {'method': 'SecondMethod'}
    next_future = commands_manager.create_command_future(next_command)
    assert next_command['id'] == 2, 'The second command ID should be 2'
    assert 2 in commands_manager._pending_commands
    assert commands_manager._pending_commands[2] is next_future


def test_resolve_command(commands_manager):
    """Resolving a pending command completes its future and drops the entry."""
    command = {'method': 'TestMethod'}
    pending_future = commands_manager.create_command_future(command)
    payload = '{"result": "success"}'

    # The future must still be pending before it is resolved.
    assert not pending_future.done(), (
        'The future should not be completed before resolution'
    )

    # Resolve the command and check the delivered result.
    commands_manager.resolve_command(1, payload)
    assert pending_future.done(), (
        'The future should be completed after resolution'
    )
    assert pending_future.result() == payload, (
        'The future result does not match the expected result'
    )
    # The pending entry must have been removed.
    assert 1 not in commands_manager._pending_commands


def test_resolve_unknown_command(commands_manager):
    """Resolving an unknown ID leaves existing pending futures untouched."""
    command = {'method': 'TestMethod'}
    pending_future = commands_manager.create_command_future(command)

    # ID 999 was never issued; the original future must stay pending.
    commands_manager.resolve_command(999, '{"result": "ignored"}')

    still_pending = not pending_future.done()
    assert still_pending, (
        'The future should not be completed after resolving an unknown command'
    )


def test_remove_pending_command(commands_manager):
    """Removing a pending command drops it; removing it again must not raise."""
    command = {'method': 'TestMethod'}
    commands_manager.create_command_future(command)

    # Remove the pending command and confirm it is gone.
    commands_manager.remove_pending_command(1)
    assert 1 not in commands_manager._pending_commands, (
        'The pending command should be removed'
    )

    # A second removal of the same ID has to be a harmless no-op.
    commands_manager.remove_pending_command(1)


def test_register_callback_success(events_manager):
    """Registering a callback returns ID 1 and stores it as non-temporary."""

    # A named function replaces the assigned lambda (PEP 8 discourages
    # binding a lambda expression to a name).
    def dummy_callback(event):
        return event

    callback_id = events_manager.register_callback('TestEvent', dummy_callback)

    assert callback_id == 1, 'The first callback ID should be 1'
    assert callback_id in events_manager._event_callbacks, (
        'The callback must be registered'
    )
    callback_info = events_manager._event_callbacks[callback_id]
    assert callback_info['temporary'] is False, (
        'The temporary flag should be False by default'
    )


def test_remove_existing_callback(events_manager):
    """Removing a registered callback returns True and unregisters it."""

    # A named function replaces the assigned lambda (PEP 8 discourages
    # binding a lambda expression to a name).
    def dummy_callback(event):
        return event

    callback_id = events_manager.register_callback('TestEvent', dummy_callback)
    removal_result = events_manager.remove_callback(callback_id)

    assert removal_result is True, (
        'The removal of a existing callback should be successful'
    )
    assert callback_id not in events_manager._event_callbacks, (
        'The callback should be removed'
    )


def test_remove_nonexistent_callback(events_manager):
    """Removing an ID that was never registered returns False."""
    outcome = events_manager.remove_callback(999)

    assert outcome is False, (
        'The removal of a nonexistent callback should return False'
    )


def test_clear_callbacks(events_manager):
    """clear_callbacks() empties the registry regardless of event name."""

    # A named function replaces the assigned lambda (PEP 8 discourages
    # binding a lambda expression to a name).
    def dummy_callback(event):
        return event

    events_manager.register_callback('EventA', dummy_callback)
    events_manager.register_callback('EventB', dummy_callback)

    events_manager.clear_callbacks()
    assert len(events_manager._event_callbacks) == 0, (
        'All callbacks should be cleared'
    )


@pytest.mark.asyncio
async def test_process_event_updates_network_logs(events_manager):
    """A Network.requestWillBeSent event ends up in network_logs."""
    # The log starts out empty on a fresh manager.
    assert events_manager.network_logs == []

    request_event = {
        'method': 'Network.requestWillBeSent',
        'url': 'http://example.com',
    }
    await events_manager.process_event(request_event)

    logged = request_event in events_manager.network_logs
    assert logged, (
        'The network event should be added to the logs'
    )


@pytest.mark.asyncio
async def test_process_event_triggers_callbacks(events_manager):
    """Sync and async callbacks both fire; only the temporary one is removed."""
    seen = []

    def sync_callback(event):
        seen.append(('sync', event.get('value')))

    async def async_callback(event):
        seen.append(('async', event.get('value')))

    # The sync callback is temporary, the async one is permanent.
    temporary_id = events_manager.register_callback(
        'MyCustomEvent', sync_callback, temporary=True
    )
    permanent_id = events_manager.register_callback(
        'MyCustomEvent', async_callback, temporary=False
    )

    await events_manager.process_event({'method': 'MyCustomEvent', 'value': 123})

    assert ('sync', 123) in seen, (
        'The synchronous callback was not triggered correctly'
    )
    assert ('async', 123) in seen, (
        'The asynchronous callback was not triggered correctly'
    )

    registry = events_manager._event_callbacks
    assert temporary_id not in registry, (
        'The temporary callback should be removed after execution'
    )
    assert permanent_id in registry, (
        'The permanent callback should remain registered'
    )


@pytest.mark.asyncio
async def test_trigger_callbacks_error_handling(events_manager, caplog):
    """A raising temporary callback is still removed and its error is logged."""

    def faulty_callback(event):
        raise ValueError('Error in callback')

    callback_id = events_manager.register_callback(
        'ErrorEvent', faulty_callback, temporary=True
    )

    # process_event itself must not propagate the callback's exception.
    await events_manager.process_event({'method': 'ErrorEvent'})

    assert callback_id not in events_manager._event_callbacks, (
        'The callback with error should be removed after execution'
    )
    was_logged = any(
        'Error in callback' in entry.message for entry in caplog.records
    )
    assert was_logged, 'The error in the callback should be logged'


================================================
FILE: tests/test_nested_oopif_integration.py
================================================
"""Integration tests for nested cross-origin iframe (OOPIF) resolution.

Two HTTP servers on different ports simulate cross-origin boundaries,
triggering Chrome's site isolation (OOPIF) mechanism. Tests verify
that Pydoll correctly routes CDP commands through the right session
handler when resolving nested iframes inside OOPIFs.
"""

import asyncio
import http.server
import socket
import threading
from pathlib import Path

import pytest

from pydoll.browser.chromium import Chrome

PAGES_DIR = Path(__file__).parent / 'pages' / 'oopif'


class _SilentHandler(http.server.SimpleHTTPRequestHandler):
    """SimpleHTTPRequestHandler whose log_message override does nothing."""

    def log_message(self, *args):
        # Intentionally a no-op so request logging stays out of test output.
        return None


def _wait_for_server(host: str, port: int, timeout: float = 5.0) -> None:
    """Block until the server at host:port accepts a TCP connection.

    Connection attempts are repeated until one succeeds or ``timeout``
    seconds have elapsed. Each attempt's connect timeout and the pause
    between attempts are clamped to the time left, so the overall wait does
    not run past the requested deadline.

    Args:
        host: Host name or address to connect to.
        port: TCP port to connect to.
        timeout: Maximum total time to wait, in seconds.

    Raises:
        RuntimeError: If no connection succeeded within ``timeout``. The
            last ``OSError`` seen (if any) is attached as ``__cause__``.
    """
    import time

    deadline = time.monotonic() + timeout
    last_error = None
    while True:
        remaining = deadline - time.monotonic()
        if remaining <= 0:
            break
        try:
            # Never let a single attempt outlive the overall deadline.
            with socket.create_connection(
                (host, port), timeout=min(0.5, remaining)
            ):
                return
        except OSError as exc:
            last_error = exc
            # Short back-off, but never sleep beyond the deadline.
            time.sleep(min(0.05, max(0.0, deadline - time.monotonic())))
    raise RuntimeError(
        f'Server {host}:{port} not ready within {timeout}s'
    ) from last_error


@pytest.fixture(scope='module')
def cross_origin_servers():
    """Two HTTP servers on different ports -> different origins -> OOPIF.

    Both servers bind to 127.0.0.1 on OS-assigned ports, serve files from
    ``PAGES_DIR`` and run ``serve_forever`` in daemon threads.

    Yields:
        tuple[int, int]: ``(port_a, port_b)`` of the two servers.

    On teardown -- including when the readiness wait fails -- each server is
    shut down and its listening socket is closed.
    """

    def _handler():
        # Build a handler class that pins the served directory to PAGES_DIR.
        class H(_SilentHandler):
            def __init__(self, *a, **kw):
                super().__init__(*a, directory=str(PAGES_DIR), **kw)

        return H

    srv_a = http.server.HTTPServer(('127.0.0.1', 0), _handler())
    srv_b = http.server.HTTPServer(('127.0.0.1', 0), _handler())
    servers = (srv_a, srv_b)
    port_a = srv_a.server_address[1]
    port_b = srv_b.server_address[1]

    for srv in servers:
        threading.Thread(target=srv.serve_forever, daemon=True).start()

    try:
        _wait_for_server('127.0.0.1', port_a)
        _wait_for_server('127.0.0.1', port_b)

        yield port_a, port_b
    finally:
        for srv in servers:
            # shutdown() stops the serve_forever loop; server_close()
            # releases the listening socket, which shutdown() alone does not.
            srv.shutdown()
            srv.server_close()


class TestCrossOriginIframeResolution:
    """Locate and use elements that live inside a cross-origin (OOPIF) iframe."""

    @pytest.mark.asyncio
    async def test_find_element_in_cross_origin_iframe(
        self, ci_chrome_options, cross_origin_servers
    ):
        """A heading inside the cross-origin iframe is found and readable."""
        main_port, frame_port = cross_origin_servers
        page_url = f'http://127.0.0.1:{main_port}/oopif_main.html?port={frame_port}'
        ci_chrome_options.add_argument('--site-per-process')

        async with Chrome(options=ci_chrome_options) as browser:
            tab = await browser.start()
            await tab.go_to(page_url)

            frame = await tab.find(id='cross-origin-iframe', timeout=10)
            assert frame.is_iframe

            heading = await frame.find(id='oopif-heading', timeout=10)
            heading_text = await heading.text
            assert heading_text == 'Cross-Origin Content'

    @pytest.mark.asyncio
    async def test_click_button_in_cross_origin_iframe(
        self, ci_chrome_options, cross_origin_servers
    ):
        """Clicking the iframe's button moves its counter text from '0' to '1'."""
        main_port, frame_port = cross_origin_servers
        page_url = f'http://127.0.0.1:{main_port}/oopif_main.html?port={frame_port}'
        ci_chrome_options.add_argument('--site-per-process')

        async with Chrome(options=ci_chrome_options) as browser:
            tab = await browser.start()
            await tab.go_to(page_url)

            frame = await tab.find(id='cross-origin-iframe', timeout=10)
            button = await frame.find(id='oopif-btn', timeout=10)
            counter = await frame.find(id='oopif-btn-count', timeout=10)

            before = await counter.text
            assert before == '0'

            await button.click()
            # Short pause before re-reading the counter after the click.
            await asyncio.sleep(0.3)

            after = await counter.text
            assert after == '1'


class TestNestedIframeInsideOopif:
    """Reach elements in an iframe that is nested inside a cross-origin iframe."""

    @pytest.mark.asyncio
    async def test_find_element_in_nested_iframe_inside_oopif(
        self, ci_chrome_options, cross_origin_servers
    ):
        """Path under test: main page -> OOPIF -> nested iframe -> heading."""
        main_port, frame_port = cross_origin_servers
        page_url = f'http://127.0.0.1:{main_port}/oopif_main.html?port={frame_port}'
        ci_chrome_options.add_argument('--site-per-process')

        async with Chrome(options=ci_chrome_options) as browser:
            tab = await browser.start()
            await tab.go_to(page_url)

            outer_frame = await tab.find(id='cross-origin-iframe', timeout=10)
            inner_frame = await outer_frame.find(id='nested-iframe', timeout=10)
            assert inner_frame.is_iframe

            heading = await inner_frame.find(id='nested-heading', timeout=10)
            heading_text = await heading.text
            assert heading_text == 'Nested Iframe Content'

    @pytest.mark.asyncio
    async def test_type_text_in_nested_iframe_inside_oopif(
        self, ci_chrome_options, cross_origin_servers
    ):
        """Text typed into the nested iframe's input is readable from its value."""
        main_port, frame_port = cross_origin_servers
        page_url = f'http://127.0.0.1:{main_port}/oopif_main.html?port={frame_port}'
        ci_chrome_options.add_argument('--site-per-process')

        async with Chrome(options=ci_chrome_options) as browser:
            tab = await browser.start()
            await tab.go_to(page_url)

            outer_frame = await tab.find(id='cross-origin-iframe', timeout=10)
            inner_frame = await outer_frame.find(id='nested-iframe', timeout=10)

            text_input = await inner_frame.find(id='nested-input', timeout=10)
            await text_input.type_text('hello from nested oopif')
            # Short pause before reading the value back.
            await asyncio.sleep(0.3)

            response = await text_input.execute_script(
                'return this.value', return_by_value=True
            )
            typed_value = response['result']['result']['value']
            assert typed_value == 'hello from nested oopif'


class TestShadowRootInsideOopif:
    """Discover and interact with a shadow root hosted inside an OOPIF."""

    @pytest.mark.asyncio
    async def test_find_shadow_roots_inside_oopif(
        self, ci_chrome_options, cross_origin_servers
    ):
        """find_shadow_roots(True) must include the shadow root inside the OOPIF."""
        main_port, frame_port = cross_origin_servers
        page_url = f'http://127.0.0.1:{main_port}/oopif_main.html?port={frame_port}'
        ci_chrome_options.add_argument('--site-per-process')

        async with Chrome(options=ci_chrome_options) as browser:
            tab = await browser.start()
            await tab.go_to(page_url)

            for shadow_root in await tab.find_shadow_roots(True, timeout=10):
                markup = await shadow_root.inner_html
                # Skip every shadow root except the one carrying the marker.
                if 'Shadow content inside OOPIF' not in markup:
                    continue

                text_node = await shadow_root.query('#shadow-text', timeout=10)
                node_text = await text_node.text
                assert node_text == 'Shadow content inside OOPIF'
                return

            pytest.fail('Shadow root inside OOPIF not found via find_shadow_roots')

    @pytest.mark.asyncio
    async def test_click_button_in_shadow_root_inside_oopif(
        self, ci_chrome_options, cross_origin_servers
    ):
        """Clicking the shadow-root button moves its counter from '0' to '1'."""
        main_port, frame_port = cross_origin_servers
        page_url = f'http://127.0.0.1:{main_port}/oopif_main.html?port={frame_port}'
        ci_chrome_options.add_argument('--site-per-process')

        async with Chrome(options=ci_chrome_options) as browser:
            tab = await browser.start()
            await tab.go_to(page_url)

            for shadow_root in await tab.find_shadow_roots(True, timeout=10):
                markup = await shadow_root.inner_html
                if 'Shadow content inside OOPIF' not in markup:
                    continue

                button = await shadow_root.query('#shadow-btn', timeout=10)
                counter = await shadow_root.query('#shadow-btn-count', timeout=10)
                before = await counter.text
                assert before == '0'

                await button.click()
                # Short pause before re-reading the counter after the click.
                await asyncio.sleep(0.3)
                after = await counter.text
                assert after == '1'
                return

            pytest.fail('Shadow root inside OOPIF not found')


class TestIframeInsideShadowRootInsideOopif:
    """The exact bug scenario: main -> OOPIF -> shadow root -> iframe."""

    @staticmethod
    async def _oopif_shadow_root(tab):
        """Return the first shadow root whose markup carries the OOPIF marker.

        Shadow roots are inspected in the order ``find_shadow_roots`` returns
        them, stopping at the first match. The running test is failed when
        none of them matches.
        """
        for candidate in await tab.find_shadow_roots(True, timeout=10):
            markup = await candidate.inner_html
            if 'Shadow content inside OOPIF' in markup:
                return candidate
        pytest.fail('Shadow root inside OOPIF not found')

    @pytest.mark.asyncio
    async def test_find_element_in_iframe_inside_shadow_in_oopif(
        self, ci_chrome_options, cross_origin_servers
    ):
        """Find an element inside an iframe nested in an OOPIF shadow root.

        Reproduces the original bug where IFrameContextResolver failed with
        InvalidIFrame because DOM.getFrameOwner was routed through the wrong
        session handler.
        """
        port_a, port_b = cross_origin_servers
        page_url = f'http://127.0.0.1:{port_a}/oopif_main.html?port={port_b}'

        ci_chrome_options.add_argument('--site-per-process')
        async with Chrome(options=ci_chrome_options) as browser:
            tab = await browser.start()
            await tab.go_to(page_url)

            root = await self._oopif_shadow_root(tab)
            frame = await root.query('#shadow-iframe', timeout=10)
            assert frame.is_iframe

            heading = await frame.find(id='shadow-iframe-heading', timeout=10)
            assert await heading.text == 'Shadow Iframe Content'

    @pytest.mark.asyncio
    async def test_type_text_in_iframe_inside_shadow_in_oopif(
        self, ci_chrome_options, cross_origin_servers
    ):
        """Type text through: main -> OOPIF -> shadow root -> iframe -> input."""
        port_a, port_b = cross_origin_servers
        page_url = f'http://127.0.0.1:{port_a}/oopif_main.html?port={port_b}'

        ci_chrome_options.add_argument('--site-per-process')
        async with Chrome(options=ci_chrome_options) as browser:
            tab = await browser.start()
            await tab.go_to(page_url)

            root = await self._oopif_shadow_root(tab)
            frame = await root.query('#shadow-iframe', timeout=10)
            text_input = await frame.find(id='shadow-iframe-input', timeout=10)

            await text_input.type_text('deep nested text')
            # Brief pause between typing and reading the value back.
            await asyncio.sleep(0.3)
            script_result = await text_input.execute_script(
                'return this.value', return_by_value=True
            )
            assert script_result['result']['result']['value'] == 'deep nested text'


================================================
FILE: tests/test_shadow_root.py
================================================
import uuid
from unittest.mock import AsyncMock, MagicMock, patch

import pytest
import pytest_asyncio

from pydoll.browser.tab import Tab
from pydoll.elements.shadow_root import ShadowRoot
from pydoll.elements.web_element import WebElement
from pydoll.exceptions import (
    CommandExecutionTimeout,
    ElementNotFound,
    ShadowRootNotFound,
    WaitElementTimeout,
    WebSocketConnectionClosed,
)
from pydoll.interactions.iframe import IFrameContext
from pydoll.protocol.dom.types import ShadowRootType


@pytest_asyncio.fixture
async def mock_connection_handler():
    """Yield a patched ConnectionHandler instance for ShadowRoot tests.

    ``pydoll.connection.ConnectionHandler`` is patched with ``autospec`` for
    the lifetime of the fixture; the yielded object is the patched class's
    ``return_value`` with ``execute_command`` replaced by an ``AsyncMock``.
    """
    with patch('pydoll.connection.ConnectionHandler', autospec=True) as handler_cls:
        fake_handler = handler_cls.return_value
        fake_handler.execute_command = AsyncMock()
        yield fake_handler


@pytest.fixture
def shadow_root(mock_connection_handler):
    """Provide an open-mode ShadowRoot backed by the mocked connection handler."""
    open_root = ShadowRoot(
        object_id='shadow-root-object-id',
        connection_handler=mock_connection_handler,
        mode=ShadowRootType.OPEN,
    )
    return open_root


@pytest.fixture
def host_element(mock_connection_handler):
    """Provide a WebElement (``#host``, found via CSS) to act as shadow host."""
    element_kwargs = {
        'object_id': 'host-object-id',
        'connection_handler': mock_connection_handler,
        'method': 'css',
        'selector': '#host',
        'attributes_list': ['id', 'host', 'tag_name', 'div'],
    }
    return WebElement(**element_kwargs)


class TestShadowRootInit:
    """Constructor behaviour of ShadowRoot."""

    def test_init_with_defaults(self, mock_connection_handler):
        """With only required arguments, mode is OPEN and there is no host."""
        root = ShadowRoot(object_id='sr-id', connection_handler=mock_connection_handler)

        assert root._object_id == 'sr-id'
        assert root._connection_handler is mock_connection_handler
        assert root._mode == ShadowRootType.OPEN
        assert root._host_element is None

    def test_init_with_all_params(self, mock_connection_handler, host_element):
        """Explicit mode and host element are stored on the instance."""
        init_kwargs = {
            'object_id': 'sr-id',
            'connection_handler': mock_connection_handler,
            'mode': ShadowRootType.CLOSED,
            'host_element': host_element,
        }
        root = ShadowRoot(**init_kwargs)

        assert root._object_id == 'sr-id'
        assert root._mode == ShadowRootType.CLOSED
        assert root._host_element is host_element

    def test_init_with_user_agent_mode(self, mock_connection_handler):
        """The USER_AGENT mode is accepted and stored unchanged."""
        root = ShadowRoot(
            object_id='sr-id',
            connection_handler=mock_connection_handler,
            mode=ShadowRootType.USER_AGENT,
        )

        assert root._mode == ShadowRootType.USER_AGENT


class TestShadowRootProperties:
    """Public read-only properties of ShadowRoot."""

    def test_mode_property(self, shadow_root):
        """``mode`` reports the mode the fixture was built with."""
        observed_mode = shadow_root.mode
        assert observed_mode == ShadowRootType.OPEN

    def test_host_element_none(self, shadow_root):
        """``host_element`` is None when no host was supplied."""
        observed_host = shadow_root.host_element
        assert observed_host is None

    def test_host_element_with_reference(self, mock_connection_handler, host_element):
        """``host_element`` returns the very object passed to the constructor."""
        root = ShadowRoot(
            object_id='sr-id',
            connection_handler=mock_connection_handler,
            host_element=host_element,
        )
        observed_host = root.host_element
        assert observed_host is host_element


class TestShadowRootInnerHtml:
    """Behaviour of the awaitable ``ShadowRoot.inner_html`` property."""

    @pytest.mark.asyncio
    async def test_inner_html(self, shadow_root):
        """The ``outerHTML`` from the command response is returned as-is."""
        execute = shadow_root._connection_handler.execute_command
        execute.return_value = {'result': {'outerHTML': '<div class="internal">Hello</div>'}}

        markup = await shadow_root.inner_html

        assert markup == '<div class="internal">Hello</div>'
        execute.assert_called_once()

    @pytest.mark.asyncio
    async def test_inner_html_empty(self, shadow_root):
        """An empty ``outerHTML`` yields an empty string."""
        execute = shadow_root._connection_handler.execute_command
        execute.return_value = {'result': {'outerHTML': ''}}

        markup = await shadow_root.inner_html

        assert markup == ''


class TestShadowRootRepr:
    """``repr()`` and ``str()`` output of ShadowRoot."""

    def test_repr(self, shadow_root):
        """``repr`` mentions the class name, the mode and the object id."""
        text = repr(shadow_root)
        for fragment in ('ShadowRoot', 'open', 'shadow-root-object-id'):
            assert fragment in text

    def test_str(self, shadow_root):
        """``str`` of an open shadow root is the short ``ShadowRoot(open)``."""
        assert str(shadow_root) == 'ShadowRoot(open)'

    def test_str_closed(self, mock_connection_handler):
        """``str`` reflects the closed mode."""
        closed_root = ShadowRoot(
            object_id='sr-id',
            connection_handler=mock_connection_handler,
            mode=ShadowRootType.CLOSED,
        )
        text = str(closed_root)
        assert text == 'ShadowRoot(closed)'


class TestShadowRootFindElements:
    """Element lookup inside a shadow root: only CSS ``query()`` is supported."""

    @pytest.mark.asyncio
    async def test_find_raises_not_implemented(self, shadow_root):
        """find() should raise NotImplementedError on ShadowRoot."""
        expected_message = 'find\\(\\) is not supported on ShadowRoot'
        with pytest.raises(NotImplementedError, match=expected_message):
            await shadow_root.find(class_name='btn-primary')

    @pytest.mark.asyncio
    async def test_query_xpath_raises_not_implemented(self, shadow_root):
        """query() with XPath should raise NotImplementedError on ShadowRoot."""
        expected_message = 'XPath is not supported on ShadowRoot'
        with pytest.raises(NotImplementedError, match=expected_message):
            await shadow_root.query('.//button')

    @pytest.mark.asyncio
    async def test_query_css_in_shadow_root(self, shadow_root):
        """query() should work with CSS selectors inside shadow root."""
        # Two canned responses, consumed in order by the two commands issued.
        shadow_root._connection_handler.execute_command.side_effect = [
            {'result': {'result': {'objectId': 'queried-element-id'}}},
            {
                'result': {
                    'node': {
                        'nodeName': 'INPUT',
                        'attributes': ['type', 'email', 'name', 'user-email'],
                    }
                }
            },
        ]

        found = await shadow_root.query('input[type="email"]')

        assert isinstance(found, WebElement)
        assert found._object_id == 'queried-element-id'


class TestWebElementGetShadowRoot:
    """Tests for WebElement.get_shadow_root()."""

    @staticmethod
    def _describe_response(attributes, shadow_roots=None):
        """Build a canned describe-node response for a DIV host.

        The ``shadowRoots`` key is only present when *shadow_roots* is not
        None, so both "key absent" and "empty list" can be expressed.
        """
        node = {'nodeName': 'DIV', 'attributes': attributes}
        if shadow_roots is not None:
            node['shadowRoots'] = shadow_roots
        return {'result': {'node': node}}

    @staticmethod
    def _resolve_response(object_id):
        """Build a canned resolve-node response carrying *object_id*."""
        return {'result': {'object': {'objectId': object_id}}}

    @pytest.mark.asyncio
    async def test_get_shadow_root_success(self, host_element):
        """get_shadow_root() should return ShadowRoot when shadow root exists."""
        host_element._connection_handler.execute_command.side_effect = [
            self._describe_response(
                ['id', 'host'],
                [{'backendNodeId': 42, 'shadowRootType': 'open'}],
            ),
            self._resolve_response('shadow-root-resolved-id'),
        ]

        shadow_root = await host_element.get_shadow_root()

        assert isinstance(shadow_root, ShadowRoot)
        assert shadow_root._object_id == 'shadow-root-resolved-id'
        assert shadow_root.mode == ShadowRootType.OPEN
        assert shadow_root.host_element is host_element

    @pytest.mark.asyncio
    async def test_get_shadow_root_closed_mode(self, host_element):
        """get_shadow_root() should handle closed shadow roots."""
        host_element._connection_handler.execute_command.side_effect = [
            self._describe_response(
                [],
                [{'backendNodeId': 99, 'shadowRootType': 'closed'}],
            ),
            self._resolve_response('closed-shadow-id'),
        ]

        shadow_root = await host_element.get_shadow_root()

        assert shadow_root.mode == ShadowRootType.CLOSED

    @pytest.mark.asyncio
    async def test_get_shadow_root_not_found(self, host_element):
        """get_shadow_root() should raise ShadowRootNotFound when no shadow root."""
        # The node description has no ``shadowRoots`` key at all.
        host_element._connection_handler.execute_command.return_value = (
            self._describe_response(['id', 'no-shadow'])
        )

        with pytest.raises(ShadowRootNotFound):
            await host_element.get_shadow_root()

    @pytest.mark.asyncio
    async def test_get_shadow_root_empty_shadow_roots_list(self, host_element):
        """get_shadow_root() should raise when shadowRoots is empty list."""
        host_element._connection_handler.execute_command.return_value = (
            self._describe_response([], [])
        )

        with pytest.raises(ShadowRootNotFound):
            await host_element.get_shadow_root()

    @pytest.mark.asyncio
    async def test_get_shadow_root_no_node_id(self, host_element):
        """get_shadow_root() should raise when the shadow root has no backendNodeId.

        The shadow root entry carries only its type. The passing cases in this
        class supply ``backendNodeId`` and never ``nodeId``, so the identifier
        whose absence is exercised here is ``backendNodeId``.
        """
        host_element._connection_handler.execute_command.return_value = (
            self._describe_response([], [{'shadowRootType': 'open'}])
        )

        with pytest.raises(ShadowRootNotFound):
            await host_element.get_shadow_root()


# --- Tab.find_shadow_roots() tests ---


@pytest_asyncio.fixture
async def tab_connection_handler():
    """Yield a patched ConnectionHandler instance configured for Tab tests.

    The async entry points are replaced with ``AsyncMock`` objects and the
    plain attributes set below are given fixed values.
    """
    async_method_names = (
        'execute_command',
        'register_callback',
        'remove_callback',
        'clear_callbacks',
    )
    with patch('pydoll.connection.ConnectionHandler', autospec=True) as handler_cls:
        fake_handler = handler_cls.return_value
        for method_name in async_method_names:
            setattr(fake_handler, method_name, AsyncMock())
        fake_handler.network_logs = []
        fake_handler.dialog = None
        fake_handler._connection_port = 9222
        yield fake_handler


@pytest_asyncio.fixture
async def tab(tab_connection_handler):
    """Build a Tab whose ConnectionHandler is the mocked handler fixture.

    ``pydoll.browser.tab.ConnectionHandler`` is patched only while the Tab is
    being constructed. Each Tab gets a distinct random target id.
    """
    fake_browser = MagicMock(options=MagicMock())
    target_id = f'test-target-{uuid.uuid4().hex[:8]}'
    handler_patch = patch(
        'pydoll.browser.tab.ConnectionHandler',
        return_value=tab_connection_handler,
    )
    with handler_patch:
        return Tab(browser=fake_browser, connection_port=9222, target_id=target_id)


class TestTabFindShadowRoots:
    """Tests for Tab.find_shadow_roots()."""

    # --- builders for the canned command responses used below ---

    @staticmethod
    def _document(*children):
        """Wrap *children* in a document-tree response rooted at ``#document``."""
        return {
            'result': {
                'root': {
                    'nodeId': 1,
                    'backendNodeId': 1,
                    'nodeName': '#document',
                    'children': list(children),
                }
            }
        }

    @staticmethod
    def _node(node_id, backend_id, name, **extra):
        """Build a DOM node dict; *extra* adds keys such as ``children``."""
        return {'nodeId': node_id, 'backendNodeId': backend_id, 'nodeName': name, **extra}

    @staticmethod
    def _shadow(node_id, backend_id, mode, children=()):
        """Build a shadow-root node dict of the given *mode*."""
        return {
            'nodeId': node_id,
            'backendNodeId': backend_id,
            'shadowRootType': mode,
            'children': list(children),
        }

    @staticmethod
    def _resolved(object_id):
        """Build a response that resolves a node to *object_id*."""
        return {'result': {'object': {'objectId': object_id}}}

    @staticmethod
    def _described(name, attributes):
        """Build a response describing a node by name and attribute list."""
        return {'result': {'node': {'nodeName': name, 'attributes': attributes}}}

    # --- tests ---

    @pytest.mark.asyncio
    async def test_find_shadow_roots_single(self, tab):
        """Should return a single shadow root found in the page."""
        host = self._node(
            4, 10, 'DIV',
            attributes=['id', 'host'],
            shadowRoots=[self._shadow(5, 20, 'open')],
        )
        body = self._node(3, 3, 'BODY', children=[host])
        html = self._node(2, 2, 'HTML', children=[body])
        tab._connection_handler.execute_command.side_effect = [
            self._document(html),
            self._resolved('shadow-obj-1'),
            self._resolved('host-obj-1'),
            self._described('DIV', ['id', 'host']),
        ]

        roots = await tab.find_shadow_roots()

        assert len(roots) == 1
        only_root = roots[0]
        assert isinstance(only_root, ShadowRoot)
        assert only_root._object_id == 'shadow-obj-1'
        assert only_root.mode == ShadowRootType.OPEN
        assert only_root.host_element is not None
        assert only_root.host_element._object_id == 'host-obj-1'

    @pytest.mark.asyncio
    async def test_find_shadow_roots_none_found(self, tab):
        """Should return empty list when no shadow roots exist."""
        html = self._node(2, 2, 'HTML', children=[])
        tab._connection_handler.execute_command.return_value = self._document(html)

        roots = await tab.find_shadow_roots()

        assert roots == []

    @pytest.mark.asyncio
    async def test_find_shadow_roots_multiple(self, tab):
        """Should return multiple shadow roots at different depths."""
        open_host = self._node(3, 10, 'DIV', shadowRoots=[self._shadow(4, 20, 'open')])
        closed_host = self._node(
            5, 11, 'CUSTOM-ELEMENT', shadowRoots=[self._shadow(6, 30, 'closed')]
        )
        html = self._node(2, 2, 'HTML', children=[open_host, closed_host])
        tab._connection_handler.execute_command.side_effect = [
            self._document(html),
            self._resolved('shadow-obj-1'),
            self._resolved('host-obj-1'),
            self._described('DIV', ['id', 'host1']),
            self._resolved('shadow-obj-2'),
            self._resolved('host-obj-2'),
            self._described('CUSTOM-ELEMENT', []),
        ]

        roots = await tab.find_shadow_roots()

        assert len(roots) == 2
        assert roots[0].mode == ShadowRootType.OPEN
        assert roots[1].mode == ShadowRootType.CLOSED

    @pytest.mark.asyncio
    async def test_find_shadow_roots_nested_in_shadow_root(self, tab):
        """Should find shadow roots nested inside other shadow roots."""
        inner_host = self._node(
            4, 11, 'INNER-HOST', shadowRoots=[self._shadow(5, 30, 'closed')]
        )
        outer_host = self._node(
            2, 10, 'DIV', shadowRoots=[self._shadow(3, 20, 'open', [inner_host])]
        )
        tab._connection_handler.execute_command.side_effect = [
            self._document(outer_host),
            self._resolved('shadow-outer'),
            self._resolved('host-outer'),
            self._described('DIV', []),
            self._resolved('shadow-inner'),
            self._resolved('host-inner'),
            self._described('INNER-HOST', []),
        ]

        roots = await tab.find_shadow_roots()

        assert len(roots) == 2
        assert roots[0]._object_id == 'shadow-outer'
        assert roots[1]._object_id == 'shadow-inner'

    @pytest.mark.asyncio
    async def test_find_shadow_roots_in_iframe(self, tab):
        """Should find shadow roots inside iframe content documents."""
        frame_body = self._node(5, 15, 'BODY', shadowRoots=[self._shadow(6, 25, 'closed')])
        frame_document = self._node(4, 4, '#document', children=[frame_body])
        iframe = self._node(3, 3, 'IFRAME', contentDocument=frame_document)
        html = self._node(2, 2, 'HTML', children=[iframe])
        tab._connection_handler.execute_command.side_effect = [
            self._document(html),
            self._resolved('iframe-shadow-obj'),
            self._resolved('iframe-host-obj'),
            self._described('BODY', []),
        ]

        roots = await tab.find_shadow_roots()

        assert len(roots) == 1
        assert roots[0]._object_id == 'iframe-shadow-obj'
        assert roots[0].mode == ShadowRootType.CLOSED

    @pytest.mark.asyncio
    async def test_find_shadow_roots_skips_unresolvable(self, tab):
        """Should skip shadow roots that fail to resolve."""
        resolvable_host = self._node(2, 10, 'DIV', shadowRoots=[self._shadow(3, 20, 'open')])
        failing_host = self._node(4, 11, 'OTHER', shadowRoots=[self._shadow(5, 30, 'open')])
        tab._connection_handler.execute_command.side_effect = [
            self._document(resolvable_host, failing_host),
            self._resolved('shadow-ok'),
            self._resolved('host-ok'),
            self._described('DIV', []),
            # The next command issued after the first root is handled times out.
            CommandExecutionTimeout(),
        ]

        roots = await tab.find_shadow_roots()

        assert len(roots) == 1
        assert roots[0]._object_id == 'shadow-ok'

    @pytest.mark.asyncio
    async def test_find_shadow_roots_host_resolution_fails_gracefully(self, tab):
        """Shadow root should still be returned when host resolution fails."""
        host = self._node(2, 10, 'DIV', shadowRoots=[self._shadow(3, 20, 'open')])
        tab._connection_handler.execute_command.side_effect = [
            self._document(host),
            self._resolved('shadow-obj'),
            # The command following the shadow root resolution times out.
            CommandExecutionTimeout(),
        ]

        roots = await tab.find_shadow_roots()

        assert len(roots) == 1
        assert roots[0]._object_id == 'shadow-obj'
        assert roots[0].host_element is None

    @pytest.mark.asyncio
    async def test_find_shadow_roots_skips_missing_backend_id(self, tab):
        """Should skip shadow roots without backendNodeId."""
        # Written out by hand: this shadow root deliberately carries no ids.
        idless_shadow = {'shadowRootType': 'open', 'children': []}
        host = self._node(2, 10, 'DIV', shadowRoots=[idless_shadow])
        tab._connection_handler.execute_command.return_value = self._document(host)

        roots = await tab.find_shadow_roots()

        assert roots == []


class TestCollectShadowRootsFromTree:
    """Tests for the _collect_shadow_roots_from_tree static helper."""

    @staticmethod
    def _collect(tree):
        """Run the helper on *tree* and return the list it filled in."""
        collected = []
        Tab._collect_shadow_roots_from_tree(tree, collected)
        return collected

    def test_empty_tree(self):
        """An empty node dict yields nothing."""
        assert self._collect({}) == []

    def test_no_shadow_roots(self):
        """A tree without any ``shadowRoots`` key yields nothing."""
        child = {'nodeId': 2, 'backendNodeId': 2}
        tree = {'nodeId': 1, 'backendNodeId': 1, 'children': [child]}

        assert self._collect(tree) == []

    def test_collects_shadow_root(self):
        """A shadow root is reported with its host's ``backendNodeId``."""
        shadow = {'backendNodeId': 20, 'shadowRootType': 'open', 'children': []}
        tree = {'backendNodeId': 10, 'shadowRoots': [shadow]}

        collected = self._collect(tree)

        assert len(collected) == 1
        assert collected[0] == (shadow, 10)

    def test_collects_from_content_document(self):
        """Shadow roots under an iframe's ``contentDocument`` are found."""
        shadow = {'backendNodeId': 30, 'shadowRootType': 'closed', 'children': []}
        frame_host = {'backendNodeId': 15, 'shadowRoots': [shadow]}
        frame_document = {'backendNodeId': 3, 'children': [frame_host]}
        iframe = {
            'backendNodeId': 2,
            'nodeName': 'IFRAME',
            'contentDocument': frame_document,
        }
        tree = {'backendNodeId': 1, 'children': [iframe]}

        collected = self._collect(tree)

        assert len(collected) == 1
        assert collected[0] == (shadow, 15)

    def test_collects_nested_shadow_roots(self):
        """A shadow root nested in another is reported after the outer one."""
        inner_shadow = {'backendNodeId': 40, 'shadowRootType': 'closed', 'children': []}
        inner_host = {'backendNodeId': 30, 'shadowRoots': [inner_shadow]}
        outer_shadow = {
            'backendNodeId': 20,
            'shadowRootType': 'open',
            'children': [inner_host],
        }
        tree = {'backendNodeId': 10, 'shadowRoots': [outer_shadow]}

        collected = self._collect(tree)

        assert len(collected) == 2
        assert collected[0] == (outer_shadow, 10)
        assert collected[1] == (inner_shadow, 30)


class TestTabFindShadowRootsDeep:
    """Tests for Tab.find_shadow_roots(deep=True) — OOPIF traversal."""

    # Patch target for the browser-level handler created during OOPIF traversal.
    _HANDLER_PATH = 'pydoll.browser.tab.ConnectionHandler'

    # --- builders for the canned CDP responses fed to the mocks ---

    @staticmethod
    def _document(root_backend_id=1, children=()):
        """Build a DOM.getDocument response whose root holds ``children``."""
        return {
            'result': {
                'root': {
                    'nodeId': 1,
                    'backendNodeId': root_backend_id,
                    'nodeName': '#document',
                    'children': list(children),
                }
            }
        }

    @staticmethod
    def _shadow_host(host_backend_id, node_name, shadow_backend_id, shadow_type):
        """Build an element node that hosts a single, empty shadow root."""
        return {
            'nodeId': 2,
            'backendNodeId': host_backend_id,
            'nodeName': node_name,
            'shadowRoots': [
                {
                    'nodeId': 3,
                    'backendNodeId': shadow_backend_id,
                    'shadowRootType': shadow_type,
                    'children': [],
                }
            ],
        }

    @staticmethod
    def _resolved(object_id):
        """Build a DOM.resolveNode response carrying ``object_id``."""
        return {'result': {'object': {'objectId': object_id}}}

    @staticmethod
    def _described(node_name, attributes):
        """Build a DOM.describeNode response for a host element."""
        return {'result': {'node': {'nodeName': node_name, 'attributes': attributes}}}

    @staticmethod
    def _iframe_targets(*targets):
        """Build a Target.getTargets response from ``(target_id, url)`` pairs."""
        infos = [
            {'targetId': target_id, 'type': 'iframe', 'url': url}
            for target_id, url in targets
        ]
        return {'result': {'targetInfos': infos}}

    @staticmethod
    def _attached(session_id):
        """Build a Target.attachToTarget response."""
        return {'result': {'sessionId': session_id}}

    @staticmethod
    def _scripted_handler(responses):
        """Return a mock handler whose execute_command yields ``responses`` in order."""
        handler = AsyncMock()
        handler.execute_command = AsyncMock(side_effect=responses)
        return handler

    # --- tests ---

    @pytest.mark.asyncio
    async def test_deep_false_same_as_default(self, tab):
        """deep=False should behave identically to the default (no OOPIF traversal)."""
        tab._connection_handler.execute_command.side_effect = [
            self._document(children=[self._shadow_host(10, 'DIV', 20, 'open')]),
            self._resolved('shadow-obj-1'),
            self._resolved('host-obj-1'),
            self._described('DIV', ['id', 'host']),
        ]

        found = await tab.find_shadow_roots(deep=False)

        assert len(found) == 1
        assert found[0]._object_id == 'shadow-obj-1'

    @pytest.mark.asyncio
    async def test_deep_collects_oopif_shadow_roots(self, tab):
        """deep=True should discover shadow roots inside OOPIF targets."""
        # The main document contributes no shadow roots.
        tab._connection_handler.execute_command.return_value = self._document()

        # Stand-in for the browser-level ConnectionHandler used for OOPIF traversal.
        browser_handler = self._scripted_handler([
            self._iframe_targets(('oopif-1', 'https://cf.example.com')),
            self._attached('session-1'),
            # DOM.getDocument inside the OOPIF
            self._document(100, [self._shadow_host(200, 'BODY', 300, 'closed')]),
            # DOM.resolveNode for the shadow root, then for its host
            self._resolved('oopif-shadow-obj'),
            self._resolved('oopif-host-obj'),
            # DOM.describeNode for the host attributes
            self._described('BODY', []),
        ])

        with patch(self._HANDLER_PATH, return_value=browser_handler):
            found = await tab.find_shadow_roots(deep=True)

        assert len(found) == 1
        shadow_root = found[0]
        assert shadow_root._object_id == 'oopif-shadow-obj'
        assert shadow_root.mode == ShadowRootType.CLOSED
        assert shadow_root.host_element is not None
        assert shadow_root.host_element._object_id == 'oopif-host-obj'

    @pytest.mark.asyncio
    async def test_deep_no_oopif_targets(self, tab):
        """deep=True with no iframe targets returns only main-doc roots."""
        tab._connection_handler.execute_command.return_value = self._document()

        # Every browser-level call answers with an empty target list.
        browser_handler = AsyncMock()
        browser_handler.execute_command = AsyncMock(return_value=self._iframe_targets())

        with patch(self._HANDLER_PATH, return_value=browser_handler):
            found = await tab.find_shadow_roots(deep=True)

        assert found == []

    @pytest.mark.asyncio
    async def test_deep_oopif_attachment_fails_gracefully(self, tab):
        """When an OOPIF target fails to attach, others should still be collected."""
        tab._connection_handler.execute_command.return_value = self._document()

        browser_handler = self._scripted_handler([
            # Two iframe targets are reported.
            self._iframe_targets(
                ('fail-target', 'https://a.com'),
                ('ok-target', 'https://b.com'),
            ),
            # Attaching to the first target raises.
            WebSocketConnectionClosed(),
            # Attaching to the second target succeeds.
            self._attached('session-ok'),
            self._document(50, [self._shadow_host(60, 'DIV', 70, 'open')]),
            self._resolved('sr-from-ok-target'),
            self._resolved('host-from-ok-target'),
            self._described('DIV', ['id', 'widget']),
        ])

        with patch(self._HANDLER_PATH, return_value=browser_handler):
            found = await tab.find_shadow_roots(deep=True)

        assert len(found) == 1
        assert found[0]._object_id == 'sr-from-ok-target'

    @pytest.mark.asyncio
    async def test_deep_oopif_shadow_root_has_routing_context(self, tab):
        """ShadowRoot from OOPIF should have _iframe_context with correct routing."""
        tab._connection_handler.execute_command.return_value = self._document()

        browser_handler = self._scripted_handler([
            self._iframe_targets(('oopif-42', 'https://cf.example.com')),
            self._attached('sess-42'),
            self._document(100, [self._shadow_host(200, 'DIV', 300, 'closed')]),
            self._resolved('sr-obj-42'),
            self._resolved('host-obj-42'),
            self._described('DIV', ['class', 'turnstile']),
        ])

        with patch(self._HANDLER_PATH, return_value=browser_handler):
            found = await tab.find_shadow_roots(deep=True)

        assert len(found) == 1
        shadow_root = found[0]

        # The routing context must point at the OOPIF target, session and handler.
        context = getattr(shadow_root, '_iframe_context', None)
        assert context is not None
        assert isinstance(context, IFrameContext)
        assert context.frame_id == 'oopif-42'
        assert context.session_id == 'sess-42'
        assert context.session_handler is browser_handler

    @pytest.mark.asyncio
    async def test_deep_combines_main_and_oopif_roots(self, tab):
        """deep=True should return both main-doc and OOPIF shadow roots."""
        # Main document: one open shadow root.
        tab._connection_handler.execute_command.side_effect = [
            self._document(children=[self._shadow_host(10, 'DIV', 20, 'open')]),
            self._resolved('main-shadow'),
            self._resolved('main-host'),
            self._described('DIV', ['id', 'main']),
        ]

        # OOPIF: one closed shadow root.
        browser_handler = self._scripted_handler([
            self._iframe_targets(('oopif-1', 'https://cf.example.com')),
            self._attached('session-1'),
            self._document(50, [self._shadow_host(60, 'BODY', 70, 'closed')]),
            self._resolved('oopif-shadow'),
            self._resolved('oopif-host'),
            self._described('BODY', []),
        ])

        with patch(self._HANDLER_PATH, return_value=browser_handler):
            found = await tab.find_shadow_roots(deep=True)

        assert len(found) == 2
        main_root, oopif_root = found[0], found[1]
        assert main_root._object_id == 'main-shadow'
        assert main_root.mode == ShadowRootType.OPEN
        assert oopif_root._object_id == 'oopif-shadow'
        assert oopif_root.mode == ShadowRootType.CLOSED

    @pytest.mark.asyncio
    async def test_deep_oopif_no_host_sets_iframe_context_on_shadow_root(self, tab):
        """When host resolution fails, IFrameContext should be set directly on ShadowRoot."""
        tab._connection_handler.execute_command.return_value = self._document()

        browser_handler = self._scripted_handler([
            self._iframe_targets(('oopif-99', 'https://cf.example.com')),
            self._attached('sess-99'),
            self._document(100, [self._shadow_host(200, 'DIV', 300, 'open')]),
            # Resolving the shadow root succeeds...
            self._resolved('sr-obj-99'),
            # ...but resolving its host element raises.
            CommandExecutionTimeout(),
        ])

        with patch(self._HANDLER_PATH, return_value=browser_handler):
            found = await tab.find_shadow_roots(deep=True)

        assert len(found) == 1
        shadow_root = found[0]
        assert shadow_root.host_element is None
        # With no host available, the context is expected on the shadow root itself.
        context = getattr(shadow_root, '_iframe_context', None)
        assert context is not None
        assert context.frame_id == 'oopif-99'
        assert context.session_id == 'sess-99'


class TestTabFindShadowRootsTimeout:
    """Tests for Tab.find_shadow_roots(timeout=...) — polling behavior."""

    # --- builders for the canned CDP responses fed to the mocks ---

    @staticmethod
    def _document(root_backend_id=1, children=()):
        """Build a DOM.getDocument response whose root holds ``children``."""
        return {
            'result': {
                'root': {
                    'nodeId': 1,
                    'backendNodeId': root_backend_id,
                    'nodeName': '#document',
                    'children': list(children),
                }
            }
        }

    @staticmethod
    def _shadow_host(host_backend_id, node_name, shadow_backend_id, shadow_type):
        """Build an element node that hosts a single, empty shadow root."""
        return {
            'nodeId': 2,
            'backendNodeId': host_backend_id,
            'nodeName': node_name,
            'shadowRoots': [
                {
                    'nodeId': 3,
                    'backendNodeId': shadow_backend_id,
                    'shadowRootType': shadow_type,
                    'children': [],
                }
            ],
        }

    @staticmethod
    def _resolved(object_id):
        """Build a DOM.resolveNode response carrying ``object_id``."""
        return {'result': {'object': {'objectId': object_id}}}

    @staticmethod
    def _described(node_name, attributes):
        """Build a DOM.describeNode response for a host element."""
        return {'result': {'node': {'nodeName': node_name, 'attributes': attributes}}}

    # --- tests ---

    @pytest.mark.asyncio
    async def test_timeout_zero_returns_immediately(self, tab):
        """timeout=0 (default) should return immediately without polling."""
        tab._connection_handler.execute_command.return_value = self._document()

        found = await tab.find_shadow_roots(timeout=0)

        assert found == []

    @pytest.mark.asyncio
    async def test_timeout_raises_when_no_shadow_roots_found(self, tab):
        """Should raise WaitElementTimeout when no shadow roots appear within timeout."""
        # Every poll sees the same empty document.
        tab._connection_handler.execute_command.return_value = self._document()

        with pytest.raises(WaitElementTimeout):
            await tab.find_shadow_roots(timeout=1)

    @pytest.mark.asyncio
    async def test_timeout_returns_when_shadow_roots_appear(self, tab):
        """Should return shadow roots as soon as they appear during polling."""
        tab._connection_handler.execute_command.side_effect = [
            # First poll: nothing there yet.
            self._document(),
            # Second poll: a host with an open shadow root shows up.
            self._document(children=[self._shadow_host(10, 'DIV', 20, 'open')]),
            # resolve shadow root, resolve host, describe host attributes
            self._resolved('shadow-obj'),
            self._resolved('host-obj'),
            self._described('DIV', ['id', 'host']),
        ]

        found = await tab.find_shadow_roots(timeout=5)

        assert len(found) == 1
        assert found[0]._object_id == 'shadow-obj'

    @pytest.mark.asyncio
    async def test_timeout_with_deep_waits_for_oopif_roots(self, tab):
        """timeout + deep=True should poll until OOPIF shadow roots appear."""
        tab._connection_handler.execute_command.return_value = self._document()

        # Browser-level replies, consumed one per call in this order.
        scripted = iter([
            # First cycle: no iframe targets.
            {'result': {'targetInfos': []}},
            # Second cycle: an iframe target appears.
            {
                'result': {
                    'targetInfos': [
                        {'targetId': 'oopif-1', 'type': 'iframe', 'url': 'https://cf.test'},
                    ]
                }
            },
            {'result': {'sessionId': 'sess-1'}},
            self._document(100, [self._shadow_host(200, 'BODY', 300, 'closed')]),
            self._resolved('oopif-sr-obj'),
            self._resolved('oopif-host-obj'),
            self._described('BODY', []),
        ])

        async def browser_side_effect(cmd, **kwargs):
            # Once the script is exhausted, any further call gets an empty reply.
            return next(scripted, {})

        browser_handler = AsyncMock()
        browser_handler.execute_command = AsyncMock(side_effect=browser_side_effect)

        with patch('pydoll.browser.tab.ConnectionHandler', return_value=browser_handler):
            found = await tab.find_shadow_roots(deep=True, timeout=5)

        assert len(found) == 1
        assert found[0]._object_id == 'oopif-sr-obj'
        assert found[0].mode == ShadowRootType.CLOSED


# --- WebElement.get_shadow_root(timeout=...) tests ---


class TestGetShadowRootTimeout:
    """Tests for WebElement.get_shadow_root(timeout=...) — polling behavior."""

    @staticmethod
    def _host_description(shadow_roots=None):
        """Build a DOM.describeNode response for the host element.

        The ``shadowRoots`` key is only present when ``shadow_roots`` is given.
        """
        node = {
            'nodeId': 1,
            'backendNodeId': 10,
            'nodeName': 'DIV',
        }
        if shadow_roots is not None:
            node['shadowRoots'] = shadow_roots
        return {'result': {'node': node}}

    @pytest.mark.asyncio
    async def test_timeout_zero_raises_immediately(self, mock_connection_handler):
        """timeout=0 (default) should raise ShadowRootNotFound immediately."""
        host = WebElement('elem-obj-1', mock_connection_handler)
        mock_connection_handler.execute_command.return_value = self._host_description()

        with pytest.raises(ShadowRootNotFound):
            await host.get_shadow_root()

    @pytest.mark.asyncio
    async def test_timeout_raises_wait_element_timeout(self, mock_connection_handler):
        """Should raise WaitElementTimeout when shadow root doesn't appear within timeout."""
        host = WebElement('elem-obj-1', mock_connection_handler)
        # Every poll describes a host without any shadow root.
        mock_connection_handler.execute_command.return_value = self._host_description()

        with pytest.raises(WaitElementTimeout):
            await host.get_shadow_root(timeout=1)

    @pytest.mark.asyncio
    async def test_timeout_returns_when_shadow_root_appears(self, mock_connection_handler):
        """Should return the shadow root as soon as it appears during polling."""
        host = WebElement('elem-obj-1', mock_connection_handler)
        closed_root = {
            'nodeId': 2,
            'backendNodeId': 20,
            'shadowRootType': 'closed',
        }
        mock_connection_handler.execute_command.side_effect = [
            # First poll: no shadow root on the host.
            self._host_description(),
            # Second poll: the shadow root is now attached.
            self._host_description(shadow_roots=[closed_root]),
            # Resolving the shadow root node.
            {'result': {'object': {'objectId': 'sr-delayed'}}},
        ]

        shadow_root = await host.get_shadow_root(timeout=5)

        assert shadow_root._object_id == 'sr-delayed'
        assert shadow_root.mode == ShadowRootType.CLOSED
        assert shadow_root.host_element is host


================================================
FILE: tests/test_shadow_root_integration.py
================================================
"""Integration tests for Shadow DOM support (open, closed, nested)."""

import asyncio
from pathlib import Path

import pytest

from pydoll.browser.chromium import Chrome
from pydoll.elements.shadow_root import ShadowRoot
from pydoll.elements.web_element import WebElement
from pydoll.exceptions import ShadowRootNotFound
from pydoll.protocol.dom.types import ShadowRootType

# URL of the local HTML fixture used by every test in this module.
# Path.as_uri() is used instead of string interpolation so the result is a valid
# file URI on every platform (drive letters on Windows, percent-encoded spaces).
TEST_PAGE = (Path(__file__).parent / 'pages' / 'shadow_dom_test.html').absolute().as_uri()


class TestOpenShadowRoot:
    """Tests for open shadow root access and element finding."""

    @staticmethod
    async def _open_host_and_shadow(browser):
        """Load the test page and return ``(host, shadow_root)`` for ``#open-host``."""
        tab = await browser.start()
        await tab.go_to(TEST_PAGE)
        await asyncio.sleep(0.5)

        host = await tab.find(id='open-host')
        return host, await host.get_shadow_root()

    @pytest.mark.asyncio
    async def test_get_shadow_root_open(self, ci_chrome_options):
        """get_shadow_root() yields an OPEN ShadowRoot bound to its host element."""
        async with Chrome(options=ci_chrome_options) as browser:
            host, shadow_root = await self._open_host_and_shadow(browser)

            assert isinstance(shadow_root, ShadowRoot)
            assert shadow_root.mode == ShadowRootType.OPEN
            assert shadow_root.host_element is host

    @pytest.mark.asyncio
    async def test_find_elements_in_open_shadow(self, ci_chrome_options):
        """Elements inside the open shadow root are reachable by class and by id."""
        async with Chrome(options=ci_chrome_options) as browser:
            _, shadow_root = await self._open_host_and_shadow(browser)

            paragraph = await shadow_root.query('.open-text')
            assert isinstance(paragraph, WebElement)
            content = await paragraph.text
            assert content == 'Open shadow content'

            button = await shadow_root.query('#open-btn')
            assert button is not None

    @pytest.mark.asyncio
    async def test_query_in_open_shadow(self, ci_chrome_options):
        """An attribute selector resolves inside the open shadow root."""
        async with Chrome(options=ci_chrome_options) as browser:
            _, shadow_root = await self._open_host_and_shadow(browser)

            email_input = await shadow_root.query('input[type="email"]')
            assert email_input is not None

    @pytest.mark.asyncio
    async def test_find_all_in_open_shadow(self, ci_chrome_options):
        """query(find_all=True) returns every match inside the open shadow root."""
        async with Chrome(options=ci_chrome_options) as browser:
            _, shadow_root = await self._open_host_and_shadow(browser)

            matches = await shadow_root.query('.shadow-btn', find_all=True)
            assert len(matches) == 1

    @pytest.mark.asyncio
    async def test_inner_html_open(self, ci_chrome_options):
        """inner_html exposes the markup of the open shadow root."""
        async with Chrome(options=ci_chrome_options) as browser:
            _, shadow_root = await self._open_host_and_shadow(browser)

            markup = await shadow_root.inner_html
            assert 'Open shadow content' in markup


class TestClosedShadowRoot:
    """Tests for closed shadow root access via CDP bypass."""

    @staticmethod
    async def _closed_shadow(browser):
        """Load the test page and return the shadow root of ``#closed-host``."""
        tab = await browser.start()
        await tab.go_to(TEST_PAGE)
        await asyncio.sleep(0.5)

        host = await tab.find(id='closed-host')
        return await host.get_shadow_root()

    @pytest.mark.asyncio
    async def test_get_shadow_root_closed(self, ci_chrome_options):
        """get_shadow_root() yields a ShadowRoot reporting CLOSED mode."""
        async with Chrome(options=ci_chrome_options) as browser:
            shadow_root = await self._closed_shadow(browser)

            assert isinstance(shadow_root, ShadowRoot)
            assert shadow_root.mode == ShadowRootType.CLOSED

    @pytest.mark.asyncio
    async def test_find_elements_in_closed_shadow(self, ci_chrome_options):
        """Text content inside the closed shadow root can be read."""
        async with Chrome(options=ci_chrome_options) as browser:
            shadow_root = await self._closed_shadow(browser)

            paragraph = await shadow_root.query('.closed-text')
            assert isinstance(paragraph, WebElement)
            content = await paragraph.text
            assert content == 'Closed shadow content'

    @pytest.mark.asyncio
    async def test_query_in_closed_shadow(self, ci_chrome_options):
        """Id and attribute selectors resolve inside the closed shadow root."""
        async with Chrome(options=ci_chrome_options) as browser:
            shadow_root = await self._closed_shadow(browser)

            button = await shadow_root.query('#closed-btn')
            assert button is not None

            password_input = await shadow_root.query('input[type="password"]')
            assert password_input is not None

    @pytest.mark.asyncio
    async def test_inner_html_closed(self, ci_chrome_options):
        """inner_html exposes the markup of the closed shadow root."""
        async with Chrome(options=ci_chrome_options) as browser:
            shadow_root = await self._closed_shadow(browser)

            markup = await shadow_root.inner_html
            assert 'Closed shadow content' in markup


class TestNestedShadowRoots:
    """Tests for nested shadow roots (open -> closed)."""

    @pytest.mark.asyncio
    async def test_nested_open_then_closed(self, ci_chrome_options):
        """Walk from an open outer shadow root into a closed inner one."""
        async with Chrome(options=ci_chrome_options) as browser:
            page = await browser.start()
            await page.go_to(TEST_PAGE)
            await asyncio.sleep(0.5)

            # Outer level: the shadow root attached to #nested-host is open.
            outer_host = await page.find(id='nested-host')
            outer_root = await outer_host.get_shadow_root()
            assert outer_root.mode == ShadowRootType.OPEN

            outer_label = await outer_root.query('.outer-text')
            assert await outer_label.text == 'Outer shadow'

            # Inner level: #inner-host lives inside the outer root and
            # carries a closed shadow root of its own.
            nested_host = await outer_root.query('#inner-host')
            inner_root = await nested_host.get_shadow_root()
            assert inner_root.mode == ShadowRootType.CLOSED

            inner_label = await inner_root.query('.inner-text')
            assert await inner_label.text == 'Inner closed shadow'

            assert await inner_root.query('#deep-btn') is not None


class TestShadowRootNotPresent:
    """Tests for elements without shadow roots."""

    @pytest.mark.asyncio
    async def test_no_shadow_root_raises(self, ci_chrome_options):
        """``get_shadow_root`` on the page's ``h1`` raises ``ShadowRootNotFound``."""
        async with Chrome(options=ci_chrome_options) as browser:
            page = await browser.start()
            await page.go_to(TEST_PAGE)
            await asyncio.sleep(0.5)

            heading = await page.find(tag_name='h1')
            with pytest.raises(ShadowRootNotFound):
                await heading.get_shadow_root()


================================================
FILE: tests/test_socks5_proxy_forwarder.py
================================================
"""Tests for pydoll.utils.socks5_proxy_forwarder."""

from __future__ import annotations

import asyncio
import logging
from unittest.mock import AsyncMock, MagicMock, patch

import pytest

from pydoll.utils.socks5_proxy_forwarder import (
    HANDSHAKE_TIMEOUT,
    REPLY_ADDRESS_TYPE_NOT_SUPPORTED,
    REPLY_COMMAND_NOT_SUPPORTED,
    REPLY_CONNECTION_REFUSED,
    REPLY_GENERAL_FAILURE,
    REPLY_SUCCESS,
    SOCKS5Forwarder,
    _close_writer,
    _HandshakeError,
    _pipe,
    _read_exact,
    _skip_bnd_address,
    _suppress_closed,
)


# ---------------------------------------------------------------------------
# Fixtures
# ---------------------------------------------------------------------------


@pytest.fixture
def forwarder():
    """Provide a ``SOCKS5Forwarder`` wired to a dummy upstream proxy.

    The instance is only constructed here; nothing is started.
    """
    settings = {
        'remote_host': 'proxy.example.com',
        'remote_port': 1080,
        'username': 'user',
        'password': 'pass',
        'local_host': '127.0.0.1',
        'local_port': 0,
    }
    return SOCKS5Forwarder(**settings)


@pytest.fixture
def mock_reader():
    """Provide an ``AsyncMock`` restricted to the ``asyncio.StreamReader`` API."""
    return AsyncMock(spec=asyncio.StreamReader)


@pytest.fixture
def mock_writer():
    """Provide a ``StreamWriter``-shaped mock with explicit sync/async methods.

    ``close`` and ``write`` are plain mocks; ``drain`` and ``wait_closed``
    are awaitable mocks.
    """
    stream = MagicMock(spec=asyncio.StreamWriter)
    for sync_name in ('close', 'write'):
        setattr(stream, sync_name, MagicMock())
    for async_name in ('drain', 'wait_closed'):
        setattr(stream, async_name, AsyncMock())
    return stream


# ---------------------------------------------------------------------------
# _suppress_closed
# ---------------------------------------------------------------------------


class TestSuppressClosed:
    """``_suppress_closed`` swallows OS-level errors and nothing else."""

    def test_suppresses_os_error(self):
        """A plain ``OSError`` raised inside the context does not escape."""
        failure = OSError('transport closed')
        with _suppress_closed():
            raise failure

    def test_suppresses_connection_reset(self):
        """``ConnectionResetError`` is swallowed as well."""
        failure = ConnectionResetError('reset')
        with _suppress_closed():
            raise failure

    def test_does_not_suppress_value_error(self):
        """Unrelated exception types propagate to the caller unchanged."""
        with pytest.raises(ValueError, match='not an os error'), _suppress_closed():
            raise ValueError('not an os error')

    def test_no_error_passes_through(self):
        """Entering and leaving without an exception is a no-op."""
        with _suppress_closed():
            pass  # nothing raised, nothing to suppress


# ---------------------------------------------------------------------------
# _HandshakeError
# ---------------------------------------------------------------------------


class TestHandshakeError:
    """Attribute defaults and overrides on ``_HandshakeError``."""

    def test_default_reply_code(self):
        """Without arguments the reply code is general failure; ``str`` is the message."""
        err = _HandshakeError('something failed')
        assert (err.reply_code, str(err)) == (REPLY_GENERAL_FAILURE, 'something failed')

    def test_custom_reply_code(self):
        """An explicit ``reply_code`` keyword is stored as given."""
        err = _HandshakeError('cmd not supported', reply_code=REPLY_COMMAND_NOT_SUPPORTED)
        assert err.reply_code == REPLY_COMMAND_NOT_SUPPORTED

    def test_connection_refused_reply_code(self):
        """The connection-refused code round-trips through the exception."""
        err = _HandshakeError('refused', reply_code=REPLY_CONNECTION_REFUSED)
        assert err.reply_code == REPLY_CONNECTION_REFUSED

    def test_send_reply_defaults_to_true(self):
        """``send_reply`` is ``True`` unless overridden."""
        assert _HandshakeError('fail').send_reply is True

    def test_send_reply_false(self):
        """``send_reply=False`` is preserved on the instance."""
        assert _HandshakeError('no auth', send_reply=False).send_reply is False


# ---------------------------------------------------------------------------
# _read_exact
# ---------------------------------------------------------------------------


class TestReadExact:
    """``_read_exact``: successful reads, premature EOF, and timeouts."""

    # Module attribute patched to a tiny value so timeout tests finish quickly.
    _TIMEOUT_ATTR = 'pydoll.utils.socks5_proxy_forwarder.HANDSHAKE_TIMEOUT'

    @staticmethod
    async def _stall(n):
        """``readexactly`` stand-in that sleeps far beyond the patched timeout."""
        await asyncio.sleep(999)

    @staticmethod
    def _eof(partial, expected):
        """Build a ``readexactly`` mock that fails with ``IncompleteReadError``."""
        return AsyncMock(
            side_effect=asyncio.IncompleteReadError(partial=partial, expected=expected)
        )

    @pytest.mark.asyncio
    async def test_returns_exact_bytes(self, mock_reader):
        """The bytes from ``readexactly`` are returned and the size is forwarded."""
        mock_reader.readexactly = AsyncMock(return_value=b'\x05\x01')
        received = await _read_exact(mock_reader, 2)
        assert received == b'\x05\x01'
        mock_reader.readexactly.assert_awaited_once_with(2)

    @pytest.mark.asyncio
    async def test_incomplete_read_raises_handshake_error(self, mock_reader):
        """A short read is converted into ``_HandshakeError``."""
        mock_reader.readexactly = self._eof(b'\x05', 2)
        with pytest.raises(_HandshakeError, match='Connection closed prematurely'):
            await _read_exact(mock_reader, 2)

    @pytest.mark.asyncio
    async def test_incomplete_read_has_general_failure_code(self, mock_reader):
        """The error raised for a short read carries the general-failure code."""
        mock_reader.readexactly = self._eof(b'', 4)
        with pytest.raises(_HandshakeError) as caught:
            await _read_exact(mock_reader, 4)
        assert caught.value.reply_code == REPLY_GENERAL_FAILURE

    @pytest.mark.asyncio
    async def test_timeout_raises_handshake_error(self, mock_reader):
        """A read that never completes surfaces as a timeout ``_HandshakeError``."""
        mock_reader.readexactly = self._stall

        shortened = patch(self._TIMEOUT_ATTR, 0.01)
        with shortened, pytest.raises(_HandshakeError, match='Timed out reading'):
            await _read_exact(mock_reader, 2)

    @pytest.mark.asyncio
    async def test_timeout_has_general_failure_code(self, mock_reader):
        """The timeout error carries the general-failure code."""
        mock_reader.readexactly = self._stall

        shortened = patch(self._TIMEOUT_ATTR, 0.01)
        with shortened, pytest.raises(_HandshakeError) as caught:
            await _read_exact(mock_reader, 2)
        assert caught.value.reply_code == REPLY_GENERAL_FAILURE

    @pytest.mark.asyncio
    async def test_peer_label_in_timeout_message(self, mock_reader):
        """The ``peer`` label shows up in the timeout message."""
        mock_reader.readexactly = self._stall

        shortened = patch(self._TIMEOUT_ATTR, 0.01)
        with shortened, pytest.raises(_HandshakeError, match='from remote proxy'):
            await _read_exact(mock_reader, 2, peer='remote proxy')

    @pytest.mark.asyncio
    async def test_peer_label_in_incomplete_read_message(self, mock_reader):
        """The ``peer`` label shows up in the premature-EOF message."""
        mock_reader.readexactly = self._eof(b'\x05', 4)
        with pytest.raises(_HandshakeError, match='from client'):
            await _read_exact(mock_reader, 4, peer='client')


# ---------------------------------------------------------------------------
# _skip_bnd_address (uses _read_exact, not raw readexactly)
# ---------------------------------------------------------------------------


class TestSkipBndAddress:
    """``_skip_bnd_address`` consumes the right number of bytes per address type."""

    @pytest.mark.asyncio
    async def test_ipv4(self, mock_reader):
        """Address type 0x01 results in a single 6-byte read."""
        mock_reader.readexactly = AsyncMock(return_value=bytes(6))
        await _skip_bnd_address(mock_reader, 0x01)
        mock_reader.readexactly.assert_awaited_once_with(6)

    @pytest.mark.asyncio
    async def test_domain(self, mock_reader):
        """Address type 0x03 results in two reads (length byte, then the rest)."""
        scripted = [b'\x0b', bytes(13)]
        requested = []

        async def fake_readexactly(n):
            # Record each request, then serve the chunk at that position.
            requested.append(n)
            return scripted[len(requested) - 1]

        mock_reader.readexactly = fake_readexactly
        await _skip_bnd_address(mock_reader, 0x03)
        assert len(requested) == 2

    @pytest.mark.asyncio
    async def test_ipv6(self, mock_reader):
        """Address type 0x04 results in a single 18-byte read."""
        mock_reader.readexactly = AsyncMock(return_value=bytes(18))
        await _skip_bnd_address(mock_reader, 0x04)
        mock_reader.readexactly.assert_awaited_once_with(18)

    @pytest.mark.asyncio
    async def test_incomplete_read_propagates(self, mock_reader):
        """A short read while skipping surfaces as ``_HandshakeError``."""
        short_read = asyncio.IncompleteReadError(partial=b'', expected=6)
        mock_reader.readexactly = AsyncMock(side_effect=short_read)
        with pytest.raises(_HandshakeError, match='Connection closed prematurely'):
            await _skip_bnd_address(mock_reader, 0x01)


# ---------------------------------------------------------------------------
# _close_writer
# ---------------------------------------------------------------------------


class TestCloseWriter:
    """``_close_writer`` closes the stream and tolerates ``OSError`` while doing so."""

    @staticmethod
    def _writer(close=None, wait_closed=None):
        """Build a writer mock; ``None`` means a default well-behaved method."""
        stream = MagicMock(spec=asyncio.StreamWriter)
        stream.close = MagicMock() if close is None else close
        stream.wait_closed = AsyncMock() if wait_closed is None else wait_closed
        return stream

    @pytest.mark.asyncio
    async def test_calls_close_and_wait_closed(self, mock_writer):
        """Both ``close()`` and ``wait_closed()`` are invoked exactly once."""
        await _close_writer(mock_writer)
        mock_writer.close.assert_called_once()
        mock_writer.wait_closed.assert_awaited_once()

    @pytest.mark.asyncio
    async def test_suppresses_os_error_on_close(self):
        """An ``OSError`` from ``close()`` must not escape."""
        failing_close = MagicMock(side_effect=OSError('already closed'))
        await _close_writer(self._writer(close=failing_close))

    @pytest.mark.asyncio
    async def test_suppresses_os_error_on_wait_closed(self):
        """An ``OSError`` from ``wait_closed()`` must not escape."""
        failing_wait = AsyncMock(side_effect=OSError('transport closed'))
        await _close_writer(self._writer(wait_closed=failing_wait))


# ---------------------------------------------------------------------------
# _pipe
# ---------------------------------------------------------------------------


class TestPipe:
    """``_pipe`` copies reader data to the writer and closes the writer afterwards."""

    @pytest.mark.asyncio
    async def test_forwards_data_until_eof(self, mock_reader, mock_writer):
        """Every non-empty chunk is written; the empty chunk ends the loop."""
        chunks = [b'hello', b'world', b'']
        mock_reader.read = AsyncMock(side_effect=chunks)
        await _pipe(mock_reader, mock_writer, 'test')
        assert mock_writer.write.call_count == 2
        for expected in (b'hello', b'world'):
            mock_writer.write.assert_any_call(expected)

    @pytest.mark.asyncio
    async def test_closes_writer_on_eof(self, mock_reader, mock_writer):
        """Immediate EOF still closes the writer and waits for it."""
        mock_reader.read = AsyncMock(return_value=b'')
        await _pipe(mock_reader, mock_writer, 'test')
        mock_writer.close.assert_called_once()
        mock_writer.wait_closed.assert_awaited_once()

    @pytest.mark.asyncio
    async def test_closes_writer_on_connection_reset(self, mock_reader, mock_writer):
        """A reset while reading is absorbed and the writer is closed."""
        mock_reader.read = AsyncMock(side_effect=ConnectionResetError)
        await _pipe(mock_reader, mock_writer, 'test')
        mock_writer.close.assert_called_once()


# ---------------------------------------------------------------------------
# SOCKS5Forwarder.__init__ — credential length validation
# ---------------------------------------------------------------------------


class TestCredentialValidation:
    """Constructor checks on the encoded length of username and password."""

    @staticmethod
    def _build(username, password):
        """Construct a forwarder with fixed remote settings and the given credentials."""
        return SOCKS5Forwarder(
            remote_host='host',
            remote_port=1080,
            username=username,
            password=password,
        )

    def test_valid_credentials(self):
        """Short credentials are stored unchanged."""
        fwd = self._build('user', 'pass')
        assert fwd.username == 'user'
        assert fwd.password == 'pass'

    def test_username_too_long(self):
        """A 256-character ASCII username is rejected."""
        with pytest.raises(ValueError, match='username must be at most 255 bytes'):
            self._build('a' * 256, 'pass')

    def test_password_too_long(self):
        """A 256-character ASCII password is rejected."""
        with pytest.raises(ValueError, match='password must be at most 255 bytes'):
            self._build('user', 'b' * 256)

    def test_max_length_credentials_accepted(self):
        """Exactly 255 characters for each credential is accepted."""
        fwd = self._build('a' * 255, 'b' * 255)
        assert len(fwd.username) == 255

    def test_multibyte_username_too_long(self):
        """The limit applies to encoded bytes, not characters."""
        # 64 emoji at 4 UTF-8 bytes each is 256 bytes, one over the limit.
        oversized = '\U0001f600' * 64
        with pytest.raises(ValueError, match='username must be at most 255 bytes'):
            self._build(oversized, 'pass')


# ---------------------------------------------------------------------------
# SOCKS5Forwarder.start — non-loopback warning
# ---------------------------------------------------------------------------


class TestNonLoopbackWarning:
    """``SOCKS5Forwarder.start`` logging and port checks against a mocked server."""

    @staticmethod
    def _server_on(*bound_addresses):
        """Build a mock server whose sockets report the given ``getsockname`` tuples."""
        sockets = []
        for address in bound_addresses:
            sock = MagicMock()
            sock.getsockname.return_value = address
            sockets.append(sock)
        server = AsyncMock()
        server.sockets = sockets
        return server

    @staticmethod
    def _forwarder_on(local_host):
        """Construct a forwarder that differs from the fixture only in ``local_host``."""
        return SOCKS5Forwarder(
            remote_host='proxy.example.com',
            remote_port=1080,
            username='user',
            password='pass',
            local_host=local_host,
        )

    @pytest.mark.asyncio
    async def test_loopback_no_warning(self, forwarder, caplog):
        """Binding to 127.0.0.1 emits no non-loopback warning."""
        server = self._server_on(('127.0.0.1', 9999))
        listening = patch('asyncio.start_server', return_value=server)

        with listening, caplog.at_level(logging.WARNING):
            await forwarder.start()
        assert 'non-loopback' not in caplog.text

    @pytest.mark.asyncio
    async def test_non_loopback_warns(self, caplog):
        """Binding to 0.0.0.0 emits a warning that names the address."""
        fwd = self._forwarder_on('0.0.0.0')
        server = self._server_on(('0.0.0.0', 9999))
        listening = patch('asyncio.start_server', return_value=server)

        with listening, caplog.at_level(logging.WARNING):
            await fwd.start()
        assert 'non-loopback' in caplog.text
        assert '0.0.0.0' in caplog.text

    @pytest.mark.asyncio
    async def test_ipv6_non_loopback_warns(self, caplog):
        """Binding to the IPv6 wildcard ``::`` emits the warning too."""
        fwd = self._forwarder_on('::')
        server = self._server_on(('::', 9999))
        listening = patch('asyncio.start_server', return_value=server)

        with listening, caplog.at_level(logging.WARNING):
            await fwd.start()
        assert 'non-loopback' in caplog.text

    @pytest.mark.asyncio
    async def test_hostname_does_not_crash(self, caplog):
        """local_host='localhost' should not raise ValueError from ip_address()."""
        fwd = self._forwarder_on('localhost')
        server = self._server_on(('127.0.0.1', 9999))
        listening = patch('asyncio.start_server', return_value=server)

        with listening, caplog.at_level(logging.WARNING):
            await fwd.start()
        assert 'non-loopback' not in caplog.text

    @pytest.mark.asyncio
    async def test_non_localhost_hostname_logs_debug(self, caplog):
        """A non-'localhost' hostname triggers a debug-level message."""
        fwd = self._forwarder_on('myhost.local')
        server = self._server_on(('192.168.1.5', 9999))
        listening = patch('asyncio.start_server', return_value=server)

        with listening, caplog.at_level(logging.DEBUG):
            await fwd.start()
        assert 'not an IP literal' in caplog.text

    @pytest.mark.asyncio
    async def test_multi_socket_divergent_ports_raises(self, forwarder):
        """start() raises RuntimeError if sockets have different ports."""
        server = self._server_on(('127.0.0.1', 9998), ('::1', 9999))
        # Give the server an explicit synchronous close() and an awaitable
        # wait_closed() rather than relying on auto-created child mocks.
        server.close = MagicMock()
        server.wait_closed = AsyncMock()
        listening = patch('asyncio.start_server', return_value=server)

        with listening, pytest.raises(RuntimeError, match='different ports'):
            await forwarder.start()

    @pytest.mark.asyncio
    async def test_multi_socket_same_port_ok(self, forwarder):
        """start() succeeds when all sockets share the same port."""
        server = self._server_on(('127.0.0.1', 9999), ('::1', 9999))

        with patch('asyncio.start_server', return_value=server):
            await forwarder.start()
        assert forwarder.local_port == 9999


# ---------------------------------------------------------------------------
# Credential masking in logs
# ---------------------------------------------------------------------------


class TestCredentialMasking:
    """Log hygiene and reply-code propagation for ``_remote_handshake``."""

    @staticmethod
    def _scripted_readexactly(replies):
        """Return a ``readexactly`` replacement that serves ``replies`` in order.

        The requested size is ignored; each call simply yields the next
        canned chunk, raising ``IndexError`` if the script is exhausted.
        """
        position = 0

        async def fake_readexactly(n):
            nonlocal position
            chunk = replies[position]
            position += 1
            return chunk

        return fake_readexactly

    @staticmethod
    def _remote_streams():
        """Build reader/writer mocks shaped like asyncio streams."""
        reader = AsyncMock(spec=asyncio.StreamReader)
        writer = MagicMock(spec=asyncio.StreamWriter)
        writer.write = MagicMock()
        writer.drain = AsyncMock()
        return reader, writer

    @pytest.mark.asyncio
    async def test_remote_handshake_does_not_log_credentials(self, forwarder, caplog):
        """Verify that _remote_handshake logs ulen/plen instead of raw hex."""
        reader, writer = self._remote_streams()
        reader.readexactly = self._scripted_readexactly([
            bytes([0x05, 0x02]),  # method selection: server picks username/password auth
            bytes([0x01, 0x00]),  # auth response: success
            bytes([0x05, 0x00, 0x00, 0x01]),  # connect reply: success + IPv4
            b'\x00\x00\x00\x00',  # BND.ADDR (IPv4)
            b'\x00\x00',  # BND.PORT
        ])

        with caplog.at_level(logging.DEBUG):
            await forwarder._remote_handshake(
                reader, writer, bytes([0x01, 127, 0, 0, 1]), 80
            )

        log_text = caplog.text
        # Neither credential may appear hex-encoded anywhere in the captured
        # logs. Each is checked unconditionally so a leak fails the test even
        # when the safe ulen/plen summary is also present.
        for secret in (forwarder.username, forwarder.password):
            assert secret.encode().hex() not in log_text
        # The safe summary (lengths only) must be logged instead.
        assert 'ulen=4 plen=4' in log_text

    @pytest.mark.asyncio
    async def test_remote_connect_failure_propagates_rep_code(self, forwarder):
        """Remote proxy CONNECT failure REP code is forwarded to _HandshakeError."""
        reader, writer = self._remote_streams()
        reader.readexactly = self._scripted_readexactly([
            bytes([0x05, 0x00]),  # method selection: no-auth
            bytes([0x05, 0x05, 0x00, 0x01]),  # connect reply: 0x05 = connection refused
        ])
        reader.read = AsyncMock(return_value=b'')

        with pytest.raises(_HandshakeError) as exc_info:
            await forwarder._remote_handshake(
                reader, writer, bytes([0x01, 127, 0, 0, 1]), 80
            )

        assert exc_info.value.reply_code == REPLY_CONNECTION_REFUSED
        assert 'rep=0x05' in str(exc_info.value)


# ---------------------------------------------------------------------------
# _handle_client — reply code routing
# ---------------------------------------------------------------------------


class TestHandleClientReplyCodes:
    """How ``_handle_client`` maps failures onto ``_send_reply`` calls."""

    # Value returned by the patched local handshake in the connect-stage tests.
    _LOCAL_HANDSHAKE_RESULT = (b'\x01\x7f\x00\x00\x01', 80)

    @staticmethod
    def _stream_pair():
        """Build a (reader, writer) pair of stream-shaped mocks."""
        reader = AsyncMock(spec=asyncio.StreamReader)
        writer = MagicMock(spec=asyncio.StreamWriter)
        writer.write = MagicMock()
        writer.drain = AsyncMock()
        writer.close = MagicMock()
        writer.wait_closed = AsyncMock()
        return reader, writer

    @pytest.mark.asyncio
    async def test_handshake_error_uses_exc_reply_code(self, forwarder):
        """_HandshakeError.reply_code flows to _send_reply."""
        reader, writer = self._stream_pair()
        failure = _HandshakeError('bad cmd', reply_code=REPLY_COMMAND_NOT_SUPPORTED)

        local = patch.object(forwarder, '_accept_local_handshake', side_effect=failure)
        reply = patch.object(forwarder, '_send_reply', new_callable=AsyncMock)
        with local, reply as sent:
            await forwarder._handle_client(reader, writer)
        sent.assert_awaited_once_with(writer, REPLY_COMMAND_NOT_SUPPORTED)

    @pytest.mark.asyncio
    async def test_connection_refused_uses_specific_code(self, forwarder):
        """ConnectionRefusedError -> REPLY_CONNECTION_REFUSED."""
        reader, writer = self._stream_pair()

        local = patch.object(
            forwarder, '_accept_local_handshake', return_value=self._LOCAL_HANDSHAKE_RESULT
        )
        connect = patch(
            'asyncio.open_connection', side_effect=ConnectionRefusedError('refused')
        )
        reply = patch.object(forwarder, '_send_reply', new_callable=AsyncMock)
        with local, connect, reply as sent:
            await forwarder._handle_client(reader, writer)
        sent.assert_awaited_once_with(writer, REPLY_CONNECTION_REFUSED)

    @pytest.mark.asyncio
    async def test_generic_os_error_uses_general_failure(self, forwarder):
        """Non-ConnectionRefused OSError -> REPLY_GENERAL_FAILURE."""
        reader, writer = self._stream_pair()

        local = patch.object(
            forwarder, '_accept_local_handshake', return_value=self._LOCAL_HANDSHAKE_RESULT
        )
        connect = patch('asyncio.open_connection', side_effect=OSError('network unreachable'))
        reply = patch.object(forwarder, '_send_reply', new_callable=AsyncMock)
        with local, connect, reply as sent:
            await forwarder._handle_client(reader, writer)
        sent.assert_awaited_once_with(writer, REPLY_GENERAL_FAILURE)

    @pytest.mark.asyncio
    async def test_open_connection_timeout_sends_general_failure(self, forwarder):
        """asyncio.TimeoutError from open_connection -> REPLY_GENERAL_FAILURE."""
        reader, writer = self._stream_pair()

        local = patch.object(
            forwarder, '_accept_local_handshake', return_value=self._LOCAL_HANDSHAKE_RESULT
        )
        connect = patch('asyncio.open_connection', new_callable=AsyncMock)
        # The timeout is simulated by making asyncio.wait_for itself raise.
        timed_out = patch('asyncio.wait_for', side_effect=asyncio.TimeoutError())
        reply = patch.object(forwarder, '_send_reply', new_callable=AsyncMock)
        with local, connect, timed_out, reply as sent:
            await forwarder._handle_client(reader, writer)
        sent.assert_awaited_once_with(writer, REPLY_GENERAL_FAILURE)

    @pytest.mark.asyncio
    async def test_send_reply_false_skips_reply(self, forwarder):
        """_HandshakeError with send_reply=False should not call _send_reply."""
        reader, writer = self._stream_pair()
        failure = _HandshakeError('no auth', send_reply=False)

        local = patch.object(forwarder, '_accept_local_handshake', side_effect=failure)
        reply = patch.object(forwarder, '_send_reply', new_callable=AsyncMock)
        with local, reply as sent:
            await forwarder._handle_client(reader, writer)
        sent.assert_not_awaited()

    @pytest.mark.asyncio
    async def test_handle_client_closes_both_writers(self, forwarder):
        """Both client and remote writers are closed in the finally block."""
        client_reader, client_writer = self._stream_pair()
        remote_reader, remote_writer = self._stream_pair()

        local = patch.object(
            forwarder, '_accept_local_handshake', return_value=self._LOCAL_HANDSHAKE_RESULT
        )
        connect = patch(
            'asyncio.open_connection', return_value=(remote_reader, remote_writer)
        )
        remote = patch.object(
            forwarder, '_remote_handshake', side_effect=_HandshakeError('fail')
        )
        reply = patch.object(forwarder, '_send_reply', new_callable=AsyncMock)
        with local, connect, remote, reply:
            await forwarder._handle_client(client_reader, client_writer)

        for stream in (client_writer, remote_writer):
            stream.close.assert_called_once()
            stream.wait_closed.assert_awaited_once()


# ---------------------------------------------------------------------------
# SOCKS5Forwarder._send_reply
# ---------------------------------------------------------------------------


class TestSendReply:
    """Bytes written by ``SOCKS5Forwarder._send_reply``."""

    @pytest.mark.asyncio
    async def test_sends_correct_reply(self, mock_writer):
        """A success reply starts with version 0x05 and the success code, then drains."""
        await SOCKS5Forwarder._send_reply(mock_writer, REPLY_SUCCESS)
        frame = mock_writer.write.call_args.args[0]
        assert frame[0] == 0x05  # SOCKS5
        assert frame[1] == REPLY_SUCCESS
        mock_writer.drain.assert_awaited_once()

    @pytest.mark.asyncio
    async def test_sends_failure_reply(self, mock_writer):
        """The second byte of the frame carries the requested failure code."""
        await SOCKS5Forwarder._send_reply(mock_writer, REPLY_CONNECTION_REFUSED)
        frame = mock_writer.write.call_args.args[0]
        assert frame[1] == REPLY_CONNECTION_REFUSED


# ---------------------------------------------------------------------------
# _accept_local_handshake — pre-CONNECT send_reply=False and reply codes
# ---------------------------------------------------------------------------


class TestAcceptLocalHandshake:
    """``_accept_local_handshake`` failure modes: ``send_reply`` flag and reply codes."""

    @staticmethod
    def _local_streams():
        """Build reader/writer mocks for the client side of the handshake."""
        reader = AsyncMock(spec=asyncio.StreamReader)
        writer = MagicMock(spec=asyncio.StreamWriter)
        writer.write = MagicMock()
        writer.drain = AsyncMock()
        return reader, writer

    @staticmethod
    def _scripted_readexactly(frames):
        """Return a ``readexactly`` replacement serving ``frames`` one per call."""
        cursor = 0

        async def fake_readexactly(n):
            nonlocal cursor
            frame = frames[cursor]
            cursor += 1
            return frame

        return fake_readexactly

    @pytest.mark.asyncio
    async def test_greeting_eof_has_send_reply_false(self, forwarder):
        """If _read_exact fails during greeting, send_reply must be False."""
        reader, writer = self._local_streams()
        reader.readexactly = AsyncMock(
            side_effect=asyncio.IncompleteReadError(partial=b'', expected=2)
        )

        with pytest.raises(_HandshakeError) as caught:
            await forwarder._accept_local_handshake(reader, writer)
        assert caught.value.send_reply is False

    @pytest.mark.asyncio
    async def test_unsupported_version_has_send_reply_false(self, forwarder):
        """Bad SOCKS version in greeting → send_reply=False."""
        reader, writer = self._local_streams()
        # Every read returns a greeting whose version byte is 0x04.
        reader.readexactly = AsyncMock(return_value=bytes([0x04, 0x01]))

        with pytest.raises(_HandshakeError, match='Unsupported SOCKS version') as caught:
            await forwarder._accept_local_handshake(reader, writer)
        assert caught.value.send_reply is False

    @pytest.mark.asyncio
    async def test_unsupported_command_uses_reply_code_0x07(self, forwarder):
        """CMD != CONNECT → REPLY_COMMAND_NOT_SUPPORTED."""
        reader, writer = self._local_streams()
        reader.readexactly = self._scripted_readexactly([
            bytes([0x05, 0x01]),  # VER, NMETHODS
            bytes([0x00]),  # method: no-auth
            bytes([0x05, 0x02, 0x00, 0x01]),  # VER, CMD=BIND(0x02), RSV, ATYP
        ])

        with pytest.raises(_HandshakeError) as caught:
            await forwarder._accept_local_handshake(reader, writer)
        assert caught.value.reply_code == REPLY_COMMAND_NOT_SUPPORTED

    @pytest.mark.asyncio
    async def test_unsupported_address_type_uses_reply_code_0x08(self, forwarder):
        """Unknown ATYP → REPLY_ADDRESS_TYPE_NOT_SUPPORTED."""
        reader, writer = self._local_streams()
        reader.readexactly = self._scripted_readexactly([
            bytes([0x05, 0x01]),  # VER, NMETHODS
            bytes([0x00]),  # method: no-auth
            bytes([0x05, 0x01, 0x00, 0xFF]),  # VER, CMD=CONNECT, RSV, ATYP=0xFF (unknown)
        ])

        with pytest.raises(_HandshakeError) as caught:
            await forwarder._accept_local_handshake(reader, writer)
        assert caught.value.reply_code == REPLY_ADDRESS_TYPE_NOT_SUPPORTED


# ---------------------------------------------------------------------------
# Constants
# ---------------------------------------------------------------------------


class TestConstants:
    """Sanity checks for the handshake timeout and the reply-code constants."""

    def test_handshake_timeout_is_positive(self):
        """The handshake timeout must be strictly greater than zero."""
        assert HANDSHAKE_TIMEOUT > 0

    def test_reply_codes_are_distinct(self):
        """No two of the five reply codes may share a value."""
        all_codes = (
            REPLY_SUCCESS,
            REPLY_GENERAL_FAILURE,
            REPLY_CONNECTION_REFUSED,
            REPLY_COMMAND_NOT_SUPPORTED,
            REPLY_ADDRESS_TYPE_NOT_SUPPORTED,
        )
        # Duplicates collapse in a set, so fewer than five entries means a clash.
        assert len(set(all_codes)) == 5


================================================
FILE: tests/test_user_agent_parser.py
================================================
"""
Tests for UserAgentParser class.

Verifies that User-Agent strings are parsed into consistent metadata
for CDP Emulation.setUserAgentOverride and navigator JS overrides.
"""

import pytest

from pydoll.utils.user_agent_parser import UserAgentParser, ParsedUserAgent


# --- Chrome on Windows ---

# Desktop Chrome 120 User-Agent reporting Windows NT 10.0 on x64.
CHROME_WINDOWS_UA = ' '.join([
    'Mozilla/5.0 (Windows NT 10.0; Win64; x64)',
    'AppleWebKit/537.36 (KHTML, like Gecko)',
    'Chrome/120.0.6099.109 Safari/537.36',
])


class TestChromeWindows:
    """Checks the parse result for a desktop Chrome User-Agent on Windows NT 10.0."""

    def test_platform(self):
        assert UserAgentParser.parse(CHROME_WINDOWS_UA).platform == 'Win32'

    def test_vendor(self):
        assert UserAgentParser.parse(CHROME_WINDOWS_UA).vendor == 'Google Inc.'

    def test_app_version(self):
        parsed = UserAgentParser.parse(CHROME_WINDOWS_UA)
        assert parsed.app_version.startswith('5.0 (Windows NT 10.0')

    def test_metadata_platform(self):
        metadata = UserAgentParser.parse(CHROME_WINDOWS_UA).user_agent_metadata
        assert metadata['platform'] == 'Windows'

    def test_metadata_platform_version(self):
        metadata = UserAgentParser.parse(CHROME_WINDOWS_UA).user_agent_metadata
        assert metadata['platformVersion'] == '15.0.0'

    def test_metadata_architecture(self):
        metadata = UserAgentParser.parse(CHROME_WINDOWS_UA).user_agent_metadata
        assert metadata['architecture'] == 'x86'

    def test_metadata_mobile(self):
        metadata = UserAgentParser.parse(CHROME_WINDOWS_UA).user_agent_metadata
        assert metadata['mobile'] is False

    def test_metadata_model_empty(self):
        metadata = UserAgentParser.parse(CHROME_WINDOWS_UA).user_agent_metadata
        assert metadata['model'] == ''

    def test_metadata_bitness(self):
        metadata = UserAgentParser.parse(CHROME_WINDOWS_UA).user_agent_metadata
        assert metadata['bitness'] == '64'

    def test_metadata_wow64(self):
        metadata = UserAgentParser.parse(CHROME_WINDOWS_UA).user_agent_metadata
        assert metadata['wow64'] is False

    def test_brands_contains_chromium(self):
        metadata = UserAgentParser.parse(CHROME_WINDOWS_UA).user_agent_metadata
        listed_names = [entry['brand'] for entry in metadata['brands']]
        assert 'Chromium' in listed_names

    def test_brands_contains_chrome(self):
        metadata = UserAgentParser.parse(CHROME_WINDOWS_UA).user_agent_metadata
        listed_names = [entry['brand'] for entry in metadata['brands']]
        assert 'Google Chrome' in listed_names

    def test_brands_contains_grease(self):
        real_brands = {'Chromium', 'Google Chrome', 'Microsoft Edge'}
        brand_entries = UserAgentParser.parse(CHROME_WINDOWS_UA).user_agent_metadata['brands']
        assert len(brand_entries) == 3
        # The leading entry is expected to be the GREASE placeholder, not a real brand.
        assert brand_entries[0]['brand'] not in real_brands

    def test_brands_major_version(self):
        brand_entries = UserAgentParser.parse(CHROME_WINDOWS_UA).user_agent_metadata['brands']
        chromium_entry = next(
            entry for entry in brand_entries if entry['brand'] == 'Chromium'
        )
        assert chromium_entry['version'] == '120'

    def test_full_version_list(self):
        metadata = UserAgentParser.parse(CHROME_WINDOWS_UA).user_agent_metadata
        chromium_entry = next(
            entry for entry in metadata['fullVersionList'] if entry['brand'] == 'Chromium'
        )
        assert chromium_entry['version'] == '120.0.6099.109'

    def test_navigator_js_contains_vendor(self):
        override_js = UserAgentParser.parse(CHROME_WINDOWS_UA).navigator_override_js
        assert "Navigator.prototype, 'vendor'" in override_js

    def test_navigator_js_contains_app_version(self):
        override_js = UserAgentParser.parse(CHROME_WINDOWS_UA).navigator_override_js
        assert "Navigator.prototype, 'appVersion'" in override_js


# --- Chrome on macOS ---

# Desktop Chrome 121 User-Agent reporting Intel Mac OS X 10_15_7.
CHROME_MACOS_UA = ' '.join([
    'Mozilla/5.0 (Macintosh; Intel Mac OS X 10_15_7)',
    'AppleWebKit/537.36 (KHTML, like Gecko)',
    'Chrome/121.0.6167.85 Safari/537.36',
])


class TestChromeMacOS:
    """Checks the parse result for a desktop Chrome User-Agent on macOS."""

    def test_platform(self):
        assert UserAgentParser.parse(CHROME_MACOS_UA).platform == 'MacIntel'

    def test_metadata_platform(self):
        metadata = UserAgentParser.parse(CHROME_MACOS_UA).user_agent_metadata
        assert metadata['platform'] == 'macOS'

    def test_metadata_platform_version(self):
        metadata = UserAgentParser.parse(CHROME_MACOS_UA).user_agent_metadata
        assert metadata['platformVersion'] == '10.15.7'

    def test_metadata_architecture(self):
        metadata = UserAgentParser.parse(CHROME_MACOS_UA).user_agent_metadata
        assert metadata['architecture'] == 'arm'

    def test_brands_version(self):
        brand_entries = UserAgentParser.parse(CHROME_MACOS_UA).user_agent_metadata['brands']
        chromium_entry = next(
            entry for entry in brand_entries if entry['brand'] == 'Chromium'
        )
        assert chromium_entry['version'] == '121'


# --- Chrome on Linux ---

# Desktop Chrome 122 User-Agent reporting X11 / Linux x86_64.
CHROME_LINUX_UA = ' '.join([
    'Mozilla/5.0 (X11; Linux x86_64)',
    'AppleWebKit/537.36 (KHTML, like Gecko)',
    'Chrome/122.0.6261.94 Safari/537.36',
])


class TestChromeLinux:
    """Checks the parse result for a desktop Chrome User-Agent on Linux x86_64."""

    def test_platform(self):
        assert UserAgentParser.parse(CHROME_LINUX_UA).platform == 'Linux x86_64'

    def test_metadata_platform(self):
        metadata = UserAgentParser.parse(CHROME_LINUX_UA).user_agent_metadata
        assert metadata['platform'] == 'Linux'

    def test_metadata_platform_version(self):
        metadata = UserAgentParser.parse(CHROME_LINUX_UA).user_agent_metadata
        assert metadata['platformVersion'] == '6.1.0'

    def test_metadata_architecture(self):
        metadata = UserAgentParser.parse(CHROME_LINUX_UA).user_agent_metadata
        assert metadata['architecture'] == 'x86'


# --- Edge on Windows ---

# Edge 120 User-Agent on Windows NT 10.0; carries both a Chrome/ and an Edg/ token.
EDGE_WINDOWS_UA = ' '.join([
    'Mozilla/5.0 (Windows NT 10.0; Win64; x64)',
    'AppleWebKit/537.36 (KHTML, like Gecko)',
    'Chrome/120.0.0.0 Safari/537.36 Edg/120.0.2210.91',
])


class TestEdgeWindows:
    """Checks the parse result for a Microsoft Edge User-Agent on Windows."""

    def test_platform(self):
        assert UserAgentParser.parse(EDGE_WINDOWS_UA).platform == 'Win32'

    def test_brands_contains_edge(self):
        metadata = UserAgentParser.parse(EDGE_WINDOWS_UA).user_agent_metadata
        listed_names = [entry['brand'] for entry in metadata['brands']]
        assert 'Microsoft Edge' in listed_names

    def test_brands_does_not_contain_chrome(self):
        metadata = UserAgentParser.parse(EDGE_WINDOWS_UA).user_agent_metadata
        listed_names = [entry['brand'] for entry in metadata['brands']]
        assert 'Google Chrome' not in listed_names

    def test_brands_chromium_present(self):
        metadata = UserAgentParser.parse(EDGE_WINDOWS_UA).user_agent_metadata
        listed_names = [entry['brand'] for entry in metadata['brands']]
        assert 'Chromium' in listed_names

    def test_full_version_list_edge_version(self):
        metadata = UserAgentParser.parse(EDGE_WINDOWS_UA).user_agent_metadata
        edge_entry = next(
            entry for entry in metadata['fullVersionList'] if entry['brand'] == 'Microsoft Edge'
        )
        assert edge_entry['version'] == '120.0.2210.91'


# --- Android Chrome ---

# Mobile Chrome 120 User-Agent reporting Android 14 on a Pixel 7.
CHROME_ANDROID_UA = ' '.join([
    'Mozilla/5.0 (Linux; Android 14; Pixel 7 Build/AP2A.240805.005)',
    'AppleWebKit/537.36 (KHTML, like Gecko)',
    'Chrome/120.0.6099.144 Mobile Safari/537.36',
])


class TestChromeAndroid:
    """Checks the parse result for a mobile Chrome User-Agent on Android."""

    def test_platform(self):
        # NOTE(review): Chrome on Android is usually seen reporting 'Linux armv8l'
        # (lowercase L); confirm that 'armv81' (digit one) is what the parser intends.
        assert UserAgentParser.parse(CHROME_ANDROID_UA).platform == 'Linux armv81'

    def test_metadata_platform(self):
        metadata = UserAgentParser.parse(CHROME_ANDROID_UA).user_agent_metadata
        assert metadata['platform'] == 'Android'

    def test_metadata_platform_version(self):
        metadata = UserAgentParser.parse(CHROME_ANDROID_UA).user_agent_metadata
        assert metadata['platformVersion'] == '14'

    def test_metadata_mobile(self):
        metadata = UserAgentParser.parse(CHROME_ANDROID_UA).user_agent_metadata
        assert metadata['mobile'] is True

    def test_metadata_model(self):
        metadata = UserAgentParser.parse(CHROME_ANDROID_UA).user_agent_metadata
        assert metadata['model'] == 'Pixel 7'

    def test_metadata_architecture(self):
        metadata = UserAgentParser.parse(CHROME_ANDROID_UA).user_agent_metadata
        assert metadata['architecture'] == 'arm'


# --- iPhone Safari-like UA ---

# iPhone User-Agent (iPhone OS 17_1_2) carrying a CriOS/ browser token.
IPHONE_UA = ' '.join([
    'Mozilla/5.0 (iPhone; CPU iPhone OS 17_1_2 like Mac OS X)',
    'AppleWebKit/605.1.15 (KHTML, like Gecko)',
    'CriOS/120.0.6099.119 Mobile/15E148 Safari/604.1',
])


class TestIPhone:
    """Checks the parse result for an iPhone User-Agent."""

    def test_platform(self):
        assert UserAgentParser.parse(IPHONE_UA).platform == 'iPhone'

    def test_metadata_platform(self):
        metadata = UserAgentParser.parse(IPHONE_UA).user_agent_metadata
        assert metadata['platform'] == 'iOS'

    def test_metadata_platform_version(self):
        metadata = UserAgentParser.parse(IPHONE_UA).user_agent_metadata
        assert metadata['platformVersion'] == '17.1.2'

    def test_metadata_mobile(self):
        metadata = UserAgentParser.parse(IPHONE_UA).user_agent_metadata
        assert metadata['mobile'] is True

    def test_metadata_architecture(self):
        metadata = UserAgentParser.parse(IPHONE_UA).user_agent_metadata
        assert metadata['architecture'] == 'arm'


# --- Old Windows versions ---

class TestWindowsVersionMapping:
    """Checks the platformVersion reported for pre-10 Windows NT version tokens."""

    def test_windows_7(self):
        win7_ua = (
            'Mozilla/5.0 (Windows NT 6.1; Win64; x64) AppleWebKit/537.36 '
            'Chrome/120.0.6099.109 Safari/537.36'
        )
        metadata = UserAgentParser.parse(win7_ua).user_agent_metadata
        assert metadata['platformVersion'] == '0.1.0'

    def test_windows_8(self):
        win8_ua = (
            'Mozilla/5.0 (Windows NT 6.2; Win64; x64) AppleWebKit/537.36 '
            'Chrome/120.0.6099.109 Safari/537.36'
        )
        metadata = UserAgentParser.parse(win8_ua).user_agent_metadata
        assert metadata['platformVersion'] == '0.2.0'

    def test_windows_8_1(self):
        win81_ua = (
            'Mozilla/5.0 (Windows NT 6.3; Win64; x64) AppleWebKit/537.36 '
            'Chrome/120.0.6099.109 Safari/537.36'
        )
        metadata = UserAgentParser.parse(win81_ua).user_agent_metadata
        assert metadata['platformVersion'] == '0.3.0'


# --- GREASE brands ---

class TestGreaseBrands:
    """Checks position and version format of the leading (GREASE) brand entry."""

    def test_grease_brand_is_first(self):
        real_brands = {'Chromium', 'Google Chrome', 'Microsoft Edge'}
        metadata = UserAgentParser.parse(CHROME_WINDOWS_UA).user_agent_metadata
        leading_name = metadata['brands'][0]['brand']
        assert leading_name not in real_brands

    def test_full_version_list_grease_is_first(self):
        real_brands = {'Chromium', 'Google Chrome', 'Microsoft Edge'}
        metadata = UserAgentParser.parse(CHROME_WINDOWS_UA).user_agent_metadata
        leading_name = metadata['fullVersionList'][0]['brand']
        assert leading_name not in real_brands

    def test_grease_version_format_for_brands(self):
        # In `brands` the leading entry's version must consist of digits only.
        metadata = UserAgentParser.parse(CHROME_WINDOWS_UA).user_agent_metadata
        leading_version = metadata['brands'][0]['version']
        assert leading_version.isdigit()

    def test_grease_version_format_for_full_version_list(self):
        # In `fullVersionList` the leading entry's version must contain a dot.
        metadata = UserAgentParser.parse(CHROME_WINDOWS_UA).user_agent_metadata
        leading_version = metadata['fullVersionList'][0]['version']
        assert '.' in leading_version


# --- Edge cases ---

class TestEdgeCases:
    """Fallback and formatting behaviour of UserAgentParser.parse on unusual input."""

    def test_unknown_browser_defaults_to_chrome(self):
        unrecognised_ua = 'Some random string without browser info'
        metadata = UserAgentParser.parse(unrecognised_ua).user_agent_metadata
        listed_names = [entry['brand'] for entry in metadata['brands']]
        assert 'Google Chrome' in listed_names

    def test_unknown_os_defaults_to_windows(self):
        # This UA has no parenthesised OS section at all.
        no_os_ua = 'Mozilla/5.0 AppleWebKit/537.36 Chrome/120.0.6099.109 Safari/537.36'
        parsed = UserAgentParser.parse(no_os_ua)
        assert parsed.platform == 'Win32'
        assert parsed.user_agent_metadata['platform'] == 'Windows'

    def test_returns_parsed_user_agent_type(self):
        assert isinstance(UserAgentParser.parse(CHROME_WINDOWS_UA), ParsedUserAgent)

    def test_navigator_js_escapes_single_quotes(self):
        # NOTE(review): this UA contains no single quote, so the check only
        # verifies that no escaped quote appears unless the vendor has a quote.
        quote_free_ua = (
            "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 "
            "Chrome/120.0.6099.109 Safari/537.36"
        )
        parsed = UserAgentParser.parse(quote_free_ua)
        assert not ("\\'" in parsed.navigator_override_js and "'" not in parsed.vendor)

    def test_app_version_strips_mozilla_prefix(self):
        app_version = UserAgentParser.parse(CHROME_WINDOWS_UA).app_version
        assert not app_version.startswith('Mozilla/')
        assert app_version.startswith('5.0')

    def test_non_mozilla_ua_keeps_full_string(self):
        bot_ua = 'CustomBot/1.0 Chrome/120.0.6099.109'
        assert UserAgentParser.parse(bot_ua).app_version == bot_ua


# --- ChromeOS ---

# Desktop Chrome 120 User-Agent reporting CrOS x86_64 14541.0.0.
CHROMEOS_UA = ' '.join([
    'Mozilla/5.0 (X11; CrOS x86_64 14541.0.0)',
    'AppleWebKit/537.36 (KHTML, like Gecko)',
    'Chrome/120.0.6099.109 Safari/537.36',
])


class TestChromeOS:
    """Checks the parse result for a Chrome User-Agent on ChromeOS."""

    def test_platform(self):
        assert UserAgentParser.parse(CHROMEOS_UA).platform == 'Linux x86_64'

    def test_metadata_platform(self):
        metadata = UserAgentParser.parse(CHROMEOS_UA).user_agent_metadata
        assert metadata['platform'] == 'Chrome OS'

    def test_metadata_platform_version(self):
        metadata = UserAgentParser.parse(CHROMEOS_UA).user_agent_metadata
        assert metadata['platformVersion'] == '14541.0.0'


================================================
FILE: tests/test_utils.py
================================================
import aiohttp
import pytest
from aioresponses import aioresponses
import tempfile
import os
import sys
from unittest.mock import patch

from pydoll import exceptions
from pydoll.utils import (
    clean_script_for_analysis,
    decode_base64_to_bytes,
    get_browser_ws_address,
    has_return_outside_function,
    is_script_already_function,
    validate_browser_paths,
    extract_text_from_html,
)


class TestUtils:
    """
    Tests for helpers imported from pydoll.utils: base64 decoding, lookup of
    the browser WebSocket address, and validation of browser executable paths.
    """

    def test_decode_image_to_bytes(self):
        """A base64 payload decodes back to its original bytes."""
        encoded = 'aGVsbG8gd29ybGQ='  # 'hello world' in base64
        decoded = decode_base64_to_bytes(encoded)
        assert decoded == b'hello world'

    def test_decode_image_to_bytes_empty_string(self):
        """An empty input string decodes to empty bytes."""
        decoded = decode_base64_to_bytes('')
        assert decoded == b''

    def test_decode_image_to_bytes_complex_data(self):
        """A longer, padded base64 payload decodes correctly."""
        # Base64 for "The quick brown fox jumps over the lazy dog"
        encoded = 'VGhlIHF1aWNrIGJyb3duIGZveCBqdW1wcyBvdmVyIHRoZSBsYXp5IGRvZw=='
        decoded = decode_base64_to_bytes(encoded)
        assert decoded == b'The quick brown fox jumps over the lazy dog'

    @pytest.mark.asyncio
    async def test_successful_response(self):
        """
        The WebSocket URL is returned when the /json/version payload
        contains the 'webSocketDebuggerUrl' field.
        """
        debug_port = 9222
        ws_url = 'ws://localhost:9222/devtools/browser/abc123'
        endpoint = f'http://localhost:{debug_port}/json/version'

        with aioresponses() as http_mock:
            http_mock.get(endpoint, payload={'webSocketDebuggerUrl': ws_url})
            assert await get_browser_ws_address(debug_port) == ws_url

    @pytest.mark.asyncio
    async def test_network_error(self):
        """An aiohttp.ClientError on the request surfaces as NetworkError."""
        debug_port = 9222
        endpoint = f'http://localhost:{debug_port}/json/version'

        with pytest.raises(exceptions.NetworkError), aioresponses() as http_mock:
            http_mock.get(endpoint, exception=aiohttp.ClientError)
            await get_browser_ws_address(debug_port)

    @pytest.mark.asyncio
    async def test_missing_websocket_url(self):
        """
        InvalidResponse is raised when the payload lacks the
        'webSocketDebuggerUrl' field.
        """
        debug_port = 9222
        endpoint = f'http://localhost:{debug_port}/json/version'

        with aioresponses() as http_mock:
            http_mock.get(endpoint, payload={'someOtherKey': 'value'})
            with pytest.raises(exceptions.InvalidResponse):
                await get_browser_ws_address(debug_port)

    @pytest.mark.asyncio
    async def test_http_error_status(self):
        """An HTTP 404 from the endpoint surfaces as NetworkError."""
        debug_port = 9222
        endpoint = f'http://localhost:{debug_port}/json/version'

        with pytest.raises(exceptions.NetworkError), aioresponses() as http_mock:
            http_mock.get(endpoint, status=404)
            await get_browser_ws_address(debug_port)

    @pytest.mark.asyncio
    async def test_custom_port(self):
        """The address lookup also works for a non-default port."""
        debug_port = 9333
        ws_url = 'ws://localhost:9333/devtools/browser/xyz789'
        endpoint = f'http://localhost:{debug_port}/json/version'

        with aioresponses() as http_mock:
            http_mock.get(endpoint, payload={'webSocketDebuggerUrl': ws_url})
            assert await get_browser_ws_address(debug_port) == ws_url

    def test_validate_browser_paths_success(self):
        """A valid executable listed after an invalid path is the one returned."""
        with tempfile.TemporaryDirectory() as sandbox:
            executable = os.path.join(sandbox, 'browser')
            with open(executable, 'w') as handle:
                handle.write('#!/bin/bash\necho "browser"')
            os.chmod(executable, 0o755)  # mark the stub as executable

            candidates = ['/nonexistent/browser', executable]
            assert validate_browser_paths(candidates) == executable

    def test_validate_browser_paths_first_valid_wins(self):
        """When several candidates are valid, the earliest one is returned."""
        with tempfile.TemporaryDirectory() as sandbox:
            preferred = os.path.join(sandbox, 'browser1')
            fallback = os.path.join(sandbox, 'browser2')

            # Both stubs are created identically and made executable.
            for stub in (preferred, fallback):
                with open(stub, 'w') as handle:
                    handle.write('#!/bin/bash\necho "browser"')
                os.chmod(stub, 0o755)

            assert validate_browser_paths([preferred, fallback]) == preferred

    def test_validate_browser_paths_no_valid_paths(self):
        """InvalidBrowserPath, with its standard message, is raised when nothing matches."""
        missing = [
            '/nonexistent/browser1',
            '/nonexistent/browser2',
            '/nonexistent/browser3',
        ]

        with pytest.raises(exceptions.InvalidBrowserPath) as exc_info:
            validate_browser_paths(missing)

        message = str(exc_info.value)
        assert 'No valid browser path found in:' in message

    @pytest.mark.skipif(sys.platform.startswith('win'), reason='No executable bit on NTFS on Windows')
    def test_validate_browser_paths_file_exists_but_not_executable(self):
        """An existing file without the executable bit is rejected."""
        with tempfile.TemporaryDirectory() as sandbox:
            plain_file = os.path.join(sandbox, 'browser')
            # Deliberately no chmod: the file keeps its default permissions.
            with open(plain_file, 'w') as handle:
                handle.write('not executable')

            with pytest.raises(exceptions.InvalidBrowserPath):
                validate_browser_paths([plain_file])

    @pytest.mark.skipif(sys.platform.startswith('win'), reason='No executable bit on NTFS on Windows')
    def test_validate_browser_paths_directory_instead_of_file(self):
        """A directory is rejected even though it carries execute permission."""
        with tempfile.TemporaryDirectory() as sandbox:
            os.chmod(sandbox, 0o755)
            with pytest.raises(exceptions.InvalidBrowserPath):
                validate_browser_paths([sandbox])

    def test_validate_browser_paths_empty_list(self):
        """An empty candidate list raises InvalidBrowserPath."""
        no_candidates = []
        with pytest.raises(exceptions.InvalidBrowserPath):
            validate_browser_paths(no_candidates)

    def test_validate_browser_paths_mixed_valid_invalid(self):
        """Invalid entries before and after the valid one do not affect the result."""
        with tempfile.TemporaryDirectory() as sandbox:
            executable = os.path.join(sandbox, 'browser')
            with open(executable, 'w') as handle:
                handle.write('#!/bin/bash\necho "browser"')
            os.chmod(executable, 0o755)

            candidates = [
                '/nonexistent/browser1',
                '/nonexistent/browser2',
                executable,
                '/nonexistent/browser3',
            ]
            assert validate_browser_paths(candidates) == executable


class TestDecodeBase64ToBytes:
    """Checks decode_base64_to_bytes on a valid payload and on empty input."""

    def test_decode_base64_to_bytes_valid_input(self):
        """A valid base64 string decodes to the original bytes."""
        encoded = 'SGVsbG8gV29ybGQ='  # "Hello World" in base64
        assert decode_base64_to_bytes(encoded) == b'Hello World'

    def test_decode_base64_to_bytes_empty_string(self):
        """An empty base64 string decodes to empty bytes."""
        assert decode_base64_to_bytes('') == b''


class TestValidateBrowserPaths:
    """Checks validate_browser_paths with one valid path and with only invalid paths."""

    def test_validate_browser_paths_valid_path(self, tmp_path):
        """A single executable file is returned unchanged as a string path."""
        # Build an executable stub inside pytest's per-test temporary directory.
        stub = tmp_path / "browser"
        stub.write_text("#!/bin/bash\necho 'browser'")
        stub.chmod(0o755)
        stub_path = str(stub)

        assert validate_browser_paths([stub_path]) == stub_path

    def test_validate_browser_paths_invalid_paths(self):
        """Only non-existent paths raises InvalidBrowserPath."""
        from pydoll.exceptions import InvalidBrowserPath

        missing = ['/nonexistent/path', '/another/invalid/path']
        with pytest.raises(InvalidBrowserPath):
            validate_browser_paths(missing)


class TestScriptAnalysisFunctions:
    """Tests for the JavaScript analysis helpers and for extract_text_from_html."""

    def test_clean_script_for_analysis_removes_comments(self):
        """Line and block comments are dropped while the code is kept."""
        source = '''
        // This is a line comment
        var x = 5;
        /* This is a block comment */
        return x;
        '''

        cleaned = clean_script_for_analysis(source)

        assert '// This is a line comment' not in cleaned
        assert '/* This is a block comment */' not in cleaned
        assert 'var x = 5;' in cleaned
        assert 'return x;' in cleaned

    def test_clean_script_for_analysis_removes_strings(self):
        """The contents of double-quoted, single-quoted and template strings are removed."""
        source = '''
        var message = "This string contains return statement";
        var another = 'Another string with return';
        var template = `Template literal with return`;
        return "actual return";
        '''

        cleaned = clean_script_for_analysis(source)

        assert 'This string contains return statement' not in cleaned
        assert 'Another string with return' not in cleaned
        assert 'Template literal with return' not in cleaned
        # The literal after `return` is expected to collapse to empty quotes.
        assert 'return ""' in cleaned

    def test_is_script_already_function_regular_function(self):
        """An anonymous `function` expression is recognised."""
        assert is_script_already_function('function() { console.log("test"); }') is True

    def test_is_script_already_function_arrow_function(self):
        """An arrow function is recognised."""
        assert is_script_already_function('() => { console.log("test"); }') is True

    def test_is_script_already_function_with_parameters(self):
        """A function expression with parameters is recognised."""
        assert is_script_already_function('function(a, b) { return a + b; }') is True

    def test_is_script_already_function_not_function(self):
        """Plain statements are not reported as a function."""
        assert is_script_already_function('console.log("test"); return "value";') is False

    def test_is_script_already_function_with_whitespace(self):
        """Surrounding whitespace does not prevent detection."""
        assert is_script_already_function('   function() { test(); }   ') is True

    def test_has_return_outside_function_simple_return(self):
        """A bare top-level return is detected."""
        assert has_return_outside_function('return document.title;') is True

    def test_has_return_outside_function_no_return(self):
        """A script without any return reports False."""
        assert has_return_outside_function('console.log("test"); var x = 5;') is False

    def test_has_return_outside_function_return_inside_function(self):
        """A return that only appears inside a function body is not counted."""
        source = '''
        function getTitle() {
            return document.title;
        }
        getTitle();
        '''
        assert has_return_outside_function(source) is False

    def test_has_return_outside_function_mixed_returns(self):
        """A top-level return is detected even when a function also returns."""
        source = '''
        function inner() {
            return "inner";
        }
        return "outer";
        '''
        assert has_return_outside_function(source) is True

    def test_has_return_outside_function_already_function(self):
        """A script that is itself a function reports False."""
        assert has_return_outside_function('function() { return "test"; }') is False

    def test_has_return_outside_function_with_comments(self):
        """The word 'return' inside comments and strings does not hide the real return."""
        source = '''
        // This comment has return in it
        var message = "This string has return in it";
        /* This block comment also has return */
        return "actual return";
        '''
        assert has_return_outside_function(source) is True

    def test_has_return_outside_function_nested_braces(self):
        """A top-level return after nested blocks and a nested function is detected."""
        source = '''
        if (true) {
            var obj = {
                method: function() {
                    return "nested";
                }
            };
        }
        return "outside";
        '''
        assert has_return_outside_function(source) is True

    def test_has_return_outside_function_arrow_function(self):
        """A return inside an arrow function body is not counted."""
        source = '''
        var func = () => {
            return "arrow";
        };
        func();
        '''
        assert has_return_outside_function(source) is False

    def test_extract_text_without_strip_without_separator(self):
        markup = (
            '<div>Hello <span> world </span>'
            '<script>alert(1)</script>'
            '<style>body { color: red; }</style>'
            '<template>hidden</template></div>'
        )
        assert extract_text_from_html(markup) == 'Hello  world '

    def test_extract_text_with_strip_without_separator(self):
        markup = (
            '<div>Hello <span> world </span>'
            '<script>alert(1)</script>'
            '<style>body { color: red; }</style>'
            '<template>hidden</template></div>'
        )
        assert extract_text_from_html(markup, strip=True) == 'Helloworld'

    def test_extract_text_without_strip_with_separator(self):
        markup = (
            '<div>Hello <span> world </span>'
            '<script>alert(1)</script>'
            '<style>body { color: red; }</style>'
            '<template>hidden</template></div>'
        )
        assert extract_text_from_html(markup, separator="/") == 'Hello / world '

    def test_extract_text_with_strip_with_separator(self):
        markup = (
            '<div>Hello <span> world </span>'
            '<script>alert(1)</script>'
            '<style>body { color: red; }</style>'
            '<template>hidden</template></div>'
        )
        assert extract_text_from_html(markup, strip=True, separator="/") == 'Hello/world'


================================================
FILE: tests/test_web_element.py
================================================
import asyncio
import json
from pathlib import Path
from unittest.mock import AsyncMock, patch

import pytest
import pytest_asyncio

from pydoll.browser.options import ChromiumOptions as Options
from pydoll.browser.chromium.chrome import Chrome
from pydoll.commands import DomCommands, RuntimeCommands
from pydoll.constants import Key
from pydoll.elements.web_element import WebElement
from pydoll.exceptions import (
    ElementNotAFileInput,
    ElementNotFound,
    ElementNotInteractable,
    ElementNotVisible,
    WaitElementTimeout,
)
from pydoll.protocol.input.types import KeyModifier
from pydoll.protocol.runtime.types import CallArgument


@pytest_asyncio.fixture
async def mock_connection_handler():
    """Yield a mocked connection handler whose ``execute_command`` is an AsyncMock.

    ``pydoll.connection.ConnectionHandler`` is patched with ``autospec=True``
    for as long as the consuming test runs; the yielded object is the patched
    class's ``return_value``.
    """
    patcher = patch('pydoll.connection.ConnectionHandler', autospec=True)
    with patcher as handler_cls:
        fake_handler = handler_cls.return_value
        fake_handler.execute_command = AsyncMock()
        yield fake_handler


@pytest.fixture
def web_element(mock_connection_handler):
    """Build a generic ``div`` WebElement located via the CSS selector ``#test``."""
    attribute_pairs = (
        ('id', 'test-id'),
        ('class', 'test-class'),
        ('value', 'test-value'),
        ('tag_name', 'div'),
        ('type', 'text'),
    )
    # WebElement receives a flat [name, value, name, value, ...] list.
    flat_attributes = [token for pair in attribute_pairs for token in pair]
    return WebElement(
        object_id='test-object-id',
        connection_handler=mock_connection_handler,
        method='css',
        selector='#test',
        attributes_list=flat_attributes,
    )


@pytest.fixture
def input_element(mock_connection_handler):
    """Build a text ``input`` WebElement with an initial value, for form tests."""
    attribute_pairs = (
        ('id', 'input-id'),
        ('tag_name', 'input'),
        ('type', 'text'),
        ('value', 'initial-value'),
    )
    # WebElement receives a flat [name, value, name, value, ...] list.
    flat_attributes = [token for pair in attribute_pairs for token in pair]
    return WebElement(
        object_id='input-object-id',
        connection_handler=mock_connection_handler,
        method='css',
        selector='input[type="text"]',
        attributes_list=flat_attributes,
    )


@pytest.fixture
def file_input_element(mock_connection_handler):
    """Build an ``input`` WebElement of type ``file``, for upload tests."""
    return WebElement(
        object_id='file-input-object-id',
        connection_handler=mock_connection_handler,
        method='css',
        selector='input[type="file"]',
        attributes_list=[
            'id',
            'file-input-id',
            'tag_name',
            'input',
            'type',
            'file',
        ],
    )


@pytest.fixture
def option_element(mock_connection_handler):
    """Build an ``option`` WebElement carrying a value, for dropdown tests."""
    return WebElement(
        object_id='option-object-id',
        connection_handler=mock_connection_handler,
        method='css',
        selector='option[value="option-value"]',
        attributes_list=[
            'tag_name',
            'option',
            'value',
            'option-value',
            'id',
            'option-id',
        ],
    )


@pytest.fixture
def disabled_element(mock_connection_handler):
    """Build a ``button`` WebElement that carries a ``disabled`` attribute."""
    return WebElement(
        object_id='disabled-object-id',
        connection_handler=mock_connection_handler,
        method='css',
        selector='button:disabled',
        attributes_list=[
            'id',
            'disabled-id',
            'tag_name',
            'button',
            'disabled',
            'true',
        ],
    )


@pytest.fixture
def iframe_element(mock_connection_handler):
    """Build an ``iframe`` WebElement with object id ``iframe-object-id``."""
    return WebElement(
        object_id='iframe-object-id',
        connection_handler=mock_connection_handler,
        method='css',
        selector='iframe#iframe-id',
        attributes_list=[
            'id',
            'iframe-id',
            'tag_name',
            'iframe',
        ],
    )


class TestWebElementInitialization:
    """Constructor behaviour: stored identifiers and parsing of the flat attribute list."""

    def test_web_element_initialization(self, web_element):
        """Constructor arguments from the fixture end up on the private fields."""
        expected_attributes = {
            'id': 'test-id',
            'class_name': 'test-class',
            'value': 'test-value',
            'tag_name': 'div',
            'type': 'text',
        }
        assert web_element._object_id == 'test-object-id'
        assert web_element._search_method == 'css'
        assert web_element._selector == '#test'
        assert web_element._attributes == expected_attributes

    def test_web_element_initialization_empty_attributes(self, mock_connection_handler):
        """An empty attribute list gives an empty mapping; method and selector default to None."""
        bare = WebElement(
            object_id='empty-id',
            connection_handler=mock_connection_handler,
            attributes_list=[],
        )
        assert bare._search_method is None
        assert bare._selector is None
        assert bare._attributes == {}

    def test_web_element_initialization_odd_attributes(self, mock_connection_handler):
        """A list with a dangling attribute name (no value) raises IndexError."""
        # 'class' has no matching value, so the name/value pairing runs off the end.
        unpaired = ['id', 'test-id', 'class']

        with pytest.raises(IndexError):
            WebElement(
                object_id='odd-id',
                connection_handler=mock_connection_handler,
                attributes_list=unpaired,
            )

    def test_class_attribute_renamed_to_class_name(self, mock_connection_handler):
        """The ``class`` attribute is stored under the key ``class_name``."""
        subject = WebElement(
            object_id='class-test',
            connection_handler=mock_connection_handler,
            attributes_list=['class', 'my-class', 'id', 'my-id'],
        )
        stored = subject._attributes
        assert 'class' not in stored
        assert stored['class_name'] == 'my-class'
        assert stored['id'] == 'my-id'


class TestWebElementProperties:
    """Exercise the attribute-backed and command-backed properties of WebElement."""

    def test_basic_properties(self, web_element):
        """Attribute-backed accessors expose the values given to the fixture."""
        assert web_element.id == 'test-id'
        assert web_element.class_name == 'test-class'
        assert web_element.tag_name == 'div'
        assert web_element.value == 'test-value'

    def test_is_iframe_property_with_iframe_tag(self, iframe_element):
        """An element tagged ``iframe`` reports ``is_iframe`` as True."""
        assert iframe_element.is_iframe is True

    def test_is_iframe_property_with_frame_tag(self, mock_connection_handler):
        """An element tagged ``frame`` (frameset frames) also reports ``is_iframe`` as True."""
        frame = WebElement(
            object_id='frame-object-id',
            connection_handler=mock_connection_handler,
            attributes_list=['tag_name', 'frame', 'id', 'my-frame'],
        )
        assert frame.is_iframe is True

    def test_is_iframe_property_with_regular_tag(self, web_element):
        """A ``div`` element reports ``is_iframe`` as False."""
        assert web_element.is_iframe is False

    def test_is_iframe_property_with_no_tag(self, mock_connection_handler):
        """Without any tag_name attribute, ``is_iframe`` is False."""
        tagless = WebElement(
            object_id='no-tag',
            connection_handler=mock_connection_handler,
            attributes_list=[],
        )
        assert tagless.is_iframe is False

    def test_is_enabled_property(self, web_element, disabled_element):
        """``is_enabled`` is False only for the element carrying ``disabled``."""
        assert disabled_element.is_enabled is False
        assert web_element.is_enabled is True

    def test_properties_with_none_values(self, mock_connection_handler):
        """Accessors return None when the backing attribute is absent."""
        blank = WebElement(
            object_id='empty-element',
            connection_handler=mock_connection_handler,
            attributes_list=[],
        )
        assert blank.id is None
        assert blank.class_name is None
        assert blank.tag_name is None
        assert blank.value is None
        # With no 'disabled' attribute the element counts as enabled.
        assert blank.is_enabled is True

    @pytest.mark.asyncio
    async def test_text_property(self, web_element):
        """``text`` is derived from the outerHTML returned by the connection."""
        execute = web_element._connection_handler.execute_command
        execute.return_value = {'result': {'outerHTML': '<div>Hello <span>World</span></div>'}}

        # The expected text carries no whitespace at the element boundary.
        assert await web_element.text == 'HelloWorld'

    @pytest.mark.asyncio
    async def test_text_property_with_nested_elements(self, web_element):
        """``text`` with several sibling inline elements in the markup."""
        markup = '<div>Text <b>Bold</b> <i>Italic</i> More text</div>'
        execute = web_element._connection_handler.execute_command
        execute.return_value = {'result': {'outerHTML': markup}}

        # Whitespace inside a chunk ('More text') is kept; boundary whitespace is not.
        assert await web_element.text == 'TextBoldItalicMore text'

    @pytest.mark.asyncio
    async def test_bounds_property(self, web_element):
        """``bounds`` returns the ``content`` list of the reported box model."""
        quad = [0, 0, 100, 100, 100, 100, 0, 100]
        execute = web_element._connection_handler.execute_command
        execute.return_value = {'result': {'model': {'content': quad}}}

        assert await web_element.bounds == quad

    @pytest.mark.asyncio
    async def test_inner_html_property(self, web_element):
        """``inner_html`` hands back the ``outerHTML`` value from the response."""
        markup = '<div class="test">Content</div>'
        execute = web_element._connection_handler.execute_command
        execute.return_value = {'result': {'outerHTML': markup}}

        assert await web_element.inner_html == markup

    @pytest.mark.asyncio
    async def test_iframe_context_non_iframe_returns_none(self, web_element):
        """A non-iframe element has no iframe context and issues no command."""
        context = await web_element.iframe_context
        assert context is None
        web_element._connection_handler.execute_command.assert_not_awaited()


class TestWebElementMethods:
    """Cover WebElement helpers: attribute lookup, bounds, scrolling and text entry."""

    def test_get_attribute(self, web_element):
        """Known attributes resolve to their values; unknown names give None."""
        for name, expected in (('id', 'test-id'), ('class_name', 'test-class')):
            assert web_element.get_attribute(name) == expected
        assert web_element.get_attribute('nonexistent') is None

    @pytest.mark.asyncio
    async def test_get_bounds_using_js(self, web_element):
        """The JSON string returned by the script is decoded into a dict."""
        js_rect = {'x': 10, 'y': 20, 'width': 100, 'height': 50}
        execute = web_element._connection_handler.execute_command
        execute.return_value = {'result': {'result': {'value': json.dumps(js_rect)}}}

        assert await web_element.get_bounds_using_js() == js_rect

    @pytest.mark.asyncio
    async def test_scroll_into_view(self, web_element):
        """``scroll_into_view`` issues exactly one command."""
        await web_element.scroll_into_view()
        execute = web_element._connection_handler.execute_command
        execute.assert_called_once()

    @pytest.mark.asyncio
    async def test_insert_text(self, input_element):
        """``insert_text`` issues exactly one command."""
        await input_element.insert_text('Hello World')

        execute = input_element._connection_handler.execute_command
        execute.assert_called_once()

    @pytest.mark.asyncio
    async def test_type_text(self, input_element):
        """Non-humanized typing: one click, then per-character commands and sleeps."""
        typed = 'Hi'
        input_element.click = AsyncMock()
        with patch('asyncio.sleep') as sleep_mock:
            await input_element.type_text(typed, humanize=False, interval=0.05)

        # Three commands are expected per typed character.
        execute = input_element._connection_handler.execute_command
        assert execute.call_count == 3 * len(typed)
        assert input_element.click.call_count == 1

        # One sleep per character, each using the requested interval.
        assert sleep_mock.call_count == len(typed)
        sleep_mock.assert_called_with(0.05)

    @pytest.mark.asyncio
    async def test_type_text_default_interval(self, input_element):
        """When no interval is passed, the sleep uses 0.05 seconds."""
        input_element.click = AsyncMock()
        with patch('asyncio.sleep') as sleep_mock:
            await input_element.type_text('A', humanize=False)

        sleep_mock.assert_called_with(0.05)
        assert input_element.click.call_count == 1

    @pytest.mark.asyncio
    async def test_clear(self, input_element):
        """A truthy script result clears the cached ``value`` attribute."""
        execute = input_element._connection_handler.execute_command
        execute.return_value = {'result': {'result': {'value': True}}}

        await input_element.clear()

        execute.assert_called_once()
        assert input_element._attributes['value'] == ''

    @pytest.mark.asyncio
    async def test_clear_not_interactable(self, input_element):
        """A falsy script result makes ``clear`` raise ElementNotInteractable."""
        execute = input_element._connection_handler.execute_command
        execute.return_value = {'result': {'result': {'value': False}}}

        with pytest.raises(ElementNotInteractable):
            await input_element.clear()


class TestWebElementIFrame:
    """Tests for iframe-specific WebElement behaviour.

    The class also hosts the ``get_parent_element`` tests, which run against
    the regular (non-iframe) ``web_element`` fixture.
    """

    @staticmethod
    def _iframe_describe_node_response():
        """Return a fresh DOM.describeNode payload describing the iframe element."""
        return {
            'result': {
                'node': {
                    'frameId': 'frame-123',
                    'contentDocument': {
                        'frameId': 'frame-123',
                        'documentURL': 'https://example.com/frame.html',
                        'baseURL': 'https://example.com/frame.html',
                    },
                }
            }
        }

    @staticmethod
    def _document_element_response():
        """Return a fresh Runtime.evaluate payload pointing at the iframe document object."""
        return {
            'result': {
                'result': {
                    'type': 'object',
                    'objectId': 'document-object-id',
                }
            }
        }

    @pytest.mark.asyncio
    async def test_iframe_context_initialization(self, iframe_element):
        """Iframe context should be created via CDP commands."""

        async def side_effect(command, timeout=60):
            # Route each mocked command by its method name.
            method = command['method']
            if method == 'DOM.describeNode':
                return self._iframe_describe_node_response()
            if method == 'Page.createIsolatedWorld':
                return {'result': {'executionContextId': 42}}
            if method == 'Runtime.evaluate':
                return self._document_element_response()
            raise AssertionError(f'Unexpected method {method}')

        iframe_element._connection_handler.execute_command.side_effect = side_effect

        ctx = await iframe_element.iframe_context
        assert ctx is not None
        assert ctx.frame_id == 'frame-123'
        assert ctx.document_url == 'https://example.com/frame.html'
        assert ctx.execution_context_id == 42
        assert ctx.document_object_id == 'document-object-id'

        # Subsequent access should re-resolve (no caching) to avoid stale contexts
        ctx2 = await iframe_element.iframe_context
        assert ctx2 is not ctx
        assert ctx2.frame_id == ctx.frame_id
        assert ctx2.execution_context_id == ctx.execution_context_id

    @pytest.mark.asyncio
    async def test_iframe_inner_html_uses_runtime_evaluate(self, iframe_element):
        """inner_html should read from iframe execution context."""

        async def side_effect(command, timeout=60):
            # Route each mocked command by its method name.
            method = command['method']
            if method == 'DOM.describeNode':
                return self._iframe_describe_node_response()
            if method == 'Page.createIsolatedWorld':
                return {'result': {'executionContextId': 77}}
            if method == 'Runtime.evaluate':
                expression = command['params']['expression']
                if expression == 'document.documentElement':
                    return self._document_element_response()
                if expression == 'document.documentElement.outerHTML':
                    # The HTML read must target the isolated world created above.
                    assert command['params']['contextId'] == 77
                    return {
                        'result': {
                            'result': {
                                'type': 'string',
                                'value': '<html>iframe content</html>',
                            }
                        }
                    }
                # Report the offending expression rather than falling through
                # to the generic "unexpected method" error below.
                raise AssertionError(f'Unexpected evaluate expression: {expression}')
            raise AssertionError(f'Unexpected method {method}')

        iframe_element._connection_handler.execute_command.side_effect = side_effect

        html = await iframe_element.inner_html
        assert html == '<html>iframe content</html>'

        methods = [
            call.args[0]['method']
            for call in iframe_element._connection_handler.execute_command.await_args_list
        ]
        assert methods.count('DOM.describeNode') == 1
        assert methods.count('Page.createIsolatedWorld') == 1
        # One evaluate resolves the document element, the other reads outerHTML.
        assert methods.count('Runtime.evaluate') == 2

    @pytest.mark.asyncio
    async def test_find_within_iframe_uses_document_context(self, iframe_element):
        """find() should query against the iframe's document element."""

        async def side_effect(command, timeout=60):
            # Route each mocked command by its method name.
            method = command['method']
            if method == 'DOM.describeNode':
                object_id = command['params'].get('objectId')
                if object_id == 'iframe-object-id':
                    return self._iframe_describe_node_response()
                if object_id == 'element-object-id':
                    # Description of the element found inside the iframe.
                    return {
                        'result': {
                            'node': {
                                'nodeName': 'DIV',
                                'attributes': ['id', 'child', 'data-test', 'value'],
                            }
                        }
                    }
                raise AssertionError('Unexpected objectId in describeNode')
            if method == 'Page.createIsolatedWorld':
                return {'result': {'executionContextId': 88}}
            if method == 'Runtime.evaluate':
                expression = command['params']['expression']
                if expression == 'document.documentElement':
                    return self._document_element_response()
                raise AssertionError(f'Unexpected evaluate expression: {expression}')
            if method == 'Runtime.callFunctionOn':
                assert command['params']['objectId'] == 'document-object-id'
                return {
                    'result': {
                        'result': {
                            'type': 'object',
                            'objectId': 'element-object-id',
                        }
                    }
                }
            raise AssertionError(f'Unexpected method {method}')

        iframe_element._connection_handler.execute_command.side_effect = side_effect

        result = await iframe_element.find(tag_name='div')

        assert isinstance(result, WebElement)
        assert result._object_id == 'element-object-id'

        runtime_calls = [
            call.args[0]
            for call in iframe_element._connection_handler.execute_command.await_args_list
            if call.args[0]['method'] == 'Runtime.callFunctionOn'
        ]
        assert runtime_calls, 'Runtime.callFunctionOn should be used for iframe queries'
        assert runtime_calls[0]['params']['objectId'] == 'document-object-id'

    @pytest.mark.asyncio
    async def test_get_parent_element_success(self, web_element):
        """Test successful parent element retrieval."""
        script_response = {'result': {'result': {'objectId': 'parent-object-id'}}}
        describe_response = {
            'result': {
                'node': {
                    'nodeName': 'DIV',
                    'attributes': ['id', 'parent-container', 'class', 'container'],
                }
            }
        }
        # Responses are consumed in call order.
        web_element._connection_handler.execute_command.side_effect = [
            script_response,  # Script execution
            describe_response,  # Describe node
        ]

        parent_element = await web_element.get_parent_element()

        assert isinstance(parent_element, WebElement)
        assert parent_element._object_id == 'parent-object-id'
        # nodeName is expected lower-cased under 'tag_name'; 'class' becomes 'class_name'.
        assert parent_element._attributes == {
            'id': 'parent-container',
            'class_name': 'container',
            'tag_name': 'div',
        }
        web_element._connection_handler.execute_command.assert_called()

    @pytest.mark.asyncio
    async def test_get_parent_element_not_found(self, web_element):
        """Test parent element not found raises ElementNotFound."""
        script_response = {'result': {'result': {}}}  # No objectId

        web_element._connection_handler.execute_command.return_value = script_response

        with pytest.raises(ElementNotFound, match='Parent element not found for element:'):
            await web_element.get_parent_element()

    @pytest.mark.asyncio
    async def test_get_parent_element_with_complex_attributes(self, web_element):
        """Test parent element with complex attribute list."""
        script_response = {'result': {'result': {'objectId': 'complex-parent-id'}}}

        describe_response = {
            'result': {
                'node': {
                    'nodeName': 'SECTION',
                    'attributes': [
                        'id',
                        'main-section',
                        'class',
                        'content-wrapper',
                        'data-testid',
                        'parent-element',
                        'aria-label',
                        'Main content area',
                    ],
                }
            }
        }

        # Responses are consumed in call order: script result, then describeNode.
        web_element._connection_handler.execute_command.side_effect = [
            script_response,
            describe_response,
        ]

        parent_element = await web_element.get_parent_element()

        assert isinstance(parent_element, WebElement)
        assert parent_element._object_id == 'complex-parent-id'
        assert parent_element._attributes == {
            'id': 'main-section',
            'class_name': 'content-wrapper',
            'data-testid': 'parent-element',
            'aria-label': 'Main content area',
            'tag_name': 'section',
        }

    @pytest.mark.asyncio
    async def test_get_parent_element_root_element(self, web_element):
        """Test getting parent of root element (should return document body)."""
        script_response = {'result': {'result': {'objectId': 'body-object-id'}}}

        describe_response = {
            'result': {'node': {'nodeName': 'BODY', 'attributes': ['class', 'page-body']}}
        }

        # Responses are consumed in call order: script result, then describeNode.
        web_element._connection_handler.execute_command.side_effect = [
            script_response,
            describe_response,
        ]

        parent_element = await web_element.get_parent_element()

        assert isinstance(parent_element, WebElement)
        assert parent_element._object_id == 'body-object-id'
        assert parent_element._attributes == {'class_name': 'page-body', 'tag_name': 'body'}


class TestWebElementKeyboardInteraction:
    """Verify the key_down, key_up and press_keyboard_key helpers."""

    @pytest.mark.asyncio
    async def test_key_down(self, web_element):
        """``key_down`` with a modifier issues exactly one command."""
        await web_element.key_down(Key.ENTER, KeyModifier.CTRL)

        execute = web_element._connection_handler.execute_command
        execute.assert_called_once()

    @pytest.mark.asyncio
    async def test_key_down_without_modifiers(self, web_element):
        """``key_down`` without modifiers issues exactly one command."""
        await web_element.key_down(Key.TAB)

        execute = web_element._connection_handler.execute_command
        execute.assert_called_once()

    @pytest.mark.asyncio
    async def test_key_up(self, web_element):
        """``key_up`` issues exactly one command."""
        await web_element.key_up(Key.ESCAPE)

        execute = web_element._connection_handler.execute_command
        execute.assert_called_once()

    @pytest.mark.asyncio
    async def test_press_keyboard_key(self, web_element):
        """A key press is two commands with one sleep of ``interval`` seconds."""
        with patch('asyncio.sleep') as sleep_mock:
            await web_element.press_keyboard_key(Key.SPACE, KeyModifier.SHIFT, interval=0.05)

        # Two commands are expected: key down followed by key up.
        execute = web_element._connection_handler.execute_command
        assert execute.call_count == 2
        sleep_mock.assert_called_once_with(0.05)

    @pytest.mark.asyncio
    async def test_press_keyboard_key_default_interval(self, web_element):
        """Without an explicit interval the single sleep lasts 0.1 seconds."""
        with patch('asyncio.sleep') as sleep_mock:
            await web_element.press_keyboard_key(Key.ENTER)

        sleep_mock.assert_called_once_with(0.1)


class TestWebElementClicking:
    """Test clicking methods and behaviors.

    Covers ``click_using_js`` (script-driven) and ``click`` (mouse events built
    from the element bounds), including the ``option`` element special case.
    """

    @pytest.mark.asyncio
    async def test_click_using_js_success(self, web_element):
        """Test successful JavaScript click."""
        # Mock element visibility and click success
        web_element.is_visible = AsyncMock(return_value=True)
        web_element.scroll_into_view = AsyncMock()
        web_element.execute_script = AsyncMock(return_value={'result': {'result': {'value': True}}})

        await web_element.click_using_js()

        web_element.scroll_into_view.assert_called_once()
        web_element.is_visible.assert_called_once()

    @pytest.mark.asyncio
    async def test_click_using_js_not_visible(self, web_element):
        """Test JavaScript click when element is not visible."""
        web_element.is_visible = AsyncMock(return_value=False)
        web_element.scroll_into_view = AsyncMock()

        with pytest.raises(ElementNotVisible):
            await web_element.click_using_js()

    @pytest.mark.asyncio
    async def test_click_using_js_not_interactable(self, web_element):
        """Test JavaScript click when element is not interactable."""
        web_element.is_visible = AsyncMock(return_value=True)
        web_element.scroll_into_view = AsyncMock()
        # A falsy script result signals that the click did not go through.
        web_element.execute_script = AsyncMock(
            return_value={'result': {'result': {'value': False}}}
        )

        with pytest.raises(ElementNotInteractable):
            await web_element.click_using_js()

    @pytest.mark.asyncio
    async def test_click_using_js_option_element(self, option_element):
        """Test JavaScript click on option element uses specialized method."""
        option_element._click_option_tag = AsyncMock()

        await option_element.click_using_js()

        option_element._click_option_tag.assert_called_once()

    @pytest.mark.asyncio
    async def test_click_success(self, web_element):
        """Test successful mouse click."""
        bounds = [0, 0, 100, 0, 100, 100, 0, 100]  # Rectangle coordinates
        web_element.is_visible = AsyncMock(return_value=True)
        web_element.scroll_into_view = AsyncMock()
        # Responses are consumed in call order.
        web_element._connection_handler.execute_command.side_effect = [
            {'result': {'model': {'content': bounds}}},  # bounds
            None,  # mouse press
            None,  # mouse release
        ]

        with patch('asyncio.sleep') as mock_sleep:
            await web_element.click(x_offset=5, y_offset=10, hold_time=0.2)

        # Three commands: bounds lookup, mouse press and mouse release
        assert web_element._connection_handler.execute_command.call_count == 3
        # The press is held for hold_time before the release
        mock_sleep.assert_called_once_with(0.2)

    @pytest.mark.asyncio
    async def test_click_not_visible(self, web_element):
        """Test click when element is not visible."""
        web_element.is_visible = AsyncMock(return_value=False)

        with pytest.raises(ElementNotVisible):
            await web_element.click()

    @pytest.mark.asyncio
    async def test_click_option_element(self, option_element):
        """Test click on option element uses specialized method."""
        option_element._click_option_tag = AsyncMock()

        await option_element.click()

        option_element._click_option_tag.assert_called_once()

    @pytest.mark.asyncio
    async def test_click_bounds_fallback_to_js(self, web_element):
        """Test click falls back to JS bounds when CDP bounds fail."""
        web_element.is_visible = AsyncMock(return_value=True)
        web_element.scroll_into_view = AsyncMock()

        # First call (bounds) raises KeyError, second call (JS bounds) succeeds
        js_bounds = {'x': 10, 'y': 20, 'width': 100, 'height': 50}
        web_element._connection_handler.execute_command.side_effect = [
            {'result': {'model': {'invalid_key': []}}},  # bounds with KeyError
            {'result': {'result': {'value': json.dumps(js_bounds)}}},  # JS bounds
            None,  # mouse press
            None,  # mouse release
        ]

        # Patch the hold-time sleep, as test_click_success does, so the test
        # does not actually wait between press and release.
        with patch('asyncio.sleep'):
            await web_element.click()

        # Should call bounds, JS bounds, mouse press, and mouse release
        assert web_element._connection_handler.execute_command.call_count == 4

    @pytest.mark.asyncio
    async def test_click_option_tag_method(self, option_element):
        """Test _click_option_tag method."""
        await option_element._click_option_tag()

        # A single command is expected for the option selection
        option_element._connection_handler.execute_command.assert_called_once()


class TestWebElementHumanizedClick:
    """Check which click path WebElement.click() takes: the Mouse API or raw CDP events."""

    @staticmethod
    def _box_model_reply():
        """Return a fresh bounds reply whose quad is (0,0), (100,0), (100,100), (0,100)."""
        quad = [0, 0, 100, 0, 100, 100, 0, 100]
        return {'result': {'model': {'content': quad}}}

    @staticmethod
    def _stub_visibility(element):
        """Make the element report itself visible and replace scrolling with a mock."""
        element.is_visible = AsyncMock(return_value=True)
        element.scroll_into_view = AsyncMock()

    @classmethod
    def _queue_raw_click(cls, element):
        """Queue the three replies consumed by a raw CDP click: bounds, press, release."""
        element._connection_handler.execute_command.side_effect = [
            cls._box_model_reply(),
            None,  # mouse press
            None,  # mouse release
        ]

    @pytest.fixture
    def mouse_mock(self):
        """Provide a mouse double whose click() is an AsyncMock."""
        mouse = AsyncMock()
        mouse.click = AsyncMock()
        return mouse

    @pytest.fixture
    def element_with_mouse(self, mock_connection_handler, mouse_mock):
        """Provide a button-like WebElement constructed with the mouse double."""
        return WebElement(
            object_id='obj-1',
            connection_handler=mock_connection_handler,
            method='css',
            selector='#btn-1',
            attributes_list=['id', 'btn-1', 'tag_name', 'button'],
            mouse=mouse_mock,
        )

    @pytest.mark.asyncio
    async def test_click_humanized_uses_mouse(self, element_with_mouse, mouse_mock):
        """With humanize=True and a mouse set, mouse.click() receives the quad center."""
        self._stub_visibility(element_with_mouse)
        handler = element_with_mouse._connection_handler
        handler.execute_command.return_value = self._box_model_reply()

        await element_with_mouse.click(humanize=True)

        mouse_mock.click.assert_called_once_with(50.0, 50.0)

    @pytest.mark.asyncio
    async def test_click_humanized_with_offset(self, element_with_mouse, mouse_mock):
        """x/y offsets are added to the center before mouse.click() is called."""
        self._stub_visibility(element_with_mouse)
        handler = element_with_mouse._connection_handler
        handler.execute_command.return_value = self._box_model_reply()

        await element_with_mouse.click(x_offset=10, y_offset=20, humanize=True)

        mouse_mock.click.assert_called_once_with(60.0, 70.0)

    @pytest.mark.asyncio
    async def test_click_humanize_false_uses_raw_cdp(self, element_with_mouse, mouse_mock):
        """humanize=False sends raw CDP events even though a mouse is available."""
        self._stub_visibility(element_with_mouse)
        self._queue_raw_click(element_with_mouse)

        with patch('asyncio.sleep'):
            await element_with_mouse.click(humanize=False)

        mouse_mock.click.assert_not_called()
        assert element_with_mouse._connection_handler.execute_command.call_count == 3

    @pytest.mark.asyncio
    async def test_click_no_mouse_falls_through(self, web_element):
        """An element whose _mouse is None clicks through the raw CDP path."""
        assert web_element._mouse is None
        self._stub_visibility(web_element)
        self._queue_raw_click(web_element)

        with patch('asyncio.sleep'):
            await web_element.click()

        assert web_element._connection_handler.execute_command.call_count == 3

    @pytest.mark.asyncio
    async def test_click_humanized_iframe_element_skips_mouse(
        self, element_with_mouse, mouse_mock
    ):
        """An element carrying an iframe context uses raw CDP even when humanize=True."""
        from pydoll.interactions.iframe import IFrameContext

        self._stub_visibility(element_with_mouse)
        element_with_mouse._iframe_context = IFrameContext(frame_id='frame-123')
        self._queue_raw_click(element_with_mouse)

        with patch('asyncio.sleep'):
            await element_with_mouse.click(humanize=True)

        mouse_mock.click.assert_not_called()
        assert element_with_mouse._connection_handler.execute_command.call_count == 3

    @pytest.mark.asyncio
    async def test_click_option_element_skips_mouse(self, mouse_mock, mock_connection_handler):
        """Option elements go through _click_option_tag and never touch the mouse."""
        option = WebElement(
            object_id='opt-obj',
            connection_handler=mock_connection_handler,
            attributes_list=['tag_name', 'option', 'value', 'opt-1'],
            mouse=mouse_mock,
        )
        option._click_option_tag = AsyncMock()

        await option.click()

        option._click_option_tag.assert_called_once()
        mouse_mock.click.assert_not_called()


class TestWebElementFileInput:
    """Cover WebElement.set_input_files() on file inputs and on unsuitable elements."""

    @pytest.mark.asyncio
    async def test_set_input_files_success(self, file_input_element):
        """A file input forwards the paths with exactly one command."""
        paths = ['/path/to/file1.txt', '/path/to/file2.pdf']

        await file_input_element.set_input_files(paths)

        handler = file_input_element._connection_handler
        handler.execute_command.assert_called_once()

    @pytest.mark.asyncio
    async def test_set_input_files_not_file_input(self, web_element):
        """The generic web_element fixture is rejected with ElementNotAFileInput."""
        paths = ['/path/to/file.txt']

        with pytest.raises(ElementNotAFileInput):
            await web_element.set_input_files(paths)

    @pytest.mark.asyncio
    async def test_set_input_files_input_but_wrong_type(self, input_element):
        """The input_element fixture (not a file input) is rejected as well."""
        paths = ['/path/to/file.txt']

        with pytest.raises(ElementNotAFileInput):
            await input_element.set_input_files(paths)


class TestWebElementScreenshot:
    """Cover WebElement.take_screenshot(): file output, base64 output and a missing path."""

    # Base64 payload returned by the mocked capture command in every test below.
    _IMAGE_B64 = 'iVBORw0KGgoAAAANSUhEUgAAAAEAAAABCAQAAAC1HAwCAAAAC0lEQVR42mP8/wcAAgAB/edzE+oAAAAASUVORK5CYII='

    @classmethod
    def _queue_replies(cls, element, rect):
        """Queue the two replies a screenshot consumes: JS bounds, then the capture data."""
        element._connection_handler.execute_command.side_effect = [
            {'result': {'result': {'value': json.dumps(rect)}}},  # get_bounds_using_js
            {'result': {'data': cls._IMAGE_B64}},  # capture_screenshot
        ]

    @staticmethod
    async def _capture_to_file(element, destination, **options):
        """Call take_screenshot() with aiofiles.open patched to an async context manager."""
        fake_file = AsyncMock()
        fake_file.write = AsyncMock()

        with patch('aiofiles.open') as open_stub:
            open_stub.return_value.__aenter__.return_value = fake_file
            await element.take_screenshot(str(destination), **options)

    @pytest.mark.asyncio
    async def test_take_screenshot_success(self, web_element, tmp_path):
        """Saving to a .jpeg path with an explicit quality issues two commands."""
        self._queue_replies(web_element, {'x': 10, 'y': 20, 'width': 100, 'height': 50})

        await self._capture_to_file(web_element, tmp_path / 'element.jpeg', quality=90)

        # get_bounds_using_js + capture_screenshot
        assert web_element._connection_handler.execute_command.call_count == 2

    @pytest.mark.asyncio
    async def test_take_screenshot_default_quality(self, web_element, tmp_path):
        """Saving without a quality argument issues the same two commands."""
        self._queue_replies(web_element, {'x': 0, 'y': 0, 'width': 50, 'height': 50})

        await self._capture_to_file(web_element, tmp_path / 'element_default.jpeg')

        # get_bounds_using_js + capture_screenshot
        assert web_element._connection_handler.execute_command.call_count == 2

    @pytest.mark.asyncio
    async def test_take_screenshot_as_base64(self, web_element):
        """as_base64=True returns the capture payload unchanged."""
        self._queue_replies(web_element, {'x': 10, 'y': 20, 'width': 100, 'height': 50})

        encoded = await web_element.take_screenshot(as_base64=True)

        assert encoded == self._IMAGE_B64
        # get_bounds_using_js + capture_screenshot
        assert web_element._connection_handler.execute_command.call_count == 2

    @pytest.mark.asyncio
    async def test_take_screenshot_missing_path_without_base64(self, web_element):
        """Neither a path nor as_base64=True raises MissingScreenshotPath."""
        from pydoll.exceptions import MissingScreenshotPath

        with pytest.raises(MissingScreenshotPath):
            await web_element.take_screenshot(as_base64=False)

    @pytest.mark.asyncio
    async def test_take_screenshot_jpg_alias(self, web_element, tmp_path):
        """A .jpg destination is accepted just like .jpeg."""
        self._queue_replies(web_element, {'x': 10, 'y': 20, 'width': 100, 'height': 50})

        await self._capture_to_file(web_element, tmp_path / 'element.jpg', quality=90)

        # Reaching this point means no InvalidFileExtension was raised.
        assert web_element._connection_handler.execute_command.call_count == 2


class TestWebElementVisibility:
    """Cover is_visible(), is_on_top() and is_interactable() with execute_script mocked."""

    @staticmethod
    def _stub_script_value(element, flag):
        """Make execute_script resolve to a reply whose value is ``flag``."""
        reply = {'result': {'result': {'value': flag}}}
        element.execute_script = AsyncMock(return_value=reply)

    @pytest.mark.asyncio
    async def test_is_element_visible_true(self, web_element):
        """is_visible() returns True when the script value is True."""
        self._stub_script_value(web_element, True)

        outcome = await web_element.is_visible()
        assert outcome is True

    @pytest.mark.asyncio
    async def test_is_element_visible_false(self, web_element):
        """is_visible() returns False when the script value is False."""
        self._stub_script_value(web_element, False)

        outcome = await web_element.is_visible()
        assert outcome is False

    @pytest.mark.asyncio
    async def test_is_element_on_top_true(self, web_element):
        """is_on_top() returns True when the script value is True."""
        self._stub_script_value(web_element, True)

        outcome = await web_element.is_on_top()
        assert outcome is True

    @pytest.mark.asyncio
    async def test_is_element_on_top_false(self, web_element):
        """is_on_top() returns False when the script value is False."""
        self._stub_script_value(web_element, False)

        outcome = await web_element.is_on_top()
        assert outcome is False

    @pytest.mark.asyncio
    async def test_is_element_interactable_true(self, web_element):
        """is_interactable() returns True when the script value is True."""
        self._stub_script_value(web_element, True)

        outcome = await web_element.is_interactable()
        assert outcome is True

    @pytest.mark.asyncio
    async def test_is_element_interactable_false(self, web_element):
        """is_interactable() returns False when the script value is False."""
        self._stub_script_value(web_element, False)

        outcome = await web_element.is_interactable()
        assert outcome is False


class TestWebElementWaitUntil:
    """Cover WebElement.wait_until() with the loop clock and asyncio.sleep mocked."""

    @pytest.mark.asyncio
    async def test_wait_until_visible_success(self, web_element):
        """wait_until returns once is_visible goes from False to True."""
        visibility = AsyncMock(side_effect=[False, True])
        web_element.is_visible = visibility

        with patch('asyncio.sleep') as sleep_stub, patch('asyncio.get_event_loop') as loop_stub:
            loop_stub.return_value.time.side_effect = [0, 0.5]

            await web_element.wait_until(is_visible=True, timeout=2)

        assert web_element.is_visible.call_count == 2
        sleep_stub.assert_called_once_with(0.5)

    @pytest.mark.asyncio
    async def test_wait_until_visible_timeout(self, web_element):
        """WaitElementTimeout is raised when the element never becomes visible."""
        web_element.is_visible = AsyncMock(return_value=False)

        with patch('asyncio.sleep') as sleep_stub, patch('asyncio.get_event_loop') as loop_stub:
            # The mocked clock passes the 2 second timeout on its last reading.
            loop_stub.return_value.time.side_effect = [0, 0.5, 1.0, 1.5, 2.1]

            with pytest.raises(WaitElementTimeout, match='element to become visible'):
                await web_element.wait_until(is_visible=True, timeout=2)

        assert sleep_stub.call_count == 3

    @pytest.mark.asyncio
    async def test_wait_until_interactable_success(self, web_element):
        """wait_until returns after a single check when already interactable."""
        interactable = AsyncMock(return_value=True)
        web_element.is_interactable = interactable

        await web_element.wait_until(is_interactable=True, timeout=1)

        web_element.is_interactable.assert_called_once()

    @pytest.mark.asyncio
    async def test_wait_until_interactable_timeout(self, web_element):
        """WaitElementTimeout is raised when the element never becomes interactable."""
        web_element.is_interactable = AsyncMock(return_value=False)

        with patch('asyncio.sleep') as sleep_stub, patch('asyncio.get_event_loop') as loop_stub:
            loop_stub.return_value.time.side_effect = [0, 0.5, 1.1]

            with pytest.raises(WaitElementTimeout, match='element to become interactable'):
                await web_element.wait_until(is_interactable=True, timeout=1)

        sleep_stub.assert_called_once_with(0.5)

    @pytest.mark.asyncio
    async def test_wait_until_visible_and_interactable(self, web_element):
        """With both flags set, both checks are polled until both report True."""
        web_element.is_visible = AsyncMock(side_effect=[False, True])
        web_element.is_interactable = AsyncMock(side_effect=[False, True])

        with patch('asyncio.sleep') as sleep_stub, patch('asyncio.get_event_loop') as loop_stub:
            loop_stub.return_value.time.side_effect = [0, 0.5, 1.0]

            await web_element.wait_until(is_visible=True, is_interactable=True, timeout=2)

        assert web_element.is_visible.call_count == 2
        assert web_element.is_interactable.call_count == 2
        sleep_stub.assert_called_once_with(0.5)

    @pytest.mark.asyncio
    async def test_wait_until_no_conditions(self, web_element):
        """Calling wait_until() without any condition raises ValueError."""
        with pytest.raises(ValueError):
            await web_element.wait_until()


class TestWebElementUtilityMethods:
    """Cover small WebElement helpers: center math, option detection, attribute parsing."""

    def test_calculate_center(self):
        """The center of the quad (0,0), (100,0), (100,100), (0,100) is (50, 50)."""
        square = [0, 0, 100, 0, 100, 100, 0, 100]
        center_x, center_y = WebElement._calculate_center(square)
        assert center_x == 50
        assert center_y == 50

    def test_calculate_center_irregular_shape(self):
        """For three points the expected center is the mean of the x and of the y values."""
        triangle = [0, 0, 50, 0, 25, 50]
        center_x, center_y = WebElement._calculate_center(triangle)
        # x: (0 + 50 + 25) / 3, y: (0 + 0 + 50) / 3
        assert center_x == 25
        assert center_y == pytest.approx(16.67, rel=1e-2)

    def test_is_option_tag_true(self, option_element):
        """_is_option_tag() is True for the option fixture."""
        verdict = option_element._is_option_tag()
        assert verdict is True

    def test_is_option_tag_false(self, web_element):
        """_is_option_tag() is False for the generic element fixture."""
        verdict = web_element._is_option_tag()
        assert verdict is False

    def test_def_attributes_empty_list(self, mock_connection_handler):
        """An empty attributes_list produces an empty _attributes dict."""
        bare = WebElement(
            object_id='test',
            connection_handler=mock_connection_handler,
            attributes_list=[],
        )
        assert bare._attributes == {}

    def test_def_attributes_class_rename(self, mock_connection_handler):
        """The 'class' attribute is stored under the key 'class_name'."""
        styled = WebElement(
            object_id='test',
            connection_handler=mock_connection_handler,
            attributes_list=['class', 'my-class', 'id', 'my-id'],
        )
        assert styled._attributes == {'class_name': 'my-class', 'id': 'my-id'}

    @pytest.mark.asyncio
    async def test_execute_script_basic(self, web_element):
        """A bare statement is wrapped in function(){ ... } and sent via callFunctionOn."""
        reply = {'result': {'result': {'value': 'DIV'}}}
        handler = web_element._connection_handler
        handler.execute_command.return_value = reply

        outcome = await web_element.execute_script('return this.tagName;', return_by_value=True)

        assert outcome == reply
        wanted = RuntimeCommands.call_function_on(
            object_id='test-object-id',
            function_declaration='function(){ return this.tagName; }',
            return_by_value=True,
        )
        handler.execute_command.assert_called_once_with(wanted, timeout=60)

class TestBuildTextExpression:
    """Unit tests for FindElementsMixin._build_text_expression."""

    @staticmethod
    def _build(selector, method):
        """Import the mixin lazily and build the expression for ``selector``/``method``."""
        from pydoll.elements.mixins import FindElementsMixin

        return FindElementsMixin._build_text_expression(selector, method)

    def test_build_text_expression_with_xpath(self):
        """An xpath selector yields a string using FIRST_ORDERED_NODE_TYPE and the xpath."""
        expression = self._build('//p[@id="x"]', 'xpath')
        assert isinstance(expression, str)
        assert 'XPathResult.FIRST_ORDERED_NODE_TYPE' in expression
        assert '@id' in expression
        assert 'p' in expression

    def test_build_text_expression_with_name(self):
        """A name lookup is expressed as an xpath on the @name attribute."""
        expression = self._build('fieldName', 'name')
        assert isinstance(expression, str)
        assert '//*[@name="fieldName"]' in expression

    def test_build_text_expression_with_id_css(self):
        """An id lookup uses document.querySelector with a '#' selector."""
        expression = self._build('main', 'id')
        assert 'document.querySelector' in expression
        assert '#main' in expression

    def test_build_text_expression_with_class_css(self):
        """A class_name lookup uses document.querySelector with a '.' selector."""
        expression = self._build('item', 'class_name')
        assert 'document.querySelector' in expression
        assert '.item' in expression

    def test_build_text_expression_with_tag_css(self):
        """A tag_name lookup uses document.querySelector with the tag itself."""
        expression = self._build('button', 'tag_name')
        assert 'document.querySelector' in expression
        assert 'button' in expression

class TestIsOptionElementHeuristics:
    """Unit tests for WebElement._is_option_element heuristics.

    The class also holds the execute_script() wrapping tests and the __repr__ test.
    """

    @staticmethod
    def _assert_sent_once(element, expected_command):
        """Assert the handler received exactly ``expected_command`` with timeout=60."""
        element._connection_handler.execute_command.assert_called_once_with(
            expected_command, timeout=60
        )

    @pytest.mark.asyncio
    async def test_is_option_element_by_tag_attribute(self, option_element):
        """The option fixture is recognised as an option element."""
        assert await option_element._is_option_element() is True

    @pytest.mark.asyncio
    async def test_is_option_element_by_method_and_selector_tag_name(
        self, mock_connection_handler
    ):
        """method='tag_name' with selector 'option' is recognised without attributes."""
        candidate = WebElement(
            'dummy',
            mock_connection_handler,
            method='tag_name',
            selector='option',
            attributes_list=[],
        )
        assert await candidate._is_option_element() is True

    @pytest.mark.asyncio
    async def test_is_option_element_by_xpath_selector_contains_option(
        self, mock_connection_handler
    ):
        """An xpath selector naming OPTION in upper case is recognised as well."""
        candidate = WebElement(
            'dummy',
            mock_connection_handler,
            method='xpath',
            selector='//OPTION[@value="x"]',
            attributes_list=[],
        )
        assert await candidate._is_option_element() is True

    @pytest.mark.asyncio
    async def test_execute_script_with_this_syntax(self, web_element):
        """A bare statement using 'this' is wrapped in function(){ ... }."""
        reply = {'result': {'result': {'value': None}}}
        web_element._connection_handler.execute_command.return_value = reply

        outcome = await web_element.execute_script('this.style.border = "2px solid red"')

        assert outcome == reply
        wanted = RuntimeCommands.call_function_on(
            object_id='test-object-id',
            function_declaration='function(){ this.style.border = "2px solid red" }',
        )
        self._assert_sent_once(web_element, wanted)

    @pytest.mark.asyncio
    async def test_execute_script_already_function(self, web_element):
        """A script that already is a function declaration is sent unchanged."""
        declaration = 'function() { this.style.border = "2px solid red"; }'
        reply = {'result': {'result': {'value': None}}}
        web_element._connection_handler.execute_command.return_value = reply

        outcome = await web_element.execute_script(declaration)

        assert outcome == reply
        wanted = RuntimeCommands.call_function_on(
            object_id='test-object-id',
            function_declaration='function() { this.style.border = "2px solid red"; }',
        )
        self._assert_sent_once(web_element, wanted)

    @pytest.mark.asyncio
    async def test_execute_script_with_parameters(self, web_element):
        """return_by_value and user_gesture are forwarded to the command."""
        reply = {'result': {'result': {'value': 'test'}}}
        web_element._connection_handler.execute_command.return_value = reply

        outcome = await web_element.execute_script(
            'this.value = "test"', return_by_value=True, user_gesture=True
        )

        assert outcome == reply
        wanted = RuntimeCommands.call_function_on(
            object_id='test-object-id',
            function_declaration='function(){ this.value = "test" }',
            return_by_value=True,
            user_gesture=True,
        )
        self._assert_sent_once(web_element, wanted)

    @pytest.mark.asyncio
    async def test_execute_script_arrow_function(self, web_element):
        """An arrow function is sent unchanged."""
        arrow = '() => { this.style.color = "red"; }'
        reply = {'result': {'result': {'value': None}}}
        web_element._connection_handler.execute_command.return_value = reply

        outcome = await web_element.execute_script(arrow)

        assert outcome == reply
        wanted = RuntimeCommands.call_function_on(
            object_id='test-object-id',
            function_declaration='() => { this.style.color = "red"; }',
        )
        self._assert_sent_once(web_element, wanted)

    @pytest.mark.asyncio
    async def test_execute_script_multiline(self, web_element):
        """A multiline script is wrapped and every statement survives in the declaration."""
        script = '''
            this.style.padding = "10px";
            this.style.margin = "5px";
            this.style.borderRadius = "8px";
        '''
        reply = {'result': {'result': {'value': None}}}
        web_element._connection_handler.execute_command.return_value = reply

        outcome = await web_element.execute_script(script)

        assert outcome == reply
        web_element._connection_handler.execute_command.assert_called_once()
        sent = web_element._connection_handler.execute_command.call_args[0][0]

        assert sent['method'].value == 'Runtime.callFunctionOn'
        assert sent['params']['objectId'] == 'test-object-id'

        declaration = sent['params']['functionDeclaration']
        assert 'function(){' in declaration
        assert 'this.style.padding = "10px"' in declaration
        assert 'this.style.margin = "5px"' in declaration
        assert 'this.style.borderRadius = "8px"' in declaration

    @pytest.mark.asyncio
    async def test_execute_script_with_arguments(self, web_element):
        """Call arguments are forwarded to the command untouched."""
        call_arguments = [CallArgument(value="test_value")]
        reply = {'result': {'result': {'value': None}}}
        web_element._connection_handler.execute_command.return_value = reply

        outcome = await web_element.execute_script(
            'this.value = arguments[0];', arguments=call_arguments
        )

        assert outcome == reply
        wanted = RuntimeCommands.call_function_on(
            object_id='test-object-id',
            function_declaration='function(){ this.value = arguments[0]; }',
            arguments=call_arguments,
        )
        self._assert_sent_once(web_element, wanted)

    @pytest.mark.asyncio
    async def test_execute_script_all_parameters(self, web_element):
        """Every optional keyword is forwarded to RuntimeCommands.call_function_on."""
        options = dict(
            silent=True,
            return_by_value=True,
            generate_preview=True,
            user_gesture=True,
            await_promise=True,
            execution_context_id=123,
            object_group="test_group",
            throw_on_side_effect=True,
            unique_context_id="unique_123",
        )
        reply = {'result': {'result': {'value': None}}}
        web_element._connection_handler.execute_command.return_value = reply

        outcome = await web_element.execute_script('this.click()', **options)

        assert outcome == reply
        wanted = RuntimeCommands.call_function_on(
            object_id='test-object-id',
            function_declaration='function(){ this.click() }',
            **options,
        )
        self._assert_sent_once(web_element, wanted)

    def test_repr(self, web_element):
        """repr() mentions the class name, the object id and the parsed attributes."""
        rendered = repr(web_element)
        for fragment in (
            'WebElement',
            'test-object-id',
            "id='test-id'",
            "class_name='test-class'",
        ):
            assert fragment in rendered


class TestWebElementFindMethods:
    """Test element finding methods from FindElementsMixin.

    Every test drives ``find()`` / ``query()`` on the ``web_element`` fixture and
    feeds canned replies through the mocked ``execute_command``.
    """

    @pytest.mark.asyncio
    async def test_find_element_success(self, web_element):
        """Test successful element finding."""
        node_response = {'result': {'result': {'objectId': 'found-element-id'}}}
        describe_response = {
            'result': {'node': {'nodeName': 'BUTTON', 'attributes': ['class', 'btn']}}
        }

        # Replies are consumed in order: the lookup first, then the node description.
        web_element._connection_handler.execute_command.side_effect = [
            node_response,
            describe_response,
        ]

        element = await web_element.find(id='button-id')

        assert isinstance(element, WebElement)
        assert element._object_id == 'found-element-id'
        assert element._attributes['class_name'] == 'btn'

    @pytest.mark.asyncio
    async def test_find_element_not_found_with_exception(self, web_element):
        """Test element not found raises exception."""
        web_element._connection_handler.execute_command.return_value = {'result': {'result': {}}}

        with pytest.raises(ElementNotFound):
            await web_element.find(id='nonexistent')

    @pytest.mark.asyncio
    async def test_find_element_not_found_no_exception(self, web_element):
        """Test element not found returns None when raise_exc=False."""
        web_element._connection_handler.execute_command.return_value = {'result': {'result': {}}}

        result = await web_element.find(id='nonexistent', raise_exc=False)
        assert result is None

    @pytest.mark.asyncio
    async def test_find_elements_success(self, web_element):
        """Test successful multiple elements finding."""
        find_response = {'result': {'result': {'objectId': 'parent-id'}}}
        properties_response = {
            'result': {
                'result': [
                    {'name': '0', 'value': {'type': 'object', 'objectId': 'child-1'}},
                    {'name': '1', 'value': {'type': 'object', 'objectId': 'child-2'}},
                ]
            }
        }
        describe_response = {
            'result': {'node': {'nodeName': 'LI', 'attributes': ['class', 'item']}}
        }

        # One describe reply is queued per child listed in the properties reply.
        web_element._connection_handler.execute_command.side_effect = [
            find_response,
            properties_response,
            describe_response,
            describe_response,
        ]

        elements = await web_element.find(class_name='item', find_all=True)

        assert len(elements) == 2
        assert all(isinstance(elem, WebElement) for elem in elements)
        assert elements[0]._object_id == 'child-1'
        assert elements[1]._object_id == 'child-2'

    @pytest.mark.asyncio
    async def test_find_with_timeout_success(self, web_element):
        """Test find with timeout succeeds on retry."""
        node_response = {'result': {'result': {'objectId': 'delayed-element'}}}
        describe_response = {'result': {'node': {'nodeName': 'DIV', 'attributes': []}}}

        # First call returns empty, second call succeeds
        web_element._connection_handler.execute_command.side_effect = [
            {'result': {'result': {}}},  # First attempt fails
            node_response,  # Second attempt succeeds
            describe_response,
        ]

        with patch('asyncio.sleep') as mock_sleep:
            element = await web_element.find(id='delayed', timeout=2)

        assert isinstance(element, WebElement)
        assert element._object_id == 'delayed-element'
        mock_sleep.assert_called()

    @pytest.mark.asyncio
    async def test_find_with_timeout_failure(self, web_element):
        """Test find with timeout raises WaitElementTimeout."""
        web_element._connection_handler.execute_command.return_value = {'result': {'result': {}}}

        # asyncio.sleep is patched alongside the clock so the retry loop does not
        # really wait between polls; only the mocked time values drive the timeout.
        with patch('asyncio.sleep'), patch('asyncio.get_event_loop') as mock_loop:
            mock_loop.return_value.time.side_effect = [
                0,
                0.5,
                1.0,
                1.5,
                2.1,
            ]  # Simulate time progression

            with pytest.raises(WaitElementTimeout):
                await web_element.find(id='never-appears', timeout=2)

    @pytest.mark.asyncio
    async def test_query_css_selector(self, web_element):
        """Test query method with CSS selector."""
        node_response = {'result': {'result': {'objectId': 'queried-element'}}}
        describe_response = {
            'result': {'node': {'nodeName': 'A', 'attributes': ['href', 'http://example.com']}}
        }

        web_element._connection_handler.execute_command.side_effect = [
            node_response,
            describe_response,
        ]

        element = await web_element.query('a[href*="example"]')

        assert isinstance(element, WebElement)
        assert element._object_id == 'queried-element'

    @pytest.mark.asyncio
    async def test_query_xpath(self, web_element):
        """Test query method with XPath expression."""
        node_response = {'result': {'result': {'objectId': 'xpath-element'}}}
        describe_response = {'result': {'node': {'nodeName': 'SPAN', 'attributes': []}}}

        web_element._connection_handler.execute_command.side_effect = [
            node_response,
            describe_response,
        ]

        element = await web_element.query('//span[text()="Click me"]')

        assert isinstance(element, WebElement)
        assert element._object_id == 'xpath-element'

    @pytest.mark.asyncio
    async def test_find_no_criteria_raises_error(self, web_element):
        """Test find with no search criteria raises ValueError."""
        # Awaited under pytest-asyncio like every other test here, instead of
        # spinning up a separate event loop with asyncio.run().
        with pytest.raises(
            ValueError, match='At least one of the following arguments must be provided'
        ):
            await web_element.find()


class TestWebElementEdgeCases:
    """Boundary inputs and failure scenarios for WebElement."""

    @pytest.mark.asyncio
    async def test_bounds_property_with_connection_error(self, web_element):
        """An exception raised by the connection surfaces when awaiting ``bounds``."""
        execute_command = web_element._connection_handler.execute_command
        execute_command.side_effect = Exception("Connection failed")

        with pytest.raises(Exception, match="Connection failed"):
            await web_element.bounds

    @pytest.mark.asyncio
    async def test_text_property_with_malformed_html(self, web_element):
        """``text`` still exposes the readable content of unclosed markup."""
        web_element._connection_handler.execute_command.return_value = {
            'result': {'outerHTML': '<div>Unclosed tag <span>content'}
        }

        # The HTML parser (BeautifulSoup) is expected to tolerate the unclosed tags
        extracted = await web_element.text

        for fragment in ('Unclosed tag', 'content'):
            assert fragment in extracted

    @pytest.mark.asyncio
    async def test_click_with_zero_hold_time(self, web_element):
        """click(hold_time=0) sleeps exactly once, with a duration of 0."""
        quad = [0, 0, 50, 0, 50, 50, 0, 50]
        # Replies are consumed in order: box model, mouse press, mouse release.
        web_element._connection_handler.execute_command.side_effect = [
            {'result': {'model': {'content': quad}}},
            None,
            None,
        ]
        web_element.scroll_into_view = AsyncMock()
        web_element.is_visible = AsyncMock(return_value=True)

        with patch('asyncio.sleep') as sleep_mock:
            await web_element.click(hold_time=0)

        sleep_mock.assert_called_once_with(0)

    @pytest.mark.asyncio
    async def test_type_text_empty_string(self, input_element):
        """type_text('') clicks the element once and sends no command."""
        click_mock = AsyncMock()
        input_element.click = click_mock

        await input_element.type_text('')

        # Nothing to type, so no command should have been sent
        input_element._connection_handler.execute_command.assert_not_called()
        assert click_mock.call_count == 1

    @pytest.mark.asyncio
    async def test_set_input_files_empty_list(self, file_input_element):
        """set_input_files([]) sends a single setFileInputFiles command with no files."""
        expected_command = DomCommands.set_file_input_files(
            files=[], object_id='file-input-object-id'
        )

        await file_input_element.set_input_files([])

        execute_command = file_input_element._connection_handler.execute_command
        execute_command.assert_called_once_with(expected_command, timeout=60)


class TestWebElementGetChildren:
    """Tests for WebElement.get_children_elements and get_siblings_elements.

    The browser-backed tests load ``pages/test_children.html`` (located next to
    this file) in a real Chrome instance. The two
    ``*_element_not_found_exception`` tests use a mocked connection handler
    instead and need no browser.
    """

    @staticmethod
    def _page_url():
        """Return the ``file://`` URL of the shared ``test_children.html`` page."""
        test_file = Path(__file__).parent / 'pages' / 'test_children.html'
        # Path.as_uri() yields a well-formed, percent-encoded file URL on every
        # platform; concatenating 'file://' with the raw path breaks on Windows
        # paths and on paths containing spaces or other reserved characters.
        return test_file.absolute().as_uri()

    @staticmethod
    def _collect_ids(elements):
        """Return the non-empty ``id`` attribute of each element, in order."""
        candidate_ids = (element.get_attribute('id') for element in elements)
        return [element_id for element_id in candidate_ids if element_id]

    @pytest.mark.asyncio
    async def test_get_children_elements_basic(self, ci_chrome_options):
        """Test get_children_elements with depth 3 returns direct and nested children."""
        async with Chrome(options=ci_chrome_options) as browser:
            tab = await browser.start()
            await tab.go_to(self._page_url())

            parent_element = await tab.find(id='parent-element')
            nodes = await parent_element.get_children_elements(3)

            assert len(nodes) > 0
            assert all(isinstance(node, WebElement) for node in nodes)

            child_ids = self._collect_ids(nodes)

            # Direct children of the parent must be present
            expected_direct_children = [
                'child1',
                'child2',
                'child3',
                'link1',
                'link2',
                'nested-parent',
            ]
            for expected_id in expected_direct_children:
                assert (
                    expected_id in child_ids
                ), f"Expected child {expected_id} not found in {child_ids}"

            # Nested children must be reachable as well at depth 3
            expected_nested_children = ['nested-child1', 'nested-child2', 'nested-link']
            for expected_id in expected_nested_children:
                assert (
                    expected_id in child_ids
                ), f"Expected nested child {expected_id} not found in {child_ids}"

    @pytest.mark.asyncio
    async def test_get_children_elements_with_tag_filter(self, ci_chrome_options):
        """Test get_children_elements with an 'a' tag filter returns only anchors."""
        async with Chrome(options=ci_chrome_options) as browser:
            tab = await browser.start()
            await tab.go_to(self._page_url())

            parent_element = await tab.find(id='parent-element')
            nodes_filter = await parent_element.get_children_elements(4, ['a'])

            assert len(nodes_filter) > 0
            assert all(isinstance(node, WebElement) for node in nodes_filter)

            # Every returned element must be an anchor tag
            for node in nodes_filter:
                tag_name = node.get_attribute('tag_name')
                assert tag_name.lower() == 'a', f"Expected 'a' tag, got '{tag_name}'"

            link_ids = self._collect_ids(nodes_filter)

            # Both direct and nested anchors are expected
            expected_links = ['link1', 'link2', 'nested-link']
            for expected_id in expected_links:
                assert (
                    expected_id in link_ids
                ), f"Expected link {expected_id} not found in {link_ids}"

    @pytest.mark.asyncio
    async def test_get_children_elements_depth_limit(self, ci_chrome_options):
        """Test get_children_elements with depth 1 excludes nested children."""
        async with Chrome(options=ci_chrome_options) as browser:
            tab = await browser.start()
            await tab.go_to(self._page_url())

            parent_element = await tab.find(id='parent-element')
            nodes_depth_1 = await parent_element.get_children_elements(1)

            depth_1_ids = self._collect_ids(nodes_depth_1)

            # Direct children must be present
            expected_direct = ['child1', 'child2', 'child3', 'link1', 'link2', 'nested-parent']
            for expected_id in expected_direct:
                assert expected_id in depth_1_ids, f"Expected direct child {expected_id} not found"

            # Nested children must NOT be returned at depth 1
            unexpected_nested = ['nested-child1', 'nested-child2', 'nested-link']
            for unexpected_id in unexpected_nested:
                assert (
                    unexpected_id not in depth_1_ids
                ), f"Unexpected nested child {unexpected_id} found with depth 1"

    @pytest.mark.asyncio
    async def test_get_children_elements_empty_result(self, ci_chrome_options):
        """Test get_children_elements on a leaf element returns an empty list."""
        async with Chrome(options=ci_chrome_options) as browser:
            tab = await browser.start()
            await tab.go_to(self._page_url())

            # 'child1' is used as a leaf element (no children)
            leaf_element = await tab.find(id='child1')
            nodes = await leaf_element.get_children_elements(2)

            assert isinstance(nodes, list)
            assert len(nodes) == 0

    @pytest.mark.asyncio
    async def test_get_children_elements_element_not_found_exception(self):
        """Test get_children_elements raises ElementNotFound when script fails."""
        mock_connection_handler = AsyncMock()

        # A script result without an objectId key simulates a failed script
        mock_connection_handler.execute_command.return_value = {'result': {'result': {}}}

        element = WebElement(
            object_id='test-element-id',
            connection_handler=mock_connection_handler,
            attributes_list=['id', 'test-element', 'tag_name', 'div'],
        )

        with pytest.raises(ElementNotFound):
            await element.get_children_elements(1, raise_exc=True)

    @pytest.mark.asyncio
    async def test_get_siblings_elements_basic(self, ci_chrome_options):
        """Test get_siblings_elements returns every sibling but not the element itself."""
        async with Chrome(options=ci_chrome_options) as browser:
            tab = await browser.start()
            await tab.go_to(self._page_url())

            child_element = await tab.find(id='child2')
            siblings = await child_element.get_siblings_elements()

            assert len(siblings) > 0
            assert all(isinstance(sibling, WebElement) for sibling in siblings)

            sibling_ids = self._collect_ids(siblings)

            # All siblings of child2 are expected
            expected_siblings = ['child1', 'child3', 'link1', 'link2', 'nested-parent']
            for expected_id in expected_siblings:
                assert (
                    expected_id in sibling_ids
                ), f"Expected sibling {expected_id} not found in {sibling_ids}"

            # The queried element must not be listed among its own siblings
            assert 'child2' not in sibling_ids, "Element should not include itself in siblings"

    @pytest.mark.asyncio
    async def test_get_siblings_elements_with_tag_filter(self, ci_chrome_options):
        """Test get_siblings_elements with an 'a' tag filter returns only anchor siblings."""
        async with Chrome(options=ci_chrome_options) as browser:
            tab = await browser.start()
            await tab.go_to(self._page_url())

            child_element = await tab.find(id='child1')
            siblings_filter = await child_element.get_siblings_elements(tag_filter=['a'])

            sibling_ids = self._collect_ids(siblings_filter)

            # Anchor siblings must be present
            expected_links = ['link1', 'link2']
            for expected_id in expected_links:
                assert (
                    expected_id in sibling_ids
                ), f"Expected link sibling {expected_id} not found in {sibling_ids}"

            # Non-anchor siblings must be filtered out
            unexpected_siblings = ['child2', 'child3', 'nested-parent']
            for unexpected_id in unexpected_siblings:
                assert (
                    unexpected_id not in sibling_ids
                ), f"Unexpected non-anchor sibling {unexpected_id} found with tag filter"

    @pytest.mark.asyncio
    async def test_get_siblings_elements_empty_result(self, ci_chrome_options):
        """Test get_siblings_elements on the top-level parent element.

        Despite the test name, the result is not expected to be empty: the
        assertion requires the 'another-parent' element to be reported as a
        sibling of 'parent-element'.
        """
        async with Chrome(options=ci_chrome_options) as browser:
            tab = await browser.start()
            await tab.go_to(self._page_url())

            parent_element = await tab.find(id='parent-element')
            siblings = await parent_element.get_siblings_elements()

            assert isinstance(siblings, list)

            sibling_ids = self._collect_ids(siblings)

            # The other parent element must be reported as a sibling
            assert 'another-parent' in sibling_ids

    @pytest.mark.asyncio
    async def test_get_siblings_elements_element_not_found_exception(self):
        """Test get_siblings_elements raises ElementNotFound when script fails."""
        mock_connection_handler = AsyncMock()

        # A script result without an objectId key simulates a failed script
        mock_connection_handler.execute_command.return_value = {'result': {'result': {}}}

        element = WebElement(
            object_id='test-element-id',
            connection_handler=mock_connection_handler,
            attributes_list=['id', 'test-element', 'tag_name', 'div'],
        )

        with pytest.raises(ElementNotFound):
            await element.get_siblings_elements(raise_exc=True)


"""
Tests for WebElement iframe edge cases and uncovered code paths.

This test suite focuses on covering edge cases in iframe resolution and context handling,
including:
- inner_html edge cases for iframes and iframe context elements
- Frame tree traversal and owner resolution
- OOPIF resolution scenarios
- Isolated world creation failures
- Document object resolution failures
"""

import pytest
import pytest_asyncio
from unittest.mock import AsyncMock, patch

from pydoll.elements.web_element import WebElement
from pydoll.interactions.iframe import IFrameContext
from pydoll.connection import ConnectionHandler
from pydoll.exceptions import InvalidIFrame


@pytest_asyncio.fixture
async def mock_connection_handler():
    """Yield the instance of a patched ConnectionHandler with an awaitable execute_command."""
    patcher = patch('pydoll.connection.ConnectionHandler', autospec=True)
    with patcher as handler_cls:
        mocked_handler = handler_cls.return_value
        mocked_handler._connection_port = 9222
        mocked_handler.execute_command = AsyncMock()
        yield mocked_handler


@pytest.fixture
def iframe_element(mock_connection_handler):
    """Build a WebElement describing an ``<iframe id="test-iframe">`` on the mocked connection."""
    element_kwargs = {
        'object_id': 'iframe-object-id',
        'connection_handler': mock_connection_handler,
        'method': 'css',
        'selector': 'iframe#test-iframe',
        'attributes_list': ['id', 'test-iframe', 'tag_name', 'iframe'],
    }
    return WebElement(**element_kwargs)


@pytest.fixture
def element_in_iframe(mock_connection_handler):
    """Build a button WebElement whose ``_iframe_context`` is already populated."""
    frame_context = IFrameContext(
        frame_id='frame-123',
        document_url='https://example.com/iframe.html',
        execution_context_id=42,
        document_object_id='doc-obj-id',
    )
    button = WebElement(
        object_id='button-object-id',
        connection_handler=mock_connection_handler,
        method='css',
        selector='button',
        attributes_list=['id', 'button-in-iframe', 'tag_name', 'button'],
    )
    # Attaching the context makes the element look like it lives inside an iframe
    button._iframe_context = frame_context
    return button


class TestInnerHtmlEdgeCases:
    """Test inner_html property edge cases for iframe scenarios."""

    @pytest.mark.asyncio
    async def test_inner_html_iframe_element_with_context(self, iframe_element):
        """inner_html on an iframe element is read via Runtime.evaluate in the frame context."""

        def describe_node_reply():
            # Simulates a same-origin iframe whose frameId is already resolved;
            # backendNodeId is not needed here because we do not want to
            # trigger OOPIF resolution.
            content_document = {
                'frameId': 'iframe-123',
                'documentURL': 'https://example.com/frame.html',
            }
            node = {'frameId': 'parent-frame', 'contentDocument': content_document}
            return {'result': {'node': node}}

        def evaluate_reply(expression):
            # Returns None for any expression this test does not anticipate
            if expression == 'document.documentElement':
                remote_object = {'type': 'object', 'objectId': 'doc-element-id'}
            elif expression == 'document.documentElement.outerHTML':
                remote_object = {
                    'type': 'string',
                    'value': '<html><body>Iframe content</body></html>',
                }
            else:
                return None
            return {'result': {'result': remote_object}}

        async def fake_execute(command, timeout=60):
            method = command['method']
            reply = None
            if method == 'DOM.describeNode':
                reply = describe_node_reply()
            elif method == 'Page.createIsolatedWorld':
                reply = {'result': {'executionContextId': 77}}
            elif method == 'Runtime.evaluate':
                reply = evaluate_reply(command['params']['expression'])
            if reply is None:
                raise AssertionError(f'Unexpected method {method}')
            return reply

        execute_command = iframe_element._connection_handler.execute_command
        execute_command.side_effect = fake_execute

        html = await iframe_element.inner_html

        # The iframe's own document HTML is what must come back
        assert html == '<html><body>Iframe content</body></html>'

        # Two evaluations are expected: document.documentElement, then its outerHTML
        evaluate_params = [
            sent.args[0]['params']
            for sent in execute_command.await_args_list
            if sent.args[0]['method'] == 'Runtime.evaluate'
        ]
        assert len(evaluate_params) == 2
        outer_html_params = evaluate_params[1]
        assert outer_html_params['expression'] == 'document.documentElement.outerHTML'
        # 77 is the executionContextId handed out for Page.createIsolatedWorld above
        assert outer_html_params['contextId'] == 77

    @pytest.mark.asyncio
    async def test_inner_html_element_in_iframe_uses_call_function_on(self, element_in_iframe):
        """inner_html on an element with an iframe context goes through Runtime.callFunctionOn."""
        button_html = '<button id="button-in-iframe">Click me</button>'
        execute_command = element_in_iframe._connection_handler.execute_command
        execute_command.return_value = {
            'result': {'result': {'type': 'string', 'value': button_html}}
        }

        html = await element_in_iframe.inner_html

        assert html == button_html

        # Exactly one command: callFunctionOn against the element, reading this.outerHTML
        execute_command.assert_called_once()
        sent_command = execute_command.call_args[0][0]
        assert sent_command['method'] == 'Runtime.callFunctionOn'
        sent_params = sent_command['params']
        assert sent_params['objectId'] == 'button-object-id'
        assert 'this.outerHTML' in sent_params['functionDeclaration']

    @pytest.mark.asyncio
    async def test_inner_html_element_in_iframe_empty_response(self, element_in_iframe):
        """inner_html on an element with an iframe context is '' when the reply has no result."""
        empty_reply = {'result': {}}
        element_in_iframe._connection_handler.execute_command.return_value = empty_reply

        html = await element_in_iframe.inner_html

        # A missing inner result must degrade to an empty string
        assert html == ''

    @pytest.mark.asyncio
    async def test_inner_html_regular_element_fallback(self, mock_connection_handler):
        """Test inner_html falls back to DOM.getOuterHTML for regular elements.

        "Regular" here means a non-iframe element (tag_name 'div') that is built
        without any iframe context being assigned to it.
        """
        attributes_list = ['id', 'regular-div', 'tag_name', 'div']
        element = WebElement(
            object_id='div-object-id',
            connection_handler=mock_connection_handler,
            attributes_list=attributes_list,
        )
        # Reply shaped like a DOM.getOuterHTML result (HTML under result.outerHTML)
        mock_connection_handler.execute_command.return_value = {
            'result': {'outerHTML': '<div id="regular-div">Content</div>'}
        }

        html = await element.inner_html

        # Should use DOM.getOuterHTML for regular elements
        assert html == '<div id="regular-div">Content</div>'
        # call_args holds the most recent call; its first positional argument is the command
        call_args = mock_connection_handler.execute_command.call_args[0][0]
        assert call_args['method'] == 'DOM.getOuterHTML'